[PATCH net-next v10 3/5] hinic3: Add ethtool coalesce ops
From: Fan Gong <gongfan1@huawei.com>
Date: 2026-06-29 07:38:09
Also in:
linux-doc, lkml
Subsystem:
huawei 3rd gen ethernet driver, networking drivers, the rest · Maintainers:
Fan Gong, Andrew Lunn, "David S. Miller", Eric Dumazet, Jakub Kicinski, Paolo Abeni, Linus Torvalds
Implement following ethtool callback function: .get_coalesce .set_coalesce These callbacks allow users to utilize ethtool for detailed RX coalesce configuration and monitoring. Co-developed-by: Wu Di <redacted> Signed-off-by: Wu Di <redacted> Co-developed-by: Teng Peisen <redacted> Signed-off-by: Teng Peisen <redacted> Signed-off-by: Fan Gong <gongfan1@huawei.com> --- .../ethernet/huawei/hinic3/hinic3_ethtool.c | 286 +++++++++++++++++- .../net/ethernet/huawei/hinic3/hinic3_irq.c | 15 +- 2 files changed, 296 insertions(+), 5 deletions(-)
diff --git a/drivers/net/ethernet/huawei/hinic3/hinic3_ethtool.c b/drivers/net/ethernet/huawei/hinic3/hinic3_ethtool.c
index 0e1f83806933..c329f1c62f0e 100644
--- a/drivers/net/ethernet/huawei/hinic3/hinic3_ethtool.c
+++ b/drivers/net/ethernet/huawei/hinic3/hinic3_ethtool.c@@ -18,6 +18,11 @@ #include "hinic3_nic_cfg.h" #define HINIC3_MGMT_VERSION_MAX_LEN 32 +/* Coalesce time properties in microseconds */ +#define COALESCE_PENDING_LIMIT_UNIT 8 +#define COALESCE_TIMER_CFG_UNIT 5 +#define COALESCE_MAX_PENDING_LIMIT (255 * COALESCE_PENDING_LIMIT_UNIT) +#define COALESCE_MAX_TIMER_CFG (255 * COALESCE_TIMER_CFG_UNIT) static void hinic3_get_drvinfo(struct net_device *netdev, struct ethtool_drvinfo *info)
@@ -973,9 +978,284 @@ static void hinic3_get_pause_stats(struct net_device *netdev, kfree(ps); } +static int hinic3_set_queue_coalesce(struct net_device *netdev, u16 q_id, + struct hinic3_intr_coal_info *coal, + struct netlink_ext_ack *extack) +{ + struct hinic3_nic_dev *nic_dev = netdev_priv(netdev); + struct hinic3_intr_coal_info *intr_coal; + struct hinic3_intr_coal_info old_coal; + struct hinic3_interrupt_info info = {}; + int err; + + mutex_lock(&nic_dev->state_lock); + intr_coal = &nic_dev->intr_coalesce[q_id]; + old_coal = *intr_coal; + + intr_coal->coalesce_timer_cfg = coal->coalesce_timer_cfg; + intr_coal->pending_limit = coal->pending_limit; + intr_coal->rx_pending_limit_low = coal->rx_pending_limit_low; + intr_coal->rx_pending_limit_high = coal->rx_pending_limit_high; + + info.resend_timer_cfg = intr_coal->resend_timer_cfg; + mutex_unlock(&nic_dev->state_lock); + + if (!test_bit(HINIC3_INTF_UP, &nic_dev->flags) || + q_id >= nic_dev->q_params.num_qps) + return 0; + + info.msix_index = nic_dev->q_params.irq_cfg[q_id].msix_entry_idx; + info.interrupt_coalesc_set = 1; + + info.coalesc_timer_cfg = coal->coalesce_timer_cfg; + info.pending_limit = coal->pending_limit; + + mutex_lock(&nic_dev->state_lock); + err = hinic3_set_interrupt_cfg(nic_dev->hwdev, info); + mutex_unlock(&nic_dev->state_lock); + + if (err) { + NL_SET_ERR_MSG_FMT_MOD(extack, "Failed to set queue%u coalesce", + q_id); + mutex_lock(&nic_dev->state_lock); + *intr_coal = old_coal; + mutex_unlock(&nic_dev->state_lock); + return err; + } + + return 0; +} + +static int is_coalesce_exceed_limit(const struct ethtool_coalesce *coal, + struct netlink_ext_ack *extack) +{ + const struct { + const char *name; + u32 value; + u32 limit; + } coalesce_limits[] = { + {"rx_coalesce_usecs", + coal->rx_coalesce_usecs, + COALESCE_MAX_TIMER_CFG}, + {"rx_max_coalesced_frames", + coal->rx_max_coalesced_frames, + COALESCE_MAX_PENDING_LIMIT}, + {"rx_max_coalesced_frames_low", + coal->rx_max_coalesced_frames_low, + COALESCE_MAX_PENDING_LIMIT}, + {"rx_max_coalesced_frames_high", + coal->rx_max_coalesced_frames_high, + COALESCE_MAX_PENDING_LIMIT}, + }; + + for (int i = 0; i < ARRAY_SIZE(coalesce_limits); i++) { + if (coalesce_limits[i].value > coalesce_limits[i].limit) { + NL_SET_ERR_MSG_FMT_MOD(extack, + "%s out of range %d-%d", + coalesce_limits[i].name, + 0, + coalesce_limits[i].limit); + return -ERANGE; + } + } + return 0; +} + +static int is_coalesce_legal(const struct ethtool_coalesce *coal, + struct netlink_ext_ack *extack) +{ + int err; + + err = is_coalesce_exceed_limit(coal, extack); + if (err) + return err; + + if (coal->rx_max_coalesced_frames_low > + coal->rx_max_coalesced_frames_high) { + NL_SET_ERR_MSG_FMT_MOD(extack, + "invalid coalesce frame high %u, low %u", + coal->rx_max_coalesced_frames_high, + coal->rx_max_coalesced_frames_low); + return -ERANGE; + } + + return 0; +} + +static void check_coalesce_align(struct net_device *netdev, + u32 item, u32 unit, const char *str) +{ + if (item % unit) + netdev_warn(netdev, "%s in %d units, change to %u\n", + str, unit, item - item % unit); +} + +#define CHECK_COALESCE_ALIGN(member, unit) \ + check_coalesce_align(netdev, member, unit, #member) + +static void check_coalesce_changed(struct net_device *netdev, + u32 item, u32 unit, u32 ori_val, + const char *obj_str, const char *str) +{ + if ((item / unit) != ori_val) + netdev_dbg(netdev, "Change %s from %d to %u %s\n", + str, ori_val * unit, item - item % unit, obj_str); +} + +#define CHECK_COALESCE_CHANGED(member, unit, ori_val, obj_str) \ + check_coalesce_changed(netdev, member, unit, ori_val, obj_str, #member) + +static int hinic3_set_hw_coal_param(struct net_device *netdev, + struct hinic3_intr_coal_info *intr_coal, + struct netlink_ext_ack *extack) +{ + struct hinic3_nic_dev *nic_dev = netdev_priv(netdev); + int err; + u16 i; + + for (i = 0; i < nic_dev->max_qps; i++) { + err = hinic3_set_queue_coalesce(netdev, i, intr_coal, extack); + if (err) + return err; + } + + return 0; +} + +static int hinic3_get_coalesce(struct net_device *netdev, + struct ethtool_coalesce *coal, + struct kernel_ethtool_coalesce *kernel_coal, + struct netlink_ext_ack *extack) +{ + struct hinic3_nic_dev *nic_dev = netdev_priv(netdev); + struct hinic3_intr_coal_info *interrupt_info; + + interrupt_info = &nic_dev->intr_coalesce[0]; + + coal->use_adaptive_rx_coalesce = nic_dev->adaptive_rx_coal; + + mutex_lock(&nic_dev->state_lock); + + coal->rx_max_coalesced_frames_low = + interrupt_info->rx_pending_limit_low * + COALESCE_PENDING_LIMIT_UNIT; + + coal->rx_max_coalesced_frames_high = + interrupt_info->rx_pending_limit_high * + COALESCE_PENDING_LIMIT_UNIT; + + /* TX/RX uses the same interrupt. + * So we only declare RX ethtool_coalesce parameters. + */ + coal->rx_coalesce_usecs = interrupt_info->coalesce_timer_cfg * + COALESCE_TIMER_CFG_UNIT; + + coal->rx_max_coalesced_frames = interrupt_info->pending_limit * + COALESCE_PENDING_LIMIT_UNIT; + + mutex_unlock(&nic_dev->state_lock); + + return 0; +} + +static int hinic3_set_coalesce(struct net_device *netdev, + struct ethtool_coalesce *coal, + struct kernel_ethtool_coalesce *kernel_coal, + struct netlink_ext_ack *extack) +{ + struct hinic3_nic_dev *nic_dev = netdev_priv(netdev); + struct hinic3_intr_coal_info *ori_intr_coal; + struct hinic3_intr_coal_info intr_coal = {}; + const char *obj_str = "for netdev"; + bool old_adaptive, new_adaptive; + bool dim_stopped = false; + int err; + int i; + + err = is_coalesce_legal(coal, extack); + if (err) + return err; + + CHECK_COALESCE_ALIGN(coal->rx_coalesce_usecs, COALESCE_TIMER_CFG_UNIT); + CHECK_COALESCE_ALIGN(coal->rx_max_coalesced_frames, + COALESCE_PENDING_LIMIT_UNIT); + CHECK_COALESCE_ALIGN(coal->rx_max_coalesced_frames_high, + COALESCE_PENDING_LIMIT_UNIT); + CHECK_COALESCE_ALIGN(coal->rx_max_coalesced_frames_low, + COALESCE_PENDING_LIMIT_UNIT); + + ori_intr_coal = &nic_dev->intr_coalesce[0]; + + CHECK_COALESCE_CHANGED(coal->rx_coalesce_usecs, COALESCE_TIMER_CFG_UNIT, + ori_intr_coal->coalesce_timer_cfg, obj_str); + CHECK_COALESCE_CHANGED(coal->rx_max_coalesced_frames, + COALESCE_PENDING_LIMIT_UNIT, + ori_intr_coal->pending_limit, obj_str); + CHECK_COALESCE_CHANGED(coal->rx_max_coalesced_frames_high, + COALESCE_PENDING_LIMIT_UNIT, + ori_intr_coal->rx_pending_limit_high, obj_str); + CHECK_COALESCE_CHANGED(coal->rx_max_coalesced_frames_low, + COALESCE_PENDING_LIMIT_UNIT, + ori_intr_coal->rx_pending_limit_low, obj_str); + + old_adaptive = READ_ONCE(nic_dev->adaptive_rx_coal); + new_adaptive = !!coal->use_adaptive_rx_coalesce; + + if (old_adaptive) { + WRITE_ONCE(nic_dev->adaptive_rx_coal, false); + + synchronize_net(); + + for (i = 0; i < nic_dev->q_params.num_qps; i++) { + if (!nic_dev->q_params.irq_cfg[i].rxq) + continue; + + cancel_work_sync(&nic_dev->q_params.irq_cfg[i].rxq + ->dim.work); + } + + dim_stopped = true; + } + + intr_coal.coalesce_timer_cfg = + (u8)(coal->rx_coalesce_usecs / COALESCE_TIMER_CFG_UNIT); + + intr_coal.pending_limit = + (u8)(coal->rx_max_coalesced_frames / + COALESCE_PENDING_LIMIT_UNIT); + + intr_coal.rx_pending_limit_high = + (u8)(coal->rx_max_coalesced_frames_high / + COALESCE_PENDING_LIMIT_UNIT); + + intr_coal.rx_pending_limit_low = + (u8)(coal->rx_max_coalesced_frames_low / + COALESCE_PENDING_LIMIT_UNIT); + + /* coalesce timer or pending set to zero will disable coalesce */ + if (!new_adaptive && + (!intr_coal.coalesce_timer_cfg || !intr_coal.pending_limit)) + netdev_info(netdev, "Coalesce will be disabled\n"); + + err = hinic3_set_hw_coal_param(netdev, &intr_coal, extack); + if (err) { + if (dim_stopped) + WRITE_ONCE(nic_dev->adaptive_rx_coal, old_adaptive); + + return err; + } + + WRITE_ONCE(nic_dev->adaptive_rx_coal, new_adaptive); + + return 0; +} + static const struct ethtool_ops hinic3_ethtool_ops = { - .supported_coalesce_params = ETHTOOL_COALESCE_USECS | - ETHTOOL_COALESCE_PKT_RATE_RX_USECS, + .supported_coalesce_params = ETHTOOL_COALESCE_RX_USECS | + ETHTOOL_COALESCE_RX_MAX_FRAMES | + ETHTOOL_COALESCE_USE_ADAPTIVE_RX | + ETHTOOL_COALESCE_RX_MAX_FRAMES_LOW | + ETHTOOL_COALESCE_RX_MAX_FRAMES_HIGH, .get_link_ksettings = hinic3_get_link_ksettings, .get_drvinfo = hinic3_get_drvinfo, .get_msglevel = hinic3_get_msglevel,
@@ -991,6 +1271,8 @@ static const struct ethtool_ops hinic3_ethtool_ops = { .get_eth_ctrl_stats = hinic3_get_eth_ctrl_stats, .get_rmon_stats = hinic3_get_rmon_stats, .get_pause_stats = hinic3_get_pause_stats, + .get_coalesce = hinic3_get_coalesce, + .set_coalesce = hinic3_set_coalesce, }; void hinic3_set_ethtool_ops(struct net_device *netdev)
diff --git a/drivers/net/ethernet/huawei/hinic3/hinic3_irq.c b/drivers/net/ethernet/huawei/hinic3/hinic3_irq.c
index 5479c235e3de..4e3b8e3c31f9 100644
--- a/drivers/net/ethernet/huawei/hinic3/hinic3_irq.c
+++ b/drivers/net/ethernet/huawei/hinic3/hinic3_irq.c@@ -101,10 +101,14 @@ static int hinic3_request_irq(struct hinic3_irq_cfg *irq_cfg, u16 q_id) info.msix_index = irq_cfg->msix_entry_idx; info.interrupt_coalesc_set = 1; + + mutex_lock(&nic_dev->state_lock); info.pending_limit = nic_dev->intr_coalesce[q_id].pending_limit; info.coalesc_timer_cfg = nic_dev->intr_coalesce[q_id].coalesce_timer_cfg; info.resend_timer_cfg = nic_dev->intr_coalesce[q_id].resend_timer_cfg; + mutex_unlock(&nic_dev->state_lock); + err = hinic3_set_interrupt_cfg(nic_dev->hwdev, info); if (err) { netdev_err(netdev, "Failed to set RX interrupt coalescing attribute.\n");
@@ -169,17 +173,22 @@ static int hinic3_set_interrupt_moder(struct net_device *netdev, u16 q_id, static void hinic3_update_queue_coal(struct net_device *netdev, u16 q_id, u16 coal_timer, u16 coal_pkts) { + u8 coalesc_timer_cfg, pending_limit, limit_low, limit_high; struct hinic3_intr_coal_info *q_coal; - u8 coalesc_timer_cfg, pending_limit; struct hinic3_nic_dev *nic_dev; nic_dev = netdev_priv(netdev); q_coal = &nic_dev->intr_coalesce[q_id]; coalesc_timer_cfg = (u8)coal_timer; + + mutex_lock(&nic_dev->state_lock); + limit_low = q_coal->rx_pending_limit_low; + limit_high = q_coal->rx_pending_limit_high; + mutex_unlock(&nic_dev->state_lock); + pending_limit = clamp_t(u8, coal_pkts >> HINIC3_COAL_PKT_SHIFT, - q_coal->rx_pending_limit_low, - q_coal->rx_pending_limit_high); + limit_low, limit_high); hinic3_set_interrupt_moder(nic_dev->netdev, q_id, coalesc_timer_cfg, pending_limit);
--
2.43.0