RE: [PATCH] net :mana : Add per-cpu stats for MANA device
From: Haiyang Zhang
Date: Thu Mar 07 2024 - 11:18:17 EST
> -----Original Message-----
> From: Shradha Gupta <shradhagupta@xxxxxxxxxxxxxxxxxxx>
> Sent: Thursday, March 7, 2024 9:52 AM
> To: linux-kernel@xxxxxxxxxxxxxxx; linux-hyperv@xxxxxxxxxxxxxxx; linux-
> rdma@xxxxxxxxxxxxxxx; netdev@xxxxxxxxxxxxxxx
> Cc: Shradha Gupta <shradhagupta@xxxxxxxxxxxxxxxxxxx>; Eric Dumazet
> <edumazet@xxxxxxxxxx>; Jakub Kicinski <kuba@xxxxxxxxxx>; Paolo Abeni
> <pabeni@xxxxxxxxxx>; Ajay Sharma <sharmaajay@xxxxxxxxxxxxx>; Leon
> Romanovsky <leon@xxxxxxxxxx>; Thomas Gleixner <tglx@xxxxxxxxxxxxx>;
> Sebastian Andrzej Siewior <bigeasy@xxxxxxxxxxxxx>; KY Srinivasan
> <kys@xxxxxxxxxxxxx>; Haiyang Zhang <haiyangz@xxxxxxxxxxxxx>; Wei Liu
> <wei.liu@xxxxxxxxxx>; Dexuan Cui <decui@xxxxxxxxxxxxx>; Long Li
> <longli@xxxxxxxxxxxxx>; Michael Kelley <mikelley@xxxxxxxxxxxxx>; Shradha
> Gupta <shradhagupta@xxxxxxxxxxxxx>
> Subject: [PATCH] net :mana : Add per-cpu stats for MANA device
>
> Extend 'ethtool -S' output for mana devices to include per-CPU packet
> stats
>
> Built-on: Ubuntu22
> Tested-on: Ubuntu22
> Signed-off-by: Shradha Gupta <shradhagupta@xxxxxxxxxxxxxxxxxxx>
> ---
> drivers/net/ethernet/microsoft/mana/mana_en.c | 22 ++++++++++
> .../ethernet/microsoft/mana/mana_ethtool.c | 40 ++++++++++++++++++-
> include/net/mana/mana.h | 12 ++++++
> 3 files changed, 72 insertions(+), 2 deletions(-)
>
> diff --git a/drivers/net/ethernet/microsoft/mana/mana_en.c
> b/drivers/net/ethernet/microsoft/mana/mana_en.c
> index 59287c6e6cee..b27ee6684936 100644
> --- a/drivers/net/ethernet/microsoft/mana/mana_en.c
> +++ b/drivers/net/ethernet/microsoft/mana/mana_en.c
> @@ -224,6 +224,7 @@ netdev_tx_t mana_start_xmit(struct sk_buff *skb,
> struct net_device *ndev)
> int gso_hs = 0; /* zero for non-GSO pkts */
> u16 txq_idx = skb_get_queue_mapping(skb);
> struct gdma_dev *gd = apc->ac->gdma_dev;
> + struct mana_pcpu_stats *pcpu_stats;
> bool ipv4 = false, ipv6 = false;
> struct mana_tx_package pkg = {};
> struct netdev_queue *net_txq;
> @@ -234,6 +235,8 @@ netdev_tx_t mana_start_xmit(struct sk_buff *skb,
> struct net_device *ndev)
> struct mana_cq *cq;
> int err, len;
>
> + pcpu_stats = this_cpu_ptr(apc->pcpu_stats);
> +
> if (unlikely(!apc->port_is_up))
> goto tx_drop;
>
> @@ -412,6 +415,12 @@ netdev_tx_t mana_start_xmit(struct sk_buff *skb,
> struct net_device *ndev)
> tx_stats->bytes += len;
> u64_stats_update_end(&tx_stats->syncp);
>
> + /* Also update the per-CPU stats */
> + u64_stats_update_begin(&pcpu_stats->syncp);
> + pcpu_stats->tx_packets++;
> + pcpu_stats->tx_bytes += len;
> + u64_stats_update_end(&pcpu_stats->syncp);
> +
> tx_busy:
> if (netif_tx_queue_stopped(net_txq) && mana_can_tx(gdma_sq)) {
> netif_tx_wake_queue(net_txq);
> @@ -425,6 +434,9 @@ netdev_tx_t mana_start_xmit(struct sk_buff *skb,
> struct net_device *ndev)
> kfree(pkg.sgl_ptr);
> tx_drop_count:
> ndev->stats.tx_dropped++;
> + u64_stats_update_begin(&pcpu_stats->syncp);
> + pcpu_stats->tx_dropped++;
> + u64_stats_update_end(&pcpu_stats->syncp);
> tx_drop:
> dev_kfree_skb_any(skb);
> return NETDEV_TX_OK;
> @@ -1505,6 +1517,8 @@ static void mana_rx_skb(void *buf_va, bool
> from_pool,
> struct mana_stats_rx *rx_stats = &rxq->stats;
> struct net_device *ndev = rxq->ndev;
> uint pkt_len = cqe->ppi[0].pkt_len;
> + struct mana_pcpu_stats *pcpu_stats;
> + struct mana_port_context *apc;
> u16 rxq_idx = rxq->rxq_idx;
> struct napi_struct *napi;
> struct xdp_buff xdp = {};
> @@ -1512,6 +1526,9 @@ static void mana_rx_skb(void *buf_va, bool
> from_pool,
> u32 hash_value;
> u32 act;
>
> + apc = netdev_priv(ndev);
> + pcpu_stats = this_cpu_ptr(apc->pcpu_stats);
> +
> rxq->rx_cq.work_done++;
> napi = &rxq->rx_cq.napi;
>
> @@ -1570,6 +1587,11 @@ static void mana_rx_skb(void *buf_va, bool
> from_pool,
> rx_stats->xdp_tx++;
> u64_stats_update_end(&rx_stats->syncp);
>
> + u64_stats_update_begin(&pcpu_stats->syncp);
> + pcpu_stats->rx_packets++;
> + pcpu_stats->rx_bytes += pkt_len;
> + u64_stats_update_end(&pcpu_stats->syncp);
> +
> if (act == XDP_TX) {
> skb_set_queue_mapping(skb, rxq_idx);
> mana_xdp_tx(skb, ndev);
> diff --git a/drivers/net/ethernet/microsoft/mana/mana_ethtool.c
> b/drivers/net/ethernet/microsoft/mana/mana_ethtool.c
> index ab2413d71f6c..e3aa47ead601 100644
> --- a/drivers/net/ethernet/microsoft/mana/mana_ethtool.c
> +++ b/drivers/net/ethernet/microsoft/mana/mana_ethtool.c
> @@ -83,8 +83,9 @@ static int mana_get_sset_count(struct net_device *ndev,
> int stringset)
> if (stringset != ETH_SS_STATS)
> return -EINVAL;
>
> - return ARRAY_SIZE(mana_eth_stats) + num_queues *
> - (MANA_STATS_RX_COUNT + MANA_STATS_TX_COUNT);
> + return ARRAY_SIZE(mana_eth_stats) +
> + (num_queues * (MANA_STATS_RX_COUNT + MANA_STATS_TX_COUNT)) +
> + (num_present_cpus() * (MANA_STATS_RX_PCPU +
> MANA_STATS_TX_PCPU));
> }
>
> static void mana_get_strings(struct net_device *ndev, u32 stringset, u8
> *data)
> @@ -139,6 +140,19 @@ static void mana_get_strings(struct net_device
> *ndev, u32 stringset, u8 *data)
> sprintf(p, "tx_%d_mana_map_err", i);
> p += ETH_GSTRING_LEN;
> }
> +
> + for (i = 0; i < num_present_cpus(); i++) {
> + sprintf(p, "cpu%d_rx_packets", i);
> + p += ETH_GSTRING_LEN;
> + sprintf(p, "cpu%d_rx_bytes", i);
> + p += ETH_GSTRING_LEN;
> + sprintf(p, "cpu%d_tx_packets", i);
> + p += ETH_GSTRING_LEN;
> + sprintf(p, "cpu%d_tx_bytes", i);
> + p += ETH_GSTRING_LEN;
> + sprintf(p, "cpu%d_tx_dropped", i);
> + p += ETH_GSTRING_LEN;
> + }
> }
>
> static void mana_get_ethtool_stats(struct net_device *ndev,
> @@ -222,6 +236,28 @@ static void mana_get_ethtool_stats(struct net_device
> *ndev,
> data[i++] = csum_partial;
> data[i++] = mana_map_err;
> }
> +
> + for_each_possible_cpu(q) {
> + const struct mana_pcpu_stats *pcpu_stats =
> + per_cpu_ptr(apc->pcpu_stats, q);
> + u64 rx_packets, rx_bytes, tx_packets, tx_bytes, tx_dropped;
> + unsigned int start;
> +
> + do {
> + start = u64_stats_fetch_begin(&pcpu_stats->syncp);
> + rx_packets = pcpu_stats->rx_packets;
> + tx_packets = pcpu_stats->tx_packets;
> + rx_bytes = pcpu_stats->rx_bytes;
> + tx_bytes = pcpu_stats->tx_bytes;
> + tx_dropped = pcpu_stats->tx_dropped;
> + } while (u64_stats_fetch_retry(&pcpu_stats->syncp, start));
> +
> + data[i++] = rx_packets;
> + data[i++] = rx_bytes;
> + data[i++] = tx_packets;
> + data[i++] = tx_bytes;
> + data[i++] = tx_dropped;
> + }
> }
>
> static int mana_get_rxnfc(struct net_device *ndev, struct ethtool_rxnfc
> *cmd,
> diff --git a/include/net/mana/mana.h b/include/net/mana/mana.h
> index 76147feb0d10..9a2414ee7f02 100644
> --- a/include/net/mana/mana.h
> +++ b/include/net/mana/mana.h
> @@ -51,6 +51,8 @@ enum TRI_STATE {
> /* Update this count whenever the respective structures are changed */
> #define MANA_STATS_RX_COUNT 5
> #define MANA_STATS_TX_COUNT 11
> +#define MANA_STATS_RX_PCPU 2
> +#define MANA_STATS_TX_PCPU 3
>
> struct mana_stats_rx {
> u64 packets;
> @@ -386,6 +388,15 @@ struct mana_ethtool_stats {
> u64 rx_cqe_unknown_type;
> };
>
> +struct mana_pcpu_stats {
> + u64 rx_packets;
> + u64 rx_bytes;
> + u64 tx_packets;
> + u64 tx_bytes;
> + u64 tx_dropped;
> + struct u64_stats_sync syncp;
> +};
> +
> struct mana_context {
> struct gdma_dev *gdma_dev;
>
> @@ -449,6 +460,7 @@ struct mana_port_context {
> bool port_st_save; /* Saved port state */
>
> struct mana_ethtool_stats eth_stats;
> + struct mana_pcpu_stats __percpu *pcpu_stats;
Where is pcpu_stats allocated?
I don't see any allocation for it in the patch.
Thanks,
- Haiyang