1 // SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
2 /* Copyright (c) 2019 Mellanox Technologies. */
3
4 #include "setup.h"
5 #include "en/params.h"
6 #include "en/txrx.h"
7 #include "en/health.h"
8
9 /* It matches XDP_UMEM_MIN_CHUNK_SIZE, but as this constant is private and may
10 * change unexpectedly, and mlx5e has a minimum valid stride size for striding
11 * RQ, keep this check in the driver.
12 */
13 #define MLX5E_MIN_XSK_CHUNK_SIZE 2048
14
mlx5e_validate_xsk_param(struct mlx5e_params * params,struct mlx5e_xsk_param * xsk,struct mlx5_core_dev * mdev)15 bool mlx5e_validate_xsk_param(struct mlx5e_params *params,
16 struct mlx5e_xsk_param *xsk,
17 struct mlx5_core_dev *mdev)
18 {
19 /* AF_XDP doesn't support frames larger than PAGE_SIZE. */
20 if (xsk->chunk_size > PAGE_SIZE ||
21 xsk->chunk_size < MLX5E_MIN_XSK_CHUNK_SIZE)
22 return false;
23
24 /* Current MTU and XSK headroom don't allow packets to fit the frames. */
25 if (mlx5e_rx_get_min_frag_sz(params, xsk) > xsk->chunk_size)
26 return false;
27
28 /* frag_sz is different for regular and XSK RQs, so ensure that linear
29 * SKB mode is possible.
30 */
31 switch (params->rq_wq_type) {
32 case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
33 return mlx5e_rx_mpwqe_is_linear_skb(mdev, params, xsk);
34 default: /* MLX5_WQ_TYPE_CYCLIC */
35 return mlx5e_rx_is_linear_skb(params, xsk);
36 }
37 }
38
mlx5e_build_xsk_cparam(struct mlx5_core_dev * mdev,struct mlx5e_params * params,struct mlx5e_xsk_param * xsk,u16 q_counter,struct mlx5e_channel_param * cparam)39 static void mlx5e_build_xsk_cparam(struct mlx5_core_dev *mdev,
40 struct mlx5e_params *params,
41 struct mlx5e_xsk_param *xsk,
42 u16 q_counter,
43 struct mlx5e_channel_param *cparam)
44 {
45 mlx5e_build_rq_param(mdev, params, xsk, q_counter, &cparam->rq);
46 mlx5e_build_xdpsq_param(mdev, params, &cparam->xdp_sq);
47 }
48
mlx5e_init_xsk_rq(struct mlx5e_channel * c,struct mlx5e_params * params,struct xsk_buff_pool * pool,struct mlx5e_xsk_param * xsk,struct mlx5e_rq * rq)49 static int mlx5e_init_xsk_rq(struct mlx5e_channel *c,
50 struct mlx5e_params *params,
51 struct xsk_buff_pool *pool,
52 struct mlx5e_xsk_param *xsk,
53 struct mlx5e_rq *rq)
54 {
55 struct mlx5_core_dev *mdev = c->mdev;
56 int rq_xdp_ix;
57 int err;
58
59 rq->wq_type = params->rq_wq_type;
60 rq->pdev = c->pdev;
61 rq->netdev = c->netdev;
62 rq->priv = c->priv;
63 rq->tstamp = c->tstamp;
64 rq->clock = &mdev->clock;
65 rq->icosq = &c->icosq;
66 rq->ix = c->ix;
67 rq->mdev = mdev;
68 rq->hw_mtu = MLX5E_SW2HW_MTU(params, params->sw_mtu);
69 rq->xdpsq = &c->rq_xdpsq;
70 rq->xsk_pool = pool;
71 rq->stats = &c->priv->channel_stats[c->ix].xskrq;
72 rq->ptp_cyc2time = mlx5_rq_ts_translator(mdev);
73 rq_xdp_ix = c->ix + params->num_channels * MLX5E_RQ_GROUP_XSK;
74 err = mlx5e_rq_set_handlers(rq, params, xsk);
75 if (err)
76 return err;
77
78 return xdp_rxq_info_reg(&rq->xdp_rxq, rq->netdev, rq_xdp_ix, 0);
79 }
80
mlx5e_open_xsk_rq(struct mlx5e_channel * c,struct mlx5e_params * params,struct mlx5e_rq_param * rq_params,struct xsk_buff_pool * pool,struct mlx5e_xsk_param * xsk)81 static int mlx5e_open_xsk_rq(struct mlx5e_channel *c, struct mlx5e_params *params,
82 struct mlx5e_rq_param *rq_params, struct xsk_buff_pool *pool,
83 struct mlx5e_xsk_param *xsk)
84 {
85 int err;
86
87 err = mlx5e_init_xsk_rq(c, params, pool, xsk, &c->xskrq);
88 if (err)
89 return err;
90
91 return mlx5e_open_rq(params, rq_params, xsk, cpu_to_node(c->cpu), &c->xskrq);
92 }
93
mlx5e_open_xsk(struct mlx5e_priv * priv,struct mlx5e_params * params,struct mlx5e_xsk_param * xsk,struct xsk_buff_pool * pool,struct mlx5e_channel * c)94 int mlx5e_open_xsk(struct mlx5e_priv *priv, struct mlx5e_params *params,
95 struct mlx5e_xsk_param *xsk, struct xsk_buff_pool *pool,
96 struct mlx5e_channel *c)
97 {
98 struct mlx5e_channel_param *cparam;
99 struct mlx5e_create_cq_param ccp;
100 int err;
101
102 mlx5e_build_create_cq_param(&ccp, c);
103
104 if (!mlx5e_validate_xsk_param(params, xsk, priv->mdev))
105 return -EINVAL;
106
107 cparam = kvzalloc(sizeof(*cparam), GFP_KERNEL);
108 if (!cparam)
109 return -ENOMEM;
110
111 mlx5e_build_xsk_cparam(priv->mdev, params, xsk, priv->q_counter, cparam);
112
113 err = mlx5e_open_cq(c->priv, params->rx_cq_moderation, &cparam->rq.cqp, &ccp,
114 &c->xskrq.cq);
115 if (unlikely(err))
116 goto err_free_cparam;
117
118 err = mlx5e_open_xsk_rq(c, params, &cparam->rq, pool, xsk);
119 if (unlikely(err))
120 goto err_close_rx_cq;
121
122 err = mlx5e_open_cq(c->priv, params->tx_cq_moderation, &cparam->xdp_sq.cqp, &ccp,
123 &c->xsksq.cq);
124 if (unlikely(err))
125 goto err_close_rq;
126
127 /* Create a separate SQ, so that when the buff pool is disabled, we could
128 * close this SQ safely and stop receiving CQEs. In other case, e.g., if
129 * the XDPSQ was used instead, we might run into trouble when the buff pool
130 * is disabled and then re-enabled, but the SQ continues receiving CQEs
131 * from the old buff pool.
132 */
133 err = mlx5e_open_xdpsq(c, params, &cparam->xdp_sq, pool, &c->xsksq, true);
134 if (unlikely(err))
135 goto err_close_tx_cq;
136
137 kvfree(cparam);
138
139 set_bit(MLX5E_CHANNEL_STATE_XSK, c->state);
140
141 return 0;
142
143 err_close_tx_cq:
144 mlx5e_close_cq(&c->xsksq.cq);
145
146 err_close_rq:
147 mlx5e_close_rq(&c->xskrq);
148
149 err_close_rx_cq:
150 mlx5e_close_cq(&c->xskrq.cq);
151
152 err_free_cparam:
153 kvfree(cparam);
154
155 return err;
156 }
157
mlx5e_close_xsk(struct mlx5e_channel * c)158 void mlx5e_close_xsk(struct mlx5e_channel *c)
159 {
160 clear_bit(MLX5E_CHANNEL_STATE_XSK, c->state);
161 synchronize_net(); /* Sync with the XSK wakeup and with NAPI. */
162
163 mlx5e_close_rq(&c->xskrq);
164 mlx5e_close_cq(&c->xskrq.cq);
165 mlx5e_close_xdpsq(&c->xsksq);
166 mlx5e_close_cq(&c->xsksq.cq);
167
168 memset(&c->xskrq, 0, sizeof(c->xskrq));
169 memset(&c->xsksq, 0, sizeof(c->xsksq));
170 }
171
mlx5e_activate_xsk(struct mlx5e_channel * c)172 void mlx5e_activate_xsk(struct mlx5e_channel *c)
173 {
174 /* ICOSQ recovery deactivates RQs. Suspend the recovery to avoid
175 * activating XSKRQ in the middle of recovery.
176 */
177 mlx5e_reporter_icosq_suspend_recovery(c);
178 set_bit(MLX5E_RQ_STATE_ENABLED, &c->xskrq.state);
179 mlx5e_reporter_icosq_resume_recovery(c);
180
181 /* TX queue is created active. */
182
183 spin_lock_bh(&c->async_icosq_lock);
184 mlx5e_trigger_irq(&c->async_icosq);
185 spin_unlock_bh(&c->async_icosq_lock);
186 }
187
mlx5e_deactivate_xsk(struct mlx5e_channel * c)188 void mlx5e_deactivate_xsk(struct mlx5e_channel *c)
189 {
190 /* ICOSQ recovery may reactivate XSKRQ if clear_bit is called in the
191 * middle of recovery. Suspend the recovery to avoid it.
192 */
193 mlx5e_reporter_icosq_suspend_recovery(c);
194 clear_bit(MLX5E_RQ_STATE_ENABLED, &c->xskrq.state);
195 mlx5e_reporter_icosq_resume_recovery(c);
196 synchronize_net(); /* Sync with NAPI to prevent mlx5e_post_rx_wqes. */
197
198 /* TX queue is disabled on close. */
199 }
200