1 // SPDX-License-Identifier: (GPL-2.0 OR MIT)
2 /* Google virtual Ethernet (gve) driver
3 *
4 * Copyright (C) 2015-2024 Google LLC
5 */
6
7 #include <linux/rtnetlink.h>
8 #include "gve.h"
9 #include "gve_adminq.h"
10 #include "gve_dqo.h"
11 #include "gve_utils.h"
12
gve_get_drvinfo(struct net_device * netdev,struct ethtool_drvinfo * info)13 static void gve_get_drvinfo(struct net_device *netdev,
14 struct ethtool_drvinfo *info)
15 {
16 struct gve_priv *priv = netdev_priv(netdev);
17
18 strscpy(info->driver, gve_driver_name, sizeof(info->driver));
19 strscpy(info->version, gve_version_str, sizeof(info->version));
20 strscpy(info->bus_info, pci_name(priv->pdev), sizeof(info->bus_info));
21 }
22
/* ethtool set_msglevel handler: store @value as the driver's msg_enable mask. */
static void gve_set_msglevel(struct net_device *netdev, u32 value)
{
	struct gve_priv *gve = netdev_priv(netdev);

	gve->msg_enable = value;
}
29
gve_get_msglevel(struct net_device * netdev)30 static u32 gve_get_msglevel(struct net_device *netdev)
31 {
32 struct gve_priv *priv = netdev_priv(netdev);
33
34 return priv->msg_enable;
35 }
36
37 /* For the following stats column string names, make sure the order
38 * matches how it is filled in the code. For xdp_aborted, xdp_drop,
39 * xdp_pass, xdp_tx, xdp_redirect, make sure it also matches the order
40 * as declared in enum xdp_action inside file uapi/linux/bpf.h .
41 */
42 static const char gve_gstrings_main_stats[][ETH_GSTRING_LEN] = {
43 "rx_packets", "rx_hsplit_pkt", "tx_packets", "rx_bytes",
44 "tx_bytes", "rx_dropped", "tx_dropped", "tx_timeouts",
45 "rx_skb_alloc_fail", "rx_buf_alloc_fail", "rx_desc_err_dropped_pkt",
46 "rx_hsplit_unsplit_pkt",
47 "interface_up_cnt", "interface_down_cnt", "reset_cnt",
48 "page_alloc_fail", "dma_mapping_error", "stats_report_trigger_cnt",
49 };
50
51 static const char gve_gstrings_rx_stats[][ETH_GSTRING_LEN] = {
52 "rx_posted_desc[%u]", "rx_completed_desc[%u]", "rx_consumed_desc[%u]",
53 "rx_bytes[%u]", "rx_hsplit_bytes[%u]", "rx_cont_packet_cnt[%u]",
54 "rx_frag_flip_cnt[%u]", "rx_frag_copy_cnt[%u]", "rx_frag_alloc_cnt[%u]",
55 "rx_dropped_pkt[%u]", "rx_copybreak_pkt[%u]", "rx_copied_pkt[%u]",
56 "rx_queue_drop_cnt[%u]", "rx_no_buffers_posted[%u]",
57 "rx_drops_packet_over_mru[%u]", "rx_drops_invalid_checksum[%u]",
58 "rx_xdp_aborted[%u]", "rx_xdp_drop[%u]", "rx_xdp_pass[%u]",
59 "rx_xdp_tx[%u]", "rx_xdp_redirect[%u]",
60 "rx_xdp_tx_errors[%u]", "rx_xdp_redirect_errors[%u]", "rx_xdp_alloc_fails[%u]",
61 };
62
63 static const char gve_gstrings_tx_stats[][ETH_GSTRING_LEN] = {
64 "tx_posted_desc[%u]", "tx_completed_desc[%u]", "tx_consumed_desc[%u]", "tx_bytes[%u]",
65 "tx_wake[%u]", "tx_stop[%u]", "tx_event_counter[%u]",
66 "tx_dma_mapping_error[%u]",
67 "tx_xsk_sent[%u]", "tx_xdp_xmit[%u]", "tx_xdp_xmit_errors[%u]"
68 };
69
70 static const char gve_gstrings_adminq_stats[][ETH_GSTRING_LEN] = {
71 "adminq_prod_cnt", "adminq_cmd_fail", "adminq_timeouts",
72 "adminq_describe_device_cnt", "adminq_cfg_device_resources_cnt",
73 "adminq_register_page_list_cnt", "adminq_unregister_page_list_cnt",
74 "adminq_create_tx_queue_cnt", "adminq_create_rx_queue_cnt",
75 "adminq_destroy_tx_queue_cnt", "adminq_destroy_rx_queue_cnt",
76 "adminq_dcfg_device_resources_cnt", "adminq_set_driver_parameter_cnt",
77 "adminq_report_stats_cnt", "adminq_report_link_speed_cnt", "adminq_get_ptype_map_cnt",
78 "adminq_query_flow_rules", "adminq_cfg_flow_rule", "adminq_cfg_rss_cnt",
79 "adminq_query_rss_cnt",
80 };
81
/* Names of the ethtool private flags (ETH_SS_PRIV_FLAGS string set). The only
 * flag, "report-stats", is the one the priv-flag handlers treat as BIT(0).
 */
static const char gve_gstrings_priv_flags[][ETH_GSTRING_LEN] = {
	"report-stats",
};
85
/* Number of entries in each name table. NUM_GVE_TX_CNTS and NUM_GVE_RX_CNTS
 * are the counts for a single TX or RX queue.
 */
#define GVE_MAIN_STATS_LEN ARRAY_SIZE(gve_gstrings_main_stats)
#define GVE_ADMINQ_STATS_LEN ARRAY_SIZE(gve_gstrings_adminq_stats)
#define NUM_GVE_TX_CNTS ARRAY_SIZE(gve_gstrings_tx_stats)
#define NUM_GVE_RX_CNTS ARRAY_SIZE(gve_gstrings_rx_stats)
#define GVE_PRIV_FLAGS_STR_LEN ARRAY_SIZE(gve_gstrings_priv_flags)
91
/* ethtool get_strings handler: write the names of @stringset into @data.
 *
 * ETH_SS_STATS emits, in order: the main stats, the RX stat names once per RX
 * queue, the TX stat names once per TX queue (as counted by
 * gve_num_tx_queues()), then the admin queue stats. The per-queue names are
 * format strings whose "%u" is filled with the queue index. This order has to
 * match the order in which the stat values are filled in.
 *
 * ETH_SS_PRIV_FLAGS emits the private flag names. Any other string set leaves
 * @data untouched.
 */
static void gve_get_strings(struct net_device *netdev, u32 stringset, u8 *data)
{
	struct gve_priv *priv = netdev_priv(netdev);
	/* Output cursor, handed by address to the ethtool string helpers.
	 * @data already has the right type, so no cast is needed.
	 */
	u8 *s = data;
	int num_tx_queues;
	int i, j;

	num_tx_queues = gve_num_tx_queues(priv);
	switch (stringset) {
	case ETH_SS_STATS:
		for (i = 0; i < ARRAY_SIZE(gve_gstrings_main_stats); i++)
			ethtool_puts(&s, gve_gstrings_main_stats[i]);

		for (i = 0; i < priv->rx_cfg.num_queues; i++) {
			for (j = 0; j < NUM_GVE_RX_CNTS; j++) {
				ethtool_sprintf(&s, gve_gstrings_rx_stats[j],
						i);
			}
		}

		for (i = 0; i < num_tx_queues; i++) {
			for (j = 0; j < NUM_GVE_TX_CNTS; j++) {
				ethtool_sprintf(&s, gve_gstrings_tx_stats[j],
						i);
			}
		}

		for (i = 0; i < ARRAY_SIZE(gve_gstrings_adminq_stats); i++)
			ethtool_puts(&s, gve_gstrings_adminq_stats[i]);

		break;

	case ETH_SS_PRIV_FLAGS:
		for (i = 0; i < ARRAY_SIZE(gve_gstrings_priv_flags); i++)
			ethtool_puts(&s, gve_gstrings_priv_flags[i]);
		break;

	default:
		break;
	}
}
129
gve_get_sset_count(struct net_device * netdev,int sset)130 static int gve_get_sset_count(struct net_device *netdev, int sset)
131 {
132 struct gve_priv *priv = netdev_priv(netdev);
133 int num_tx_queues;
134
135 num_tx_queues = gve_num_tx_queues(priv);
136 switch (sset) {
137 case ETH_SS_STATS:
138 return GVE_MAIN_STATS_LEN + GVE_ADMINQ_STATS_LEN +
139 (priv->rx_cfg.num_queues * NUM_GVE_RX_CNTS) +
140 (num_tx_queues * NUM_GVE_TX_CNTS);
141 case ETH_SS_PRIV_FLAGS:
142 return GVE_PRIV_FLAGS_STR_LEN;
143 default:
144 return -EOPNOTSUPP;
145 }
146 }
147
148 static void
gve_get_ethtool_stats(struct net_device * netdev,struct ethtool_stats * stats,u64 * data)149 gve_get_ethtool_stats(struct net_device *netdev,
150 struct ethtool_stats *stats, u64 *data)
151 {
152 u64 tmp_rx_pkts, tmp_rx_hsplit_pkt, tmp_rx_bytes, tmp_rx_hsplit_bytes,
153 tmp_rx_skb_alloc_fail, tmp_rx_buf_alloc_fail,
154 tmp_rx_desc_err_dropped_pkt, tmp_rx_hsplit_unsplit_pkt,
155 tmp_tx_pkts, tmp_tx_bytes;
156 u64 rx_buf_alloc_fail, rx_desc_err_dropped_pkt, rx_hsplit_unsplit_pkt,
157 rx_pkts, rx_hsplit_pkt, rx_skb_alloc_fail, rx_bytes, tx_pkts, tx_bytes,
158 tx_dropped;
159 int stats_idx, base_stats_idx, max_stats_idx;
160 struct stats *report_stats;
161 int *rx_qid_to_stats_idx;
162 int *tx_qid_to_stats_idx;
163 int num_stopped_rxqs = 0;
164 int num_stopped_txqs = 0;
165 struct gve_priv *priv;
166 bool skip_nic_stats;
167 unsigned int start;
168 int num_tx_queues;
169 int ring;
170 int i, j;
171
172 ASSERT_RTNL();
173
174 priv = netdev_priv(netdev);
175 num_tx_queues = gve_num_tx_queues(priv);
176 report_stats = priv->stats_report->stats;
177 rx_qid_to_stats_idx = kmalloc_array(priv->rx_cfg.num_queues,
178 sizeof(int), GFP_KERNEL);
179 if (!rx_qid_to_stats_idx)
180 return;
181 for (ring = 0; ring < priv->rx_cfg.num_queues; ring++) {
182 rx_qid_to_stats_idx[ring] = -1;
183 if (!gve_rx_was_added_to_block(priv, ring))
184 num_stopped_rxqs++;
185 }
186 tx_qid_to_stats_idx = kmalloc_array(num_tx_queues,
187 sizeof(int), GFP_KERNEL);
188 if (!tx_qid_to_stats_idx) {
189 kfree(rx_qid_to_stats_idx);
190 return;
191 }
192 for (ring = 0; ring < num_tx_queues; ring++) {
193 tx_qid_to_stats_idx[ring] = -1;
194 if (!gve_tx_was_added_to_block(priv, ring))
195 num_stopped_txqs++;
196 }
197
198 for (rx_pkts = 0, rx_bytes = 0, rx_hsplit_pkt = 0,
199 rx_skb_alloc_fail = 0, rx_buf_alloc_fail = 0,
200 rx_desc_err_dropped_pkt = 0, rx_hsplit_unsplit_pkt = 0,
201 ring = 0;
202 ring < priv->rx_cfg.num_queues; ring++) {
203 if (priv->rx) {
204 do {
205 struct gve_rx_ring *rx = &priv->rx[ring];
206
207 start =
208 u64_stats_fetch_begin(&priv->rx[ring].statss);
209 tmp_rx_pkts = rx->rpackets;
210 tmp_rx_hsplit_pkt = rx->rx_hsplit_pkt;
211 tmp_rx_bytes = rx->rbytes;
212 tmp_rx_skb_alloc_fail = rx->rx_skb_alloc_fail;
213 tmp_rx_buf_alloc_fail = rx->rx_buf_alloc_fail;
214 tmp_rx_desc_err_dropped_pkt =
215 rx->rx_desc_err_dropped_pkt;
216 tmp_rx_hsplit_unsplit_pkt =
217 rx->rx_hsplit_unsplit_pkt;
218 } while (u64_stats_fetch_retry(&priv->rx[ring].statss,
219 start));
220 rx_pkts += tmp_rx_pkts;
221 rx_hsplit_pkt += tmp_rx_hsplit_pkt;
222 rx_bytes += tmp_rx_bytes;
223 rx_skb_alloc_fail += tmp_rx_skb_alloc_fail;
224 rx_buf_alloc_fail += tmp_rx_buf_alloc_fail;
225 rx_desc_err_dropped_pkt += tmp_rx_desc_err_dropped_pkt;
226 rx_hsplit_unsplit_pkt += tmp_rx_hsplit_unsplit_pkt;
227 }
228 }
229 for (tx_pkts = 0, tx_bytes = 0, tx_dropped = 0, ring = 0;
230 ring < num_tx_queues; ring++) {
231 if (priv->tx) {
232 do {
233 start =
234 u64_stats_fetch_begin(&priv->tx[ring].statss);
235 tmp_tx_pkts = priv->tx[ring].pkt_done;
236 tmp_tx_bytes = priv->tx[ring].bytes_done;
237 } while (u64_stats_fetch_retry(&priv->tx[ring].statss,
238 start));
239 tx_pkts += tmp_tx_pkts;
240 tx_bytes += tmp_tx_bytes;
241 tx_dropped += priv->tx[ring].dropped_pkt;
242 }
243 }
244
245 i = 0;
246 data[i++] = rx_pkts;
247 data[i++] = rx_hsplit_pkt;
248 data[i++] = tx_pkts;
249 data[i++] = rx_bytes;
250 data[i++] = tx_bytes;
251 /* total rx dropped packets */
252 data[i++] = rx_skb_alloc_fail + rx_buf_alloc_fail +
253 rx_desc_err_dropped_pkt;
254 data[i++] = tx_dropped;
255 data[i++] = priv->tx_timeo_cnt;
256 data[i++] = rx_skb_alloc_fail;
257 data[i++] = rx_buf_alloc_fail;
258 data[i++] = rx_desc_err_dropped_pkt;
259 data[i++] = rx_hsplit_unsplit_pkt;
260 data[i++] = priv->interface_up_cnt;
261 data[i++] = priv->interface_down_cnt;
262 data[i++] = priv->reset_cnt;
263 data[i++] = priv->page_alloc_fail;
264 data[i++] = priv->dma_mapping_error;
265 data[i++] = priv->stats_report_trigger_cnt;
266 i = GVE_MAIN_STATS_LEN;
267
268 /* For rx cross-reporting stats, start from nic rx stats in report */
269 base_stats_idx = GVE_TX_STATS_REPORT_NUM * num_tx_queues +
270 GVE_RX_STATS_REPORT_NUM * priv->rx_cfg.num_queues;
271 /* The boundary between driver stats and NIC stats shifts if there are
272 * stopped queues.
273 */
274 base_stats_idx += NIC_RX_STATS_REPORT_NUM * num_stopped_rxqs +
275 NIC_TX_STATS_REPORT_NUM * num_stopped_txqs;
276 max_stats_idx = NIC_RX_STATS_REPORT_NUM *
277 (priv->rx_cfg.num_queues - num_stopped_rxqs) +
278 base_stats_idx;
279 /* Preprocess the stats report for rx, map queue id to start index */
280 skip_nic_stats = false;
281 for (stats_idx = base_stats_idx; stats_idx < max_stats_idx;
282 stats_idx += NIC_RX_STATS_REPORT_NUM) {
283 u32 stat_name = be32_to_cpu(report_stats[stats_idx].stat_name);
284 u32 queue_id = be32_to_cpu(report_stats[stats_idx].queue_id);
285
286 if (stat_name == 0) {
287 /* no stats written by NIC yet */
288 skip_nic_stats = true;
289 break;
290 }
291 if (queue_id < 0 || queue_id >= priv->rx_cfg.num_queues) {
292 net_err_ratelimited("Invalid rxq id in NIC stats\n");
293 continue;
294 }
295 rx_qid_to_stats_idx[queue_id] = stats_idx;
296 }
297 /* walk RX rings */
298 if (priv->rx) {
299 for (ring = 0; ring < priv->rx_cfg.num_queues; ring++) {
300 struct gve_rx_ring *rx = &priv->rx[ring];
301
302 data[i++] = rx->fill_cnt;
303 data[i++] = rx->cnt;
304 data[i++] = rx->fill_cnt - rx->cnt;
305 do {
306 start =
307 u64_stats_fetch_begin(&priv->rx[ring].statss);
308 tmp_rx_bytes = rx->rbytes;
309 tmp_rx_hsplit_bytes = rx->rx_hsplit_bytes;
310 tmp_rx_skb_alloc_fail = rx->rx_skb_alloc_fail;
311 tmp_rx_buf_alloc_fail = rx->rx_buf_alloc_fail;
312 tmp_rx_desc_err_dropped_pkt =
313 rx->rx_desc_err_dropped_pkt;
314 } while (u64_stats_fetch_retry(&priv->rx[ring].statss,
315 start));
316 data[i++] = tmp_rx_bytes;
317 data[i++] = tmp_rx_hsplit_bytes;
318 data[i++] = rx->rx_cont_packet_cnt;
319 data[i++] = rx->rx_frag_flip_cnt;
320 data[i++] = rx->rx_frag_copy_cnt;
321 data[i++] = rx->rx_frag_alloc_cnt;
322 /* rx dropped packets */
323 data[i++] = tmp_rx_skb_alloc_fail +
324 tmp_rx_buf_alloc_fail +
325 tmp_rx_desc_err_dropped_pkt;
326 data[i++] = rx->rx_copybreak_pkt;
327 data[i++] = rx->rx_copied_pkt;
328 /* stats from NIC */
329 stats_idx = rx_qid_to_stats_idx[ring];
330 if (skip_nic_stats || stats_idx < 0) {
331 /* skip NIC rx stats */
332 i += NIC_RX_STATS_REPORT_NUM;
333 } else {
334 for (j = 0; j < NIC_RX_STATS_REPORT_NUM; j++) {
335 u64 value =
336 be64_to_cpu(report_stats[stats_idx + j].value);
337
338 data[i++] = value;
339 }
340 }
341 /* XDP rx counters */
342 do {
343 start = u64_stats_fetch_begin(&priv->rx[ring].statss);
344 for (j = 0; j < GVE_XDP_ACTIONS; j++)
345 data[i + j] = rx->xdp_actions[j];
346 data[i + j++] = rx->xdp_tx_errors;
347 data[i + j++] = rx->xdp_redirect_errors;
348 data[i + j++] = rx->xdp_alloc_fails;
349 } while (u64_stats_fetch_retry(&priv->rx[ring].statss,
350 start));
351 i += GVE_XDP_ACTIONS + 3; /* XDP rx counters */
352 }
353 } else {
354 i += priv->rx_cfg.num_queues * NUM_GVE_RX_CNTS;
355 }
356
357 /* For tx cross-reporting stats, start from nic tx stats in report */
358 base_stats_idx = max_stats_idx;
359 max_stats_idx = NIC_TX_STATS_REPORT_NUM *
360 (num_tx_queues - num_stopped_txqs) +
361 max_stats_idx;
362 /* Preprocess the stats report for tx, map queue id to start index */
363 skip_nic_stats = false;
364 for (stats_idx = base_stats_idx; stats_idx < max_stats_idx;
365 stats_idx += NIC_TX_STATS_REPORT_NUM) {
366 u32 stat_name = be32_to_cpu(report_stats[stats_idx].stat_name);
367 u32 queue_id = be32_to_cpu(report_stats[stats_idx].queue_id);
368
369 if (stat_name == 0) {
370 /* no stats written by NIC yet */
371 skip_nic_stats = true;
372 break;
373 }
374 if (queue_id < 0 || queue_id >= num_tx_queues) {
375 net_err_ratelimited("Invalid txq id in NIC stats\n");
376 continue;
377 }
378 tx_qid_to_stats_idx[queue_id] = stats_idx;
379 }
380 /* walk TX rings */
381 if (priv->tx) {
382 for (ring = 0; ring < num_tx_queues; ring++) {
383 struct gve_tx_ring *tx = &priv->tx[ring];
384
385 if (gve_is_gqi(priv)) {
386 data[i++] = tx->req;
387 data[i++] = tx->done;
388 data[i++] = tx->req - tx->done;
389 } else {
390 /* DQO doesn't currently support
391 * posted/completed descriptor counts;
392 */
393 data[i++] = 0;
394 data[i++] = 0;
395 data[i++] =
396 (tx->dqo_tx.tail - tx->dqo_tx.head) &
397 tx->mask;
398 }
399 do {
400 start =
401 u64_stats_fetch_begin(&priv->tx[ring].statss);
402 tmp_tx_bytes = tx->bytes_done;
403 } while (u64_stats_fetch_retry(&priv->tx[ring].statss,
404 start));
405 data[i++] = tmp_tx_bytes;
406 data[i++] = tx->wake_queue;
407 data[i++] = tx->stop_queue;
408 data[i++] = gve_tx_load_event_counter(priv, tx);
409 data[i++] = tx->dma_mapping_error;
410 /* stats from NIC */
411 stats_idx = tx_qid_to_stats_idx[ring];
412 if (skip_nic_stats || stats_idx < 0) {
413 /* skip NIC tx stats */
414 i += NIC_TX_STATS_REPORT_NUM;
415 } else {
416 for (j = 0; j < NIC_TX_STATS_REPORT_NUM; j++) {
417 u64 value =
418 be64_to_cpu(report_stats[stats_idx + j].value);
419 data[i++] = value;
420 }
421 }
422 /* XDP counters */
423 do {
424 start = u64_stats_fetch_begin(&priv->tx[ring].statss);
425 data[i] = tx->xdp_xsk_sent;
426 data[i + 1] = tx->xdp_xmit;
427 data[i + 2] = tx->xdp_xmit_errors;
428 } while (u64_stats_fetch_retry(&priv->tx[ring].statss,
429 start));
430 i += 3; /* XDP tx counters */
431 }
432 } else {
433 i += num_tx_queues * NUM_GVE_TX_CNTS;
434 }
435
436 kfree(rx_qid_to_stats_idx);
437 kfree(tx_qid_to_stats_idx);
438 /* AQ Stats */
439 data[i++] = priv->adminq_prod_cnt;
440 data[i++] = priv->adminq_cmd_fail;
441 data[i++] = priv->adminq_timeouts;
442 data[i++] = priv->adminq_describe_device_cnt;
443 data[i++] = priv->adminq_cfg_device_resources_cnt;
444 data[i++] = priv->adminq_register_page_list_cnt;
445 data[i++] = priv->adminq_unregister_page_list_cnt;
446 data[i++] = priv->adminq_create_tx_queue_cnt;
447 data[i++] = priv->adminq_create_rx_queue_cnt;
448 data[i++] = priv->adminq_destroy_tx_queue_cnt;
449 data[i++] = priv->adminq_destroy_rx_queue_cnt;
450 data[i++] = priv->adminq_dcfg_device_resources_cnt;
451 data[i++] = priv->adminq_set_driver_parameter_cnt;
452 data[i++] = priv->adminq_report_stats_cnt;
453 data[i++] = priv->adminq_report_link_speed_cnt;
454 data[i++] = priv->adminq_get_ptype_map_cnt;
455 data[i++] = priv->adminq_query_flow_rules_cnt;
456 data[i++] = priv->adminq_cfg_flow_rule_cnt;
457 data[i++] = priv->adminq_cfg_rss_cnt;
458 data[i++] = priv->adminq_query_rss_cnt;
459 }
460
gve_get_channels(struct net_device * netdev,struct ethtool_channels * cmd)461 static void gve_get_channels(struct net_device *netdev,
462 struct ethtool_channels *cmd)
463 {
464 struct gve_priv *priv = netdev_priv(netdev);
465
466 cmd->max_rx = priv->rx_cfg.max_queues;
467 cmd->max_tx = priv->tx_cfg.max_queues;
468 cmd->max_other = 0;
469 cmd->max_combined = 0;
470 cmd->rx_count = priv->rx_cfg.num_queues;
471 cmd->tx_count = priv->tx_cfg.num_queues;
472 cmd->other_count = 0;
473 cmd->combined_count = 0;
474 }
475
gve_set_channels(struct net_device * netdev,struct ethtool_channels * cmd)476 static int gve_set_channels(struct net_device *netdev,
477 struct ethtool_channels *cmd)
478 {
479 struct gve_priv *priv = netdev_priv(netdev);
480 struct gve_tx_queue_config new_tx_cfg = priv->tx_cfg;
481 struct gve_rx_queue_config new_rx_cfg = priv->rx_cfg;
482 struct ethtool_channels old_settings;
483 int new_tx = cmd->tx_count;
484 int new_rx = cmd->rx_count;
485 bool reset_rss = false;
486
487 gve_get_channels(netdev, &old_settings);
488
489 /* Changing combined is not allowed */
490 if (cmd->combined_count != old_settings.combined_count)
491 return -EINVAL;
492
493 if (!new_rx || !new_tx)
494 return -EINVAL;
495
496 if (priv->xdp_prog) {
497 if (new_tx != new_rx ||
498 (2 * new_tx > priv->tx_cfg.max_queues)) {
499 dev_err(&priv->pdev->dev, "The number of configured RX queues should be equal to the number of configured TX queues and the number of configured RX/TX queues should be less than or equal to half the maximum number of RX/TX queues when XDP program is installed");
500 return -EINVAL;
501 }
502
503 /* One XDP TX queue per RX queue. */
504 new_tx_cfg.num_xdp_queues = new_rx;
505 } else {
506 new_tx_cfg.num_xdp_queues = 0;
507 }
508
509 if (new_rx != priv->rx_cfg.num_queues &&
510 priv->cache_rss_config && !netif_is_rxfh_configured(netdev))
511 reset_rss = true;
512
513 new_tx_cfg.num_queues = new_tx;
514 new_rx_cfg.num_queues = new_rx;
515
516 return gve_adjust_queues(priv, new_rx_cfg, new_tx_cfg, reset_rss);
517 }
518
gve_get_ringparam(struct net_device * netdev,struct ethtool_ringparam * cmd,struct kernel_ethtool_ringparam * kernel_cmd,struct netlink_ext_ack * extack)519 static void gve_get_ringparam(struct net_device *netdev,
520 struct ethtool_ringparam *cmd,
521 struct kernel_ethtool_ringparam *kernel_cmd,
522 struct netlink_ext_ack *extack)
523 {
524 struct gve_priv *priv = netdev_priv(netdev);
525
526 cmd->rx_max_pending = priv->max_rx_desc_cnt;
527 cmd->tx_max_pending = priv->max_tx_desc_cnt;
528 cmd->rx_pending = priv->rx_desc_cnt;
529 cmd->tx_pending = priv->tx_desc_cnt;
530
531 if (!gve_header_split_supported(priv))
532 kernel_cmd->tcp_data_split = ETHTOOL_TCP_DATA_SPLIT_UNKNOWN;
533 else if (priv->header_split_enabled)
534 kernel_cmd->tcp_data_split = ETHTOOL_TCP_DATA_SPLIT_ENABLED;
535 else
536 kernel_cmd->tcp_data_split = ETHTOOL_TCP_DATA_SPLIT_DISABLED;
537 }
538
/* Apply new TX/RX descriptor ring sizes.
 *
 * Starts from the current allocation configs and overrides only the ring
 * sizes. If the interface is running, the device is reconfigured through
 * gve_adjust_config() and its error, if any, is returned without touching
 * the stored sizes. The stored sizes in @priv are updated afterwards so they
 * also apply to the next interface up.
 *
 * Returns 0 on success or the error from gve_adjust_config().
 */
static int gve_adjust_ring_sizes(struct gve_priv *priv,
				 u16 new_tx_desc_cnt,
				 u16 new_rx_desc_cnt)
{
	struct gve_tx_alloc_rings_cfg tx_cfg = {0};
	struct gve_rx_alloc_rings_cfg rx_cfg = {0};
	int ret = 0;

	/* Snapshot the current queue configuration, then override the sizes */
	gve_get_curr_alloc_cfgs(priv, &tx_cfg, &rx_cfg);
	tx_cfg.ring_size = new_tx_desc_cnt;
	rx_cfg.ring_size = new_rx_desc_cnt;

	if (netif_running(priv->dev))
		ret = gve_adjust_config(priv, &tx_cfg, &rx_cfg);
	if (ret)
		return ret;

	/* Remember the new sizes for the next up */
	priv->tx_desc_cnt = new_tx_desc_cnt;
	priv->rx_desc_cnt = new_rx_desc_cnt;

	return 0;
}
566
/* Check requested TX/RX descriptor counts.
 *
 * Both counts must lie within the device's [min, max] range and must be
 * powers of two. Returns 0 when valid; otherwise logs the reason and returns
 * -EINVAL.
 */
static int gve_validate_req_ring_size(struct gve_priv *priv, u16 new_tx_desc_cnt,
				      u16 new_rx_desc_cnt)
{
	bool tx_in_range = new_tx_desc_cnt >= priv->min_tx_desc_cnt &&
			   new_tx_desc_cnt <= priv->max_tx_desc_cnt;
	bool rx_in_range = new_rx_desc_cnt >= priv->min_rx_desc_cnt &&
			   new_rx_desc_cnt <= priv->max_rx_desc_cnt;

	if (!(tx_in_range && rx_in_range)) {
		dev_err(&priv->pdev->dev, "Requested descriptor count out of range\n");
		return -EINVAL;
	}

	if (!(is_power_of_2(new_tx_desc_cnt) && is_power_of_2(new_rx_desc_cnt))) {
		dev_err(&priv->pdev->dev, "Requested descriptor count has to be a power of 2\n");
		return -EINVAL;
	}

	return 0;
}
585
gve_set_ringparam(struct net_device * netdev,struct ethtool_ringparam * cmd,struct kernel_ethtool_ringparam * kernel_cmd,struct netlink_ext_ack * extack)586 static int gve_set_ringparam(struct net_device *netdev,
587 struct ethtool_ringparam *cmd,
588 struct kernel_ethtool_ringparam *kernel_cmd,
589 struct netlink_ext_ack *extack)
590 {
591 struct gve_priv *priv = netdev_priv(netdev);
592 u16 new_tx_cnt, new_rx_cnt;
593 int err;
594
595 err = gve_set_hsplit_config(priv, kernel_cmd->tcp_data_split);
596 if (err)
597 return err;
598
599 if (cmd->tx_pending == priv->tx_desc_cnt && cmd->rx_pending == priv->rx_desc_cnt)
600 return 0;
601
602 if (!priv->modify_ring_size_enabled) {
603 dev_err(&priv->pdev->dev, "Modify ring size is not supported.\n");
604 return -EOPNOTSUPP;
605 }
606
607 new_tx_cnt = cmd->tx_pending;
608 new_rx_cnt = cmd->rx_pending;
609
610 if (gve_validate_req_ring_size(priv, new_tx_cnt, new_rx_cnt))
611 return -EINVAL;
612
613 return gve_adjust_ring_sizes(priv, new_tx_cnt, new_rx_cnt);
614 }
615
/* ethtool reset handler.
 *
 * Only a request for exactly ETH_RESET_ALL is honoured: *@flags is cleared
 * and the result of gve_reset() is returned. Any other flag combination
 * returns -EOPNOTSUPP and leaves *@flags untouched.
 */
static int gve_user_reset(struct net_device *netdev, u32 *flags)
{
	struct gve_priv *priv = netdev_priv(netdev);

	if (*flags != ETH_RESET_ALL)
		return -EOPNOTSUPP;

	*flags = 0;
	return gve_reset(priv, true);
}
627
gve_get_tunable(struct net_device * netdev,const struct ethtool_tunable * etuna,void * value)628 static int gve_get_tunable(struct net_device *netdev,
629 const struct ethtool_tunable *etuna, void *value)
630 {
631 struct gve_priv *priv = netdev_priv(netdev);
632
633 switch (etuna->id) {
634 case ETHTOOL_RX_COPYBREAK:
635 *(u32 *)value = priv->rx_copybreak;
636 return 0;
637 default:
638 return -EOPNOTSUPP;
639 }
640 }
641
gve_set_tunable(struct net_device * netdev,const struct ethtool_tunable * etuna,const void * value)642 static int gve_set_tunable(struct net_device *netdev,
643 const struct ethtool_tunable *etuna,
644 const void *value)
645 {
646 struct gve_priv *priv = netdev_priv(netdev);
647 u32 len;
648
649 switch (etuna->id) {
650 case ETHTOOL_RX_COPYBREAK:
651 {
652 u32 max_copybreak = priv->rx_cfg.packet_buffer_size;
653
654 len = *(u32 *)value;
655 if (len > max_copybreak)
656 return -EINVAL;
657 priv->rx_copybreak = len;
658 return 0;
659 }
660 default:
661 return -EOPNOTSUPP;
662 }
663 }
664
gve_get_priv_flags(struct net_device * netdev)665 static u32 gve_get_priv_flags(struct net_device *netdev)
666 {
667 struct gve_priv *priv = netdev_priv(netdev);
668 u32 ret_flags = 0;
669
670 /* Only 1 flag exists currently: report-stats (BIT(O)), so set that flag. */
671 if (priv->ethtool_flags & BIT(0))
672 ret_flags |= BIT(0);
673 return ret_flags;
674 }
675
/* ethtool set_priv_flags handler.
 *
 * Only one private flag exists: report-stats, BIT(0).
 *  - When the flag is requested on, it is set and the stats report timer is
 *    (re)armed one stats_report_timer_period from now.
 *  - When it is requested off while it was previously on, the driver-owned
 *    TX and RX entries at the start of the stats report are zeroed and the
 *    timer is deleted.
 *
 * Always returns 0.
 */
static int gve_set_priv_flags(struct net_device *netdev, u32 flags)
{
	struct gve_priv *priv = netdev_priv(netdev);
	int num_tx_queues = gve_num_tx_queues(priv);
	u64 prev_flags = READ_ONCE(priv->ethtool_flags);
	bool report_on = flags & BIT(0);
	bool report_was_on = prev_flags & BIT(0);
	unsigned long expires;
	u64 next_flags;
	int tx_stats_num;
	int rx_stats_num;

	if (report_on)
		next_flags = prev_flags | BIT(0);
	else
		next_flags = prev_flags & ~(BIT(0));
	priv->ethtool_flags = next_flags;

	if (report_on) {
		/* start report-stats timer when user turns report stats on. */
		expires = round_jiffies(jiffies +
					msecs_to_jiffies(priv->stats_report_timer_period));
		mod_timer(&priv->stats_report_timer, expires);
		return 0;
	}

	if (!report_was_on)
		return 0;

	/* report-stats was just turned off: zero the gve stats and delete
	 * the report stats timer.
	 */
	tx_stats_num = GVE_TX_STATS_REPORT_NUM * num_tx_queues;
	rx_stats_num = GVE_RX_STATS_REPORT_NUM * priv->rx_cfg.num_queues;
	memset(priv->stats_report->stats, 0,
	       (tx_stats_num + rx_stats_num) * sizeof(struct stats));
	timer_delete_sync(&priv->stats_report_timer);

	return 0;
}
712
gve_get_link_ksettings(struct net_device * netdev,struct ethtool_link_ksettings * cmd)713 static int gve_get_link_ksettings(struct net_device *netdev,
714 struct ethtool_link_ksettings *cmd)
715 {
716 struct gve_priv *priv = netdev_priv(netdev);
717 int err = 0;
718
719 if (priv->link_speed == 0)
720 err = gve_adminq_report_link_speed(priv);
721
722 cmd->base.speed = priv->link_speed;
723
724 cmd->base.duplex = DUPLEX_FULL;
725
726 return err;
727 }
728
gve_get_coalesce(struct net_device * netdev,struct ethtool_coalesce * ec,struct kernel_ethtool_coalesce * kernel_ec,struct netlink_ext_ack * extack)729 static int gve_get_coalesce(struct net_device *netdev,
730 struct ethtool_coalesce *ec,
731 struct kernel_ethtool_coalesce *kernel_ec,
732 struct netlink_ext_ack *extack)
733 {
734 struct gve_priv *priv = netdev_priv(netdev);
735
736 if (gve_is_gqi(priv))
737 return -EOPNOTSUPP;
738 ec->tx_coalesce_usecs = priv->tx_coalesce_usecs;
739 ec->rx_coalesce_usecs = priv->rx_coalesce_usecs;
740
741 return 0;
742 }
743
gve_set_coalesce(struct net_device * netdev,struct ethtool_coalesce * ec,struct kernel_ethtool_coalesce * kernel_ec,struct netlink_ext_ack * extack)744 static int gve_set_coalesce(struct net_device *netdev,
745 struct ethtool_coalesce *ec,
746 struct kernel_ethtool_coalesce *kernel_ec,
747 struct netlink_ext_ack *extack)
748 {
749 struct gve_priv *priv = netdev_priv(netdev);
750 u32 tx_usecs_orig = priv->tx_coalesce_usecs;
751 u32 rx_usecs_orig = priv->rx_coalesce_usecs;
752 int idx;
753
754 if (gve_is_gqi(priv))
755 return -EOPNOTSUPP;
756
757 if (ec->tx_coalesce_usecs > GVE_MAX_ITR_INTERVAL_DQO ||
758 ec->rx_coalesce_usecs > GVE_MAX_ITR_INTERVAL_DQO)
759 return -EINVAL;
760 priv->tx_coalesce_usecs = ec->tx_coalesce_usecs;
761 priv->rx_coalesce_usecs = ec->rx_coalesce_usecs;
762
763 if (tx_usecs_orig != priv->tx_coalesce_usecs) {
764 for (idx = 0; idx < priv->tx_cfg.num_queues; idx++) {
765 int ntfy_idx = gve_tx_idx_to_ntfy(priv, idx);
766 struct gve_notify_block *block = &priv->ntfy_blocks[ntfy_idx];
767
768 gve_set_itr_coalesce_usecs_dqo(priv, block,
769 priv->tx_coalesce_usecs);
770 }
771 }
772
773 if (rx_usecs_orig != priv->rx_coalesce_usecs) {
774 for (idx = 0; idx < priv->rx_cfg.num_queues; idx++) {
775 int ntfy_idx = gve_rx_idx_to_ntfy(priv, idx);
776 struct gve_notify_block *block = &priv->ntfy_blocks[ntfy_idx];
777
778 gve_set_itr_coalesce_usecs_dqo(priv, block,
779 priv->rx_coalesce_usecs);
780 }
781 }
782
783 return 0;
784 }
785
gve_set_rxnfc(struct net_device * netdev,struct ethtool_rxnfc * cmd)786 static int gve_set_rxnfc(struct net_device *netdev, struct ethtool_rxnfc *cmd)
787 {
788 struct gve_priv *priv = netdev_priv(netdev);
789 int err = 0;
790
791 if (!(netdev->features & NETIF_F_NTUPLE))
792 return -EOPNOTSUPP;
793
794 switch (cmd->cmd) {
795 case ETHTOOL_SRXCLSRLINS:
796 err = gve_add_flow_rule(priv, cmd);
797 break;
798 case ETHTOOL_SRXCLSRLDEL:
799 err = gve_del_flow_rule(priv, cmd);
800 break;
801 case ETHTOOL_SRXFH:
802 err = -EOPNOTSUPP;
803 break;
804 default:
805 err = -EOPNOTSUPP;
806 break;
807 }
808
809 return err;
810 }
811
/* ethtool get_rxnfc handler.
 *
 *  - ETHTOOL_GRXRINGS: report the number of RX queues in cmd->data.
 *  - ETHTOOL_GRXCLSRLCNT: refresh the flow rule stats through the admin
 *    queue, then report the current rule count in cmd->rule_cnt and the
 *    maximum in cmd->data; -EOPNOTSUPP when the device has no flow rules.
 *  - ETHTOOL_GRXCLSRULE: look up a single flow rule.
 *  - ETHTOOL_GRXCLSRLALL: list flow rule ids into @rule_locs.
 *  - anything else, including ETHTOOL_GRXFH: -EOPNOTSUPP.
 *
 * Returns 0 on success or a negative errno.
 */
static int gve_get_rxnfc(struct net_device *netdev, struct ethtool_rxnfc *cmd, u32 *rule_locs)
{
	struct gve_priv *priv = netdev_priv(netdev);
	int ret;

	switch (cmd->cmd) {
	case ETHTOOL_GRXRINGS:
		cmd->data = priv->rx_cfg.num_queues;
		return 0;
	case ETHTOOL_GRXCLSRLCNT:
		if (!priv->max_flow_rules)
			return -EOPNOTSUPP;

		ret = gve_adminq_query_flow_rules(priv, GVE_FLOW_RULE_QUERY_STATS, 0);
		if (ret)
			return ret;

		cmd->rule_cnt = priv->num_flow_rules;
		cmd->data = priv->max_flow_rules;
		return 0;
	case ETHTOOL_GRXCLSRULE:
		return gve_get_flow_rule_entry(priv, cmd);
	case ETHTOOL_GRXCLSRLALL:
		return gve_get_flow_rule_ids(priv, cmd, rule_locs);
	case ETHTOOL_GRXFH:
	default:
		return -EOPNOTSUPP;
	}
}
848
gve_get_rxfh_key_size(struct net_device * netdev)849 static u32 gve_get_rxfh_key_size(struct net_device *netdev)
850 {
851 struct gve_priv *priv = netdev_priv(netdev);
852
853 return priv->rss_key_size;
854 }
855
gve_get_rxfh_indir_size(struct net_device * netdev)856 static u32 gve_get_rxfh_indir_size(struct net_device *netdev)
857 {
858 struct gve_priv *priv = netdev_priv(netdev);
859
860 return priv->rss_lut_size;
861 }
862
gve_get_rss_config_cache(struct gve_priv * priv,struct ethtool_rxfh_param * rxfh)863 static void gve_get_rss_config_cache(struct gve_priv *priv,
864 struct ethtool_rxfh_param *rxfh)
865 {
866 struct gve_rss_config *rss_config = &priv->rss_config;
867
868 rxfh->hfunc = ETH_RSS_HASH_TOP;
869
870 if (rxfh->key) {
871 rxfh->key_size = priv->rss_key_size;
872 memcpy(rxfh->key, rss_config->hash_key, priv->rss_key_size);
873 }
874
875 if (rxfh->indir) {
876 rxfh->indir_size = priv->rss_lut_size;
877 memcpy(rxfh->indir, rss_config->hash_lut,
878 priv->rss_lut_size * sizeof(*rxfh->indir));
879 }
880 }
881
gve_get_rxfh(struct net_device * netdev,struct ethtool_rxfh_param * rxfh)882 static int gve_get_rxfh(struct net_device *netdev, struct ethtool_rxfh_param *rxfh)
883 {
884 struct gve_priv *priv = netdev_priv(netdev);
885
886 if (!priv->rss_key_size || !priv->rss_lut_size)
887 return -EOPNOTSUPP;
888
889 if (priv->cache_rss_config) {
890 gve_get_rss_config_cache(priv, rxfh);
891 return 0;
892 }
893
894 return gve_adminq_query_rss_config(priv, rxfh);
895 }
896
gve_set_rss_config_cache(struct gve_priv * priv,struct ethtool_rxfh_param * rxfh)897 static void gve_set_rss_config_cache(struct gve_priv *priv,
898 struct ethtool_rxfh_param *rxfh)
899 {
900 struct gve_rss_config *rss_config = &priv->rss_config;
901
902 if (rxfh->key)
903 memcpy(rss_config->hash_key, rxfh->key, priv->rss_key_size);
904
905 if (rxfh->indir)
906 memcpy(rss_config->hash_lut, rxfh->indir,
907 priv->rss_lut_size * sizeof(*rxfh->indir));
908 }
909
gve_set_rxfh(struct net_device * netdev,struct ethtool_rxfh_param * rxfh,struct netlink_ext_ack * extack)910 static int gve_set_rxfh(struct net_device *netdev, struct ethtool_rxfh_param *rxfh,
911 struct netlink_ext_ack *extack)
912 {
913 struct gve_priv *priv = netdev_priv(netdev);
914 int err;
915
916 if (!priv->rss_key_size || !priv->rss_lut_size)
917 return -EOPNOTSUPP;
918
919 err = gve_adminq_configure_rss(priv, rxfh);
920 if (err) {
921 NL_SET_ERR_MSG_MOD(extack, "Fail to configure RSS config");
922 return err;
923 }
924
925 if (priv->cache_rss_config)
926 gve_set_rss_config_cache(priv, rxfh);
927
928 return 0;
929 }
930
931 const struct ethtool_ops gve_ethtool_ops = {
932 .supported_coalesce_params = ETHTOOL_COALESCE_USECS,
933 .supported_ring_params = ETHTOOL_RING_USE_TCP_DATA_SPLIT,
934 .get_drvinfo = gve_get_drvinfo,
935 .get_strings = gve_get_strings,
936 .get_sset_count = gve_get_sset_count,
937 .get_ethtool_stats = gve_get_ethtool_stats,
938 .set_msglevel = gve_set_msglevel,
939 .get_msglevel = gve_get_msglevel,
940 .set_channels = gve_set_channels,
941 .get_channels = gve_get_channels,
942 .set_rxnfc = gve_set_rxnfc,
943 .get_rxnfc = gve_get_rxnfc,
944 .get_rxfh_indir_size = gve_get_rxfh_indir_size,
945 .get_rxfh_key_size = gve_get_rxfh_key_size,
946 .get_rxfh = gve_get_rxfh,
947 .set_rxfh = gve_set_rxfh,
948 .get_link = ethtool_op_get_link,
949 .get_coalesce = gve_get_coalesce,
950 .set_coalesce = gve_set_coalesce,
951 .get_ringparam = gve_get_ringparam,
952 .set_ringparam = gve_set_ringparam,
953 .reset = gve_user_reset,
954 .get_tunable = gve_get_tunable,
955 .set_tunable = gve_set_tunable,
956 .get_priv_flags = gve_get_priv_flags,
957 .set_priv_flags = gve_set_priv_flags,
958 .get_link_ksettings = gve_get_link_ksettings,
959 .get_ts_info = ethtool_op_get_ts_info,
960 };
961