xref: /linux-6.15/net/core/netdev-genl.c (revision 8af2136e)
1 // SPDX-License-Identifier: GPL-2.0-only
2 
3 #include <linux/netdevice.h>
4 #include <linux/notifier.h>
5 #include <linux/rtnetlink.h>
6 #include <net/busy_poll.h>
7 #include <net/net_namespace.h>
8 #include <net/netdev_queues.h>
9 #include <net/netdev_rx_queue.h>
10 #include <net/sock.h>
11 #include <net/xdp.h>
12 #include <net/xdp_sock.h>
13 #include <net/page_pool/memory_provider.h>
14 
15 #include "dev.h"
16 #include "devmem.h"
17 #include "netdev-genl-gen.h"
18 
/* Resume state for the dump handlers in this file; overlaid on the
 * netlink_callback's ctx area by netdev_dump_ctx().
 */
struct netdev_nl_dump_ctx {
	unsigned long	ifindex;	/* cursor of the for_each_netdev_*() walks */
	unsigned int	rxq_idx;	/* next Rx queue to dump on the current netdev */
	unsigned int	txq_idx;	/* next Tx queue to dump on the current netdev */
	unsigned int	napi_id;	/* last NAPI id dumped on the current netdev, 0 if none */
};
25 
26 static struct netdev_nl_dump_ctx *netdev_dump_ctx(struct netlink_callback *cb)
27 {
28 	NL_ASSERT_CTX_FITS(struct netdev_nl_dump_ctx);
29 
30 	return (struct netdev_nl_dump_ctx *)cb->ctx;
31 }
32 
33 static int
34 netdev_nl_dev_fill(struct net_device *netdev, struct sk_buff *rsp,
35 		   const struct genl_info *info)
36 {
37 	u64 xsk_features = 0;
38 	u64 xdp_rx_meta = 0;
39 	void *hdr;
40 
41 	hdr = genlmsg_iput(rsp, info);
42 	if (!hdr)
43 		return -EMSGSIZE;
44 
45 #define XDP_METADATA_KFUNC(_, flag, __, xmo) \
46 	if (netdev->xdp_metadata_ops && netdev->xdp_metadata_ops->xmo) \
47 		xdp_rx_meta |= flag;
48 XDP_METADATA_KFUNC_xxx
49 #undef XDP_METADATA_KFUNC
50 
51 	if (netdev->xsk_tx_metadata_ops) {
52 		if (netdev->xsk_tx_metadata_ops->tmo_fill_timestamp)
53 			xsk_features |= NETDEV_XSK_FLAGS_TX_TIMESTAMP;
54 		if (netdev->xsk_tx_metadata_ops->tmo_request_checksum)
55 			xsk_features |= NETDEV_XSK_FLAGS_TX_CHECKSUM;
56 	}
57 
58 	if (nla_put_u32(rsp, NETDEV_A_DEV_IFINDEX, netdev->ifindex) ||
59 	    nla_put_u64_64bit(rsp, NETDEV_A_DEV_XDP_FEATURES,
60 			      netdev->xdp_features, NETDEV_A_DEV_PAD) ||
61 	    nla_put_u64_64bit(rsp, NETDEV_A_DEV_XDP_RX_METADATA_FEATURES,
62 			      xdp_rx_meta, NETDEV_A_DEV_PAD) ||
63 	    nla_put_u64_64bit(rsp, NETDEV_A_DEV_XSK_FEATURES,
64 			      xsk_features, NETDEV_A_DEV_PAD))
65 		goto err_cancel_msg;
66 
67 	if (netdev->xdp_features & NETDEV_XDP_ACT_XSK_ZEROCOPY) {
68 		if (nla_put_u32(rsp, NETDEV_A_DEV_XDP_ZC_MAX_SEGS,
69 				netdev->xdp_zc_max_segs))
70 			goto err_cancel_msg;
71 	}
72 
73 	genlmsg_end(rsp, hdr);
74 
75 	return 0;
76 
77 err_cancel_msg:
78 	genlmsg_cancel(rsp, hdr);
79 	return -EMSGSIZE;
80 }
81 
82 static void
83 netdev_genl_dev_notify(struct net_device *netdev, int cmd)
84 {
85 	struct genl_info info;
86 	struct sk_buff *ntf;
87 
88 	if (!genl_has_listeners(&netdev_nl_family, dev_net(netdev),
89 				NETDEV_NLGRP_MGMT))
90 		return;
91 
92 	genl_info_init_ntf(&info, &netdev_nl_family, cmd);
93 
94 	ntf = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL);
95 	if (!ntf)
96 		return;
97 
98 	if (netdev_nl_dev_fill(netdev, ntf, &info)) {
99 		nlmsg_free(ntf);
100 		return;
101 	}
102 
103 	genlmsg_multicast_netns(&netdev_nl_family, dev_net(netdev), ntf,
104 				0, NETDEV_NLGRP_MGMT, GFP_KERNEL);
105 }
106 
107 int netdev_nl_dev_get_doit(struct sk_buff *skb, struct genl_info *info)
108 {
109 	struct net_device *netdev;
110 	struct sk_buff *rsp;
111 	u32 ifindex;
112 	int err;
113 
114 	if (GENL_REQ_ATTR_CHECK(info, NETDEV_A_DEV_IFINDEX))
115 		return -EINVAL;
116 
117 	ifindex = nla_get_u32(info->attrs[NETDEV_A_DEV_IFINDEX]);
118 
119 	rsp = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL);
120 	if (!rsp)
121 		return -ENOMEM;
122 
123 	rtnl_lock();
124 
125 	netdev = __dev_get_by_index(genl_info_net(info), ifindex);
126 	if (netdev)
127 		err = netdev_nl_dev_fill(netdev, rsp, info);
128 	else
129 		err = -ENODEV;
130 
131 	rtnl_unlock();
132 
133 	if (err)
134 		goto err_free_msg;
135 
136 	return genlmsg_reply(rsp, info);
137 
138 err_free_msg:
139 	nlmsg_free(rsp);
140 	return err;
141 }
142 
143 int netdev_nl_dev_get_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
144 {
145 	struct netdev_nl_dump_ctx *ctx = netdev_dump_ctx(cb);
146 	struct net *net = sock_net(skb->sk);
147 	struct net_device *netdev;
148 	int err = 0;
149 
150 	rtnl_lock();
151 	for_each_netdev_dump(net, netdev, ctx->ifindex) {
152 		err = netdev_nl_dev_fill(netdev, skb, genl_info_dump(cb));
153 		if (err < 0)
154 			break;
155 	}
156 	rtnl_unlock();
157 
158 	return err;
159 }
160 
161 static int
162 netdev_nl_napi_fill_one(struct sk_buff *rsp, struct napi_struct *napi,
163 			const struct genl_info *info)
164 {
165 	unsigned long irq_suspend_timeout;
166 	unsigned long gro_flush_timeout;
167 	u32 napi_defer_hard_irqs;
168 	void *hdr;
169 	pid_t pid;
170 
171 	if (!napi->dev->up)
172 		return 0;
173 
174 	hdr = genlmsg_iput(rsp, info);
175 	if (!hdr)
176 		return -EMSGSIZE;
177 
178 	if (nla_put_u32(rsp, NETDEV_A_NAPI_ID, napi->napi_id))
179 		goto nla_put_failure;
180 
181 	if (nla_put_u32(rsp, NETDEV_A_NAPI_IFINDEX, napi->dev->ifindex))
182 		goto nla_put_failure;
183 
184 	if (napi->irq >= 0 && nla_put_u32(rsp, NETDEV_A_NAPI_IRQ, napi->irq))
185 		goto nla_put_failure;
186 
187 	if (napi->thread) {
188 		pid = task_pid_nr(napi->thread);
189 		if (nla_put_u32(rsp, NETDEV_A_NAPI_PID, pid))
190 			goto nla_put_failure;
191 	}
192 
193 	napi_defer_hard_irqs = napi_get_defer_hard_irqs(napi);
194 	if (nla_put_s32(rsp, NETDEV_A_NAPI_DEFER_HARD_IRQS,
195 			napi_defer_hard_irqs))
196 		goto nla_put_failure;
197 
198 	irq_suspend_timeout = napi_get_irq_suspend_timeout(napi);
199 	if (nla_put_uint(rsp, NETDEV_A_NAPI_IRQ_SUSPEND_TIMEOUT,
200 			 irq_suspend_timeout))
201 		goto nla_put_failure;
202 
203 	gro_flush_timeout = napi_get_gro_flush_timeout(napi);
204 	if (nla_put_uint(rsp, NETDEV_A_NAPI_GRO_FLUSH_TIMEOUT,
205 			 gro_flush_timeout))
206 		goto nla_put_failure;
207 
208 	genlmsg_end(rsp, hdr);
209 
210 	return 0;
211 
212 nla_put_failure:
213 	genlmsg_cancel(rsp, hdr);
214 	return -EMSGSIZE;
215 }
216 
217 int netdev_nl_napi_get_doit(struct sk_buff *skb, struct genl_info *info)
218 {
219 	struct napi_struct *napi;
220 	struct sk_buff *rsp;
221 	u32 napi_id;
222 	int err;
223 
224 	if (GENL_REQ_ATTR_CHECK(info, NETDEV_A_NAPI_ID))
225 		return -EINVAL;
226 
227 	napi_id = nla_get_u32(info->attrs[NETDEV_A_NAPI_ID]);
228 
229 	rsp = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL);
230 	if (!rsp)
231 		return -ENOMEM;
232 
233 	napi = netdev_napi_by_id_lock(genl_info_net(info), napi_id);
234 	if (napi) {
235 		err = netdev_nl_napi_fill_one(rsp, napi, info);
236 		netdev_unlock(napi->dev);
237 	} else {
238 		NL_SET_BAD_ATTR(info->extack, info->attrs[NETDEV_A_NAPI_ID]);
239 		err = -ENOENT;
240 	}
241 
242 	if (err) {
243 		goto err_free_msg;
244 	} else if (!rsp->len) {
245 		err = -ENOENT;
246 		goto err_free_msg;
247 	}
248 
249 	return genlmsg_reply(rsp, info);
250 
251 err_free_msg:
252 	nlmsg_free(rsp);
253 	return err;
254 }
255 
256 static int
257 netdev_nl_napi_dump_one(struct net_device *netdev, struct sk_buff *rsp,
258 			const struct genl_info *info,
259 			struct netdev_nl_dump_ctx *ctx)
260 {
261 	struct napi_struct *napi;
262 	unsigned int prev_id;
263 	int err = 0;
264 
265 	if (!netdev->up)
266 		return err;
267 
268 	prev_id = UINT_MAX;
269 	list_for_each_entry(napi, &netdev->napi_list, dev_list) {
270 		if (!napi_id_valid(napi->napi_id))
271 			continue;
272 
273 		/* Dump continuation below depends on the list being sorted */
274 		WARN_ON_ONCE(napi->napi_id >= prev_id);
275 		prev_id = napi->napi_id;
276 
277 		if (ctx->napi_id && napi->napi_id >= ctx->napi_id)
278 			continue;
279 
280 		err = netdev_nl_napi_fill_one(rsp, napi, info);
281 		if (err)
282 			return err;
283 		ctx->napi_id = napi->napi_id;
284 	}
285 	return err;
286 }
287 
288 int netdev_nl_napi_get_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
289 {
290 	struct netdev_nl_dump_ctx *ctx = netdev_dump_ctx(cb);
291 	const struct genl_info *info = genl_info_dump(cb);
292 	struct net *net = sock_net(skb->sk);
293 	struct net_device *netdev;
294 	u32 ifindex = 0;
295 	int err = 0;
296 
297 	if (info->attrs[NETDEV_A_NAPI_IFINDEX])
298 		ifindex = nla_get_u32(info->attrs[NETDEV_A_NAPI_IFINDEX]);
299 
300 	if (ifindex) {
301 		netdev = netdev_get_by_index_lock(net, ifindex);
302 		if (netdev) {
303 			err = netdev_nl_napi_dump_one(netdev, skb, info, ctx);
304 			netdev_unlock(netdev);
305 		} else {
306 			err = -ENODEV;
307 		}
308 	} else {
309 		for_each_netdev_lock_scoped(net, netdev, ctx->ifindex) {
310 			err = netdev_nl_napi_dump_one(netdev, skb, info, ctx);
311 			if (err < 0)
312 				break;
313 			ctx->napi_id = 0;
314 		}
315 	}
316 
317 	return err;
318 }
319 
320 static int
321 netdev_nl_napi_set_config(struct napi_struct *napi, struct genl_info *info)
322 {
323 	u64 irq_suspend_timeout = 0;
324 	u64 gro_flush_timeout = 0;
325 	u32 defer = 0;
326 
327 	if (info->attrs[NETDEV_A_NAPI_DEFER_HARD_IRQS]) {
328 		defer = nla_get_u32(info->attrs[NETDEV_A_NAPI_DEFER_HARD_IRQS]);
329 		napi_set_defer_hard_irqs(napi, defer);
330 	}
331 
332 	if (info->attrs[NETDEV_A_NAPI_IRQ_SUSPEND_TIMEOUT]) {
333 		irq_suspend_timeout = nla_get_uint(info->attrs[NETDEV_A_NAPI_IRQ_SUSPEND_TIMEOUT]);
334 		napi_set_irq_suspend_timeout(napi, irq_suspend_timeout);
335 	}
336 
337 	if (info->attrs[NETDEV_A_NAPI_GRO_FLUSH_TIMEOUT]) {
338 		gro_flush_timeout = nla_get_uint(info->attrs[NETDEV_A_NAPI_GRO_FLUSH_TIMEOUT]);
339 		napi_set_gro_flush_timeout(napi, gro_flush_timeout);
340 	}
341 
342 	return 0;
343 }
344 
345 int netdev_nl_napi_set_doit(struct sk_buff *skb, struct genl_info *info)
346 {
347 	struct napi_struct *napi;
348 	unsigned int napi_id;
349 	int err;
350 
351 	if (GENL_REQ_ATTR_CHECK(info, NETDEV_A_NAPI_ID))
352 		return -EINVAL;
353 
354 	napi_id = nla_get_u32(info->attrs[NETDEV_A_NAPI_ID]);
355 
356 	napi = netdev_napi_by_id_lock(genl_info_net(info), napi_id);
357 	if (napi) {
358 		err = netdev_nl_napi_set_config(napi, info);
359 		netdev_unlock(napi->dev);
360 	} else {
361 		NL_SET_BAD_ATTR(info->extack, info->attrs[NETDEV_A_NAPI_ID]);
362 		err = -ENOENT;
363 	}
364 
365 	return err;
366 }
367 
368 static int nla_put_napi_id(struct sk_buff *skb, const struct napi_struct *napi)
369 {
370 	if (napi && napi_id_valid(napi->napi_id))
371 		return nla_put_u32(skb, NETDEV_A_QUEUE_NAPI_ID, napi->napi_id);
372 	return 0;
373 }
374 
375 static int
376 netdev_nl_queue_fill_one(struct sk_buff *rsp, struct net_device *netdev,
377 			 u32 q_idx, u32 q_type, const struct genl_info *info)
378 {
379 	struct pp_memory_provider_params *params;
380 	struct netdev_rx_queue *rxq;
381 	struct netdev_queue *txq;
382 	void *hdr;
383 
384 	hdr = genlmsg_iput(rsp, info);
385 	if (!hdr)
386 		return -EMSGSIZE;
387 
388 	if (nla_put_u32(rsp, NETDEV_A_QUEUE_ID, q_idx) ||
389 	    nla_put_u32(rsp, NETDEV_A_QUEUE_TYPE, q_type) ||
390 	    nla_put_u32(rsp, NETDEV_A_QUEUE_IFINDEX, netdev->ifindex))
391 		goto nla_put_failure;
392 
393 	switch (q_type) {
394 	case NETDEV_QUEUE_TYPE_RX:
395 		rxq = __netif_get_rx_queue(netdev, q_idx);
396 		if (nla_put_napi_id(rsp, rxq->napi))
397 			goto nla_put_failure;
398 
399 		params = &rxq->mp_params;
400 		if (params->mp_ops &&
401 		    params->mp_ops->nl_fill(params->mp_priv, rsp, rxq))
402 			goto nla_put_failure;
403 #ifdef CONFIG_XDP_SOCKETS
404 		if (rxq->pool)
405 			if (nla_put_empty_nest(rsp, NETDEV_A_QUEUE_XSK))
406 				goto nla_put_failure;
407 #endif
408 
409 		break;
410 	case NETDEV_QUEUE_TYPE_TX:
411 		txq = netdev_get_tx_queue(netdev, q_idx);
412 		if (nla_put_napi_id(rsp, txq->napi))
413 			goto nla_put_failure;
414 #ifdef CONFIG_XDP_SOCKETS
415 		if (txq->pool)
416 			if (nla_put_empty_nest(rsp, NETDEV_A_QUEUE_XSK))
417 				goto nla_put_failure;
418 #endif
419 		break;
420 	}
421 
422 	genlmsg_end(rsp, hdr);
423 
424 	return 0;
425 
426 nla_put_failure:
427 	genlmsg_cancel(rsp, hdr);
428 	return -EMSGSIZE;
429 }
430 
431 static int netdev_nl_queue_validate(struct net_device *netdev, u32 q_id,
432 				    u32 q_type)
433 {
434 	switch (q_type) {
435 	case NETDEV_QUEUE_TYPE_RX:
436 		if (q_id >= netdev->real_num_rx_queues)
437 			return -EINVAL;
438 		return 0;
439 	case NETDEV_QUEUE_TYPE_TX:
440 		if (q_id >= netdev->real_num_tx_queues)
441 			return -EINVAL;
442 	}
443 	return 0;
444 }
445 
446 static int
447 netdev_nl_queue_fill(struct sk_buff *rsp, struct net_device *netdev, u32 q_idx,
448 		     u32 q_type, const struct genl_info *info)
449 {
450 	int err;
451 
452 	if (!netdev->up)
453 		return -ENOENT;
454 
455 	err = netdev_nl_queue_validate(netdev, q_idx, q_type);
456 	if (err)
457 		return err;
458 
459 	return netdev_nl_queue_fill_one(rsp, netdev, q_idx, q_type, info);
460 }
461 
462 int netdev_nl_queue_get_doit(struct sk_buff *skb, struct genl_info *info)
463 {
464 	u32 q_id, q_type, ifindex;
465 	struct net_device *netdev;
466 	struct sk_buff *rsp;
467 	int err;
468 
469 	if (GENL_REQ_ATTR_CHECK(info, NETDEV_A_QUEUE_ID) ||
470 	    GENL_REQ_ATTR_CHECK(info, NETDEV_A_QUEUE_TYPE) ||
471 	    GENL_REQ_ATTR_CHECK(info, NETDEV_A_QUEUE_IFINDEX))
472 		return -EINVAL;
473 
474 	q_id = nla_get_u32(info->attrs[NETDEV_A_QUEUE_ID]);
475 	q_type = nla_get_u32(info->attrs[NETDEV_A_QUEUE_TYPE]);
476 	ifindex = nla_get_u32(info->attrs[NETDEV_A_QUEUE_IFINDEX]);
477 
478 	rsp = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL);
479 	if (!rsp)
480 		return -ENOMEM;
481 
482 	rtnl_lock();
483 
484 	netdev = netdev_get_by_index_lock(genl_info_net(info), ifindex);
485 	if (netdev) {
486 		err = netdev_nl_queue_fill(rsp, netdev, q_id, q_type, info);
487 		netdev_unlock(netdev);
488 	} else {
489 		err = -ENODEV;
490 	}
491 
492 	rtnl_unlock();
493 
494 	if (err)
495 		goto err_free_msg;
496 
497 	return genlmsg_reply(rsp, info);
498 
499 err_free_msg:
500 	nlmsg_free(rsp);
501 	return err;
502 }
503 
504 static int
505 netdev_nl_queue_dump_one(struct net_device *netdev, struct sk_buff *rsp,
506 			 const struct genl_info *info,
507 			 struct netdev_nl_dump_ctx *ctx)
508 {
509 	int err = 0;
510 
511 	if (!netdev->up)
512 		return err;
513 
514 	for (; ctx->rxq_idx < netdev->real_num_rx_queues; ctx->rxq_idx++) {
515 		err = netdev_nl_queue_fill_one(rsp, netdev, ctx->rxq_idx,
516 					       NETDEV_QUEUE_TYPE_RX, info);
517 		if (err)
518 			return err;
519 	}
520 	for (; ctx->txq_idx < netdev->real_num_tx_queues; ctx->txq_idx++) {
521 		err = netdev_nl_queue_fill_one(rsp, netdev, ctx->txq_idx,
522 					       NETDEV_QUEUE_TYPE_TX, info);
523 		if (err)
524 			return err;
525 	}
526 
527 	return err;
528 }
529 
530 int netdev_nl_queue_get_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
531 {
532 	struct netdev_nl_dump_ctx *ctx = netdev_dump_ctx(cb);
533 	const struct genl_info *info = genl_info_dump(cb);
534 	struct net *net = sock_net(skb->sk);
535 	struct net_device *netdev;
536 	u32 ifindex = 0;
537 	int err = 0;
538 
539 	if (info->attrs[NETDEV_A_QUEUE_IFINDEX])
540 		ifindex = nla_get_u32(info->attrs[NETDEV_A_QUEUE_IFINDEX]);
541 
542 	rtnl_lock();
543 	if (ifindex) {
544 		netdev = netdev_get_by_index_lock(net, ifindex);
545 		if (netdev) {
546 			err = netdev_nl_queue_dump_one(netdev, skb, info, ctx);
547 			netdev_unlock(netdev);
548 		} else {
549 			err = -ENODEV;
550 		}
551 	} else {
552 		for_each_netdev_lock_scoped(net, netdev, ctx->ifindex) {
553 			err = netdev_nl_queue_dump_one(netdev, skb, info, ctx);
554 			if (err < 0)
555 				break;
556 			ctx->rxq_idx = 0;
557 			ctx->txq_idx = 0;
558 		}
559 	}
560 	rtnl_unlock();
561 
562 	return err;
563 }
564 
/* Marks a counter as not reported: all bits set, which is the value every
 * u64 field holds after the memset(..., 0xff, ...) pre-fill used on the
 * stats structs in this file.
 */
#define NETDEV_STAT_NOT_SET		(~0ULL)
566 
567 static void netdev_nl_stats_add(void *_sum, const void *_add, size_t size)
568 {
569 	const u64 *add = _add;
570 	u64 *sum = _sum;
571 
572 	while (size) {
573 		if (*add != NETDEV_STAT_NOT_SET && *sum != NETDEV_STAT_NOT_SET)
574 			*sum += *add;
575 		sum++;
576 		add++;
577 		size -= 8;
578 	}
579 }
580 
581 static int netdev_stat_put(struct sk_buff *rsp, unsigned int attr_id, u64 value)
582 {
583 	if (value == NETDEV_STAT_NOT_SET)
584 		return 0;
585 	return nla_put_uint(rsp, attr_id, value);
586 }
587 
588 static int
589 netdev_nl_stats_write_rx(struct sk_buff *rsp, struct netdev_queue_stats_rx *rx)
590 {
591 	if (netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_PACKETS, rx->packets) ||
592 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_BYTES, rx->bytes) ||
593 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_ALLOC_FAIL, rx->alloc_fail) ||
594 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_HW_DROPS, rx->hw_drops) ||
595 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_HW_DROP_OVERRUNS, rx->hw_drop_overruns) ||
596 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_CSUM_COMPLETE, rx->csum_complete) ||
597 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_CSUM_UNNECESSARY, rx->csum_unnecessary) ||
598 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_CSUM_NONE, rx->csum_none) ||
599 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_CSUM_BAD, rx->csum_bad) ||
600 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_HW_GRO_PACKETS, rx->hw_gro_packets) ||
601 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_HW_GRO_BYTES, rx->hw_gro_bytes) ||
602 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_HW_GRO_WIRE_PACKETS, rx->hw_gro_wire_packets) ||
603 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_HW_GRO_WIRE_BYTES, rx->hw_gro_wire_bytes) ||
604 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_RX_HW_DROP_RATELIMITS, rx->hw_drop_ratelimits))
605 		return -EMSGSIZE;
606 	return 0;
607 }
608 
609 static int
610 netdev_nl_stats_write_tx(struct sk_buff *rsp, struct netdev_queue_stats_tx *tx)
611 {
612 	if (netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_PACKETS, tx->packets) ||
613 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_BYTES, tx->bytes) ||
614 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_HW_DROPS, tx->hw_drops) ||
615 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_HW_DROP_ERRORS, tx->hw_drop_errors) ||
616 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_CSUM_NONE, tx->csum_none) ||
617 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_NEEDS_CSUM, tx->needs_csum) ||
618 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_HW_GSO_PACKETS, tx->hw_gso_packets) ||
619 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_HW_GSO_BYTES, tx->hw_gso_bytes) ||
620 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_HW_GSO_WIRE_PACKETS, tx->hw_gso_wire_packets) ||
621 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_HW_GSO_WIRE_BYTES, tx->hw_gso_wire_bytes) ||
622 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_HW_DROP_RATELIMITS, tx->hw_drop_ratelimits) ||
623 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_STOP, tx->stop) ||
624 	    netdev_stat_put(rsp, NETDEV_A_QSTATS_TX_WAKE, tx->wake))
625 		return -EMSGSIZE;
626 	return 0;
627 }
628 
629 static int
630 netdev_nl_stats_queue(struct net_device *netdev, struct sk_buff *rsp,
631 		      u32 q_type, int i, const struct genl_info *info)
632 {
633 	const struct netdev_stat_ops *ops = netdev->stat_ops;
634 	struct netdev_queue_stats_rx rx;
635 	struct netdev_queue_stats_tx tx;
636 	void *hdr;
637 
638 	hdr = genlmsg_iput(rsp, info);
639 	if (!hdr)
640 		return -EMSGSIZE;
641 	if (nla_put_u32(rsp, NETDEV_A_QSTATS_IFINDEX, netdev->ifindex) ||
642 	    nla_put_u32(rsp, NETDEV_A_QSTATS_QUEUE_TYPE, q_type) ||
643 	    nla_put_u32(rsp, NETDEV_A_QSTATS_QUEUE_ID, i))
644 		goto nla_put_failure;
645 
646 	switch (q_type) {
647 	case NETDEV_QUEUE_TYPE_RX:
648 		memset(&rx, 0xff, sizeof(rx));
649 		ops->get_queue_stats_rx(netdev, i, &rx);
650 		if (!memchr_inv(&rx, 0xff, sizeof(rx)))
651 			goto nla_cancel;
652 		if (netdev_nl_stats_write_rx(rsp, &rx))
653 			goto nla_put_failure;
654 		break;
655 	case NETDEV_QUEUE_TYPE_TX:
656 		memset(&tx, 0xff, sizeof(tx));
657 		ops->get_queue_stats_tx(netdev, i, &tx);
658 		if (!memchr_inv(&tx, 0xff, sizeof(tx)))
659 			goto nla_cancel;
660 		if (netdev_nl_stats_write_tx(rsp, &tx))
661 			goto nla_put_failure;
662 		break;
663 	}
664 
665 	genlmsg_end(rsp, hdr);
666 	return 0;
667 
668 nla_cancel:
669 	genlmsg_cancel(rsp, hdr);
670 	return 0;
671 nla_put_failure:
672 	genlmsg_cancel(rsp, hdr);
673 	return -EMSGSIZE;
674 }
675 
676 static int
677 netdev_nl_stats_by_queue(struct net_device *netdev, struct sk_buff *rsp,
678 			 const struct genl_info *info,
679 			 struct netdev_nl_dump_ctx *ctx)
680 {
681 	const struct netdev_stat_ops *ops = netdev->stat_ops;
682 	int i, err;
683 
684 	if (!(netdev->flags & IFF_UP))
685 		return 0;
686 
687 	i = ctx->rxq_idx;
688 	while (ops->get_queue_stats_rx && i < netdev->real_num_rx_queues) {
689 		err = netdev_nl_stats_queue(netdev, rsp, NETDEV_QUEUE_TYPE_RX,
690 					    i, info);
691 		if (err)
692 			return err;
693 		ctx->rxq_idx = ++i;
694 	}
695 	i = ctx->txq_idx;
696 	while (ops->get_queue_stats_tx && i < netdev->real_num_tx_queues) {
697 		err = netdev_nl_stats_queue(netdev, rsp, NETDEV_QUEUE_TYPE_TX,
698 					    i, info);
699 		if (err)
700 			return err;
701 		ctx->txq_idx = ++i;
702 	}
703 
704 	ctx->rxq_idx = 0;
705 	ctx->txq_idx = 0;
706 	return 0;
707 }
708 
709 static int
710 netdev_nl_stats_by_netdev(struct net_device *netdev, struct sk_buff *rsp,
711 			  const struct genl_info *info)
712 {
713 	struct netdev_queue_stats_rx rx_sum, rx;
714 	struct netdev_queue_stats_tx tx_sum, tx;
715 	const struct netdev_stat_ops *ops;
716 	void *hdr;
717 	int i;
718 
719 	ops = netdev->stat_ops;
720 	/* Netdev can't guarantee any complete counters */
721 	if (!ops->get_base_stats)
722 		return 0;
723 
724 	memset(&rx_sum, 0xff, sizeof(rx_sum));
725 	memset(&tx_sum, 0xff, sizeof(tx_sum));
726 
727 	ops->get_base_stats(netdev, &rx_sum, &tx_sum);
728 
729 	/* The op was there, but nothing reported, don't bother */
730 	if (!memchr_inv(&rx_sum, 0xff, sizeof(rx_sum)) &&
731 	    !memchr_inv(&tx_sum, 0xff, sizeof(tx_sum)))
732 		return 0;
733 
734 	hdr = genlmsg_iput(rsp, info);
735 	if (!hdr)
736 		return -EMSGSIZE;
737 	if (nla_put_u32(rsp, NETDEV_A_QSTATS_IFINDEX, netdev->ifindex))
738 		goto nla_put_failure;
739 
740 	for (i = 0; i < netdev->real_num_rx_queues; i++) {
741 		memset(&rx, 0xff, sizeof(rx));
742 		if (ops->get_queue_stats_rx)
743 			ops->get_queue_stats_rx(netdev, i, &rx);
744 		netdev_nl_stats_add(&rx_sum, &rx, sizeof(rx));
745 	}
746 	for (i = 0; i < netdev->real_num_tx_queues; i++) {
747 		memset(&tx, 0xff, sizeof(tx));
748 		if (ops->get_queue_stats_tx)
749 			ops->get_queue_stats_tx(netdev, i, &tx);
750 		netdev_nl_stats_add(&tx_sum, &tx, sizeof(tx));
751 	}
752 
753 	if (netdev_nl_stats_write_rx(rsp, &rx_sum) ||
754 	    netdev_nl_stats_write_tx(rsp, &tx_sum))
755 		goto nla_put_failure;
756 
757 	genlmsg_end(rsp, hdr);
758 	return 0;
759 
760 nla_put_failure:
761 	genlmsg_cancel(rsp, hdr);
762 	return -EMSGSIZE;
763 }
764 
765 static int
766 netdev_nl_qstats_get_dump_one(struct net_device *netdev, unsigned int scope,
767 			      struct sk_buff *skb, const struct genl_info *info,
768 			      struct netdev_nl_dump_ctx *ctx)
769 {
770 	if (!netdev->stat_ops)
771 		return 0;
772 
773 	switch (scope) {
774 	case 0:
775 		return netdev_nl_stats_by_netdev(netdev, skb, info);
776 	case NETDEV_QSTATS_SCOPE_QUEUE:
777 		return netdev_nl_stats_by_queue(netdev, skb, info, ctx);
778 	}
779 
780 	return -EINVAL;	/* Should not happen, per netlink policy */
781 }
782 
783 int netdev_nl_qstats_get_dumpit(struct sk_buff *skb,
784 				struct netlink_callback *cb)
785 {
786 	struct netdev_nl_dump_ctx *ctx = netdev_dump_ctx(cb);
787 	const struct genl_info *info = genl_info_dump(cb);
788 	struct net *net = sock_net(skb->sk);
789 	struct net_device *netdev;
790 	unsigned int ifindex;
791 	unsigned int scope;
792 	int err = 0;
793 
794 	scope = 0;
795 	if (info->attrs[NETDEV_A_QSTATS_SCOPE])
796 		scope = nla_get_uint(info->attrs[NETDEV_A_QSTATS_SCOPE]);
797 
798 	ifindex = 0;
799 	if (info->attrs[NETDEV_A_QSTATS_IFINDEX])
800 		ifindex = nla_get_u32(info->attrs[NETDEV_A_QSTATS_IFINDEX]);
801 
802 	rtnl_lock();
803 	if (ifindex) {
804 		netdev = __dev_get_by_index(net, ifindex);
805 		if (netdev && netdev->stat_ops) {
806 			err = netdev_nl_qstats_get_dump_one(netdev, scope, skb,
807 							    info, ctx);
808 		} else {
809 			NL_SET_BAD_ATTR(info->extack,
810 					info->attrs[NETDEV_A_QSTATS_IFINDEX]);
811 			err = netdev ? -EOPNOTSUPP : -ENODEV;
812 		}
813 	} else {
814 		for_each_netdev_dump(net, netdev, ctx->ifindex) {
815 			err = netdev_nl_qstats_get_dump_one(netdev, scope, skb,
816 							    info, ctx);
817 			if (err < 0)
818 				break;
819 		}
820 	}
821 	rtnl_unlock();
822 
823 	return err;
824 }
825 
826 int netdev_nl_bind_rx_doit(struct sk_buff *skb, struct genl_info *info)
827 {
828 	struct nlattr *tb[ARRAY_SIZE(netdev_queue_id_nl_policy)];
829 	struct net_devmem_dmabuf_binding *binding;
830 	struct list_head *sock_binding_list;
831 	u32 ifindex, dmabuf_fd, rxq_idx;
832 	struct net_device *netdev;
833 	struct sk_buff *rsp;
834 	struct nlattr *attr;
835 	int rem, err = 0;
836 	void *hdr;
837 
838 	if (GENL_REQ_ATTR_CHECK(info, NETDEV_A_DEV_IFINDEX) ||
839 	    GENL_REQ_ATTR_CHECK(info, NETDEV_A_DMABUF_FD) ||
840 	    GENL_REQ_ATTR_CHECK(info, NETDEV_A_DMABUF_QUEUES))
841 		return -EINVAL;
842 
843 	ifindex = nla_get_u32(info->attrs[NETDEV_A_DEV_IFINDEX]);
844 	dmabuf_fd = nla_get_u32(info->attrs[NETDEV_A_DMABUF_FD]);
845 
846 	sock_binding_list = genl_sk_priv_get(&netdev_nl_family,
847 					     NETLINK_CB(skb).sk);
848 	if (IS_ERR(sock_binding_list))
849 		return PTR_ERR(sock_binding_list);
850 
851 	rsp = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL);
852 	if (!rsp)
853 		return -ENOMEM;
854 
855 	hdr = genlmsg_iput(rsp, info);
856 	if (!hdr) {
857 		err = -EMSGSIZE;
858 		goto err_genlmsg_free;
859 	}
860 
861 	rtnl_lock();
862 
863 	netdev = __dev_get_by_index(genl_info_net(info), ifindex);
864 	if (!netdev || !netif_device_present(netdev)) {
865 		err = -ENODEV;
866 		goto err_unlock;
867 	}
868 
869 	if (dev_xdp_prog_count(netdev)) {
870 		NL_SET_ERR_MSG(info->extack, "unable to bind dmabuf to device with XDP program attached");
871 		err = -EEXIST;
872 		goto err_unlock;
873 	}
874 
875 	binding = net_devmem_bind_dmabuf(netdev, dmabuf_fd, info->extack);
876 	if (IS_ERR(binding)) {
877 		err = PTR_ERR(binding);
878 		goto err_unlock;
879 	}
880 
881 	nla_for_each_attr_type(attr, NETDEV_A_DMABUF_QUEUES,
882 			       genlmsg_data(info->genlhdr),
883 			       genlmsg_len(info->genlhdr), rem) {
884 		err = nla_parse_nested(
885 			tb, ARRAY_SIZE(netdev_queue_id_nl_policy) - 1, attr,
886 			netdev_queue_id_nl_policy, info->extack);
887 		if (err < 0)
888 			goto err_unbind;
889 
890 		if (NL_REQ_ATTR_CHECK(info->extack, attr, tb, NETDEV_A_QUEUE_ID) ||
891 		    NL_REQ_ATTR_CHECK(info->extack, attr, tb, NETDEV_A_QUEUE_TYPE)) {
892 			err = -EINVAL;
893 			goto err_unbind;
894 		}
895 
896 		if (nla_get_u32(tb[NETDEV_A_QUEUE_TYPE]) != NETDEV_QUEUE_TYPE_RX) {
897 			NL_SET_BAD_ATTR(info->extack, tb[NETDEV_A_QUEUE_TYPE]);
898 			err = -EINVAL;
899 			goto err_unbind;
900 		}
901 
902 		rxq_idx = nla_get_u32(tb[NETDEV_A_QUEUE_ID]);
903 
904 		err = net_devmem_bind_dmabuf_to_queue(netdev, rxq_idx, binding,
905 						      info->extack);
906 		if (err)
907 			goto err_unbind;
908 	}
909 
910 	list_add(&binding->list, sock_binding_list);
911 
912 	nla_put_u32(rsp, NETDEV_A_DMABUF_ID, binding->id);
913 	genlmsg_end(rsp, hdr);
914 
915 	err = genlmsg_reply(rsp, info);
916 	if (err)
917 		goto err_unbind;
918 
919 	rtnl_unlock();
920 
921 	return 0;
922 
923 err_unbind:
924 	net_devmem_unbind_dmabuf(binding);
925 err_unlock:
926 	rtnl_unlock();
927 err_genlmsg_free:
928 	nlmsg_free(rsp);
929 	return err;
930 }
931 
/* Initialise @priv as an empty list.  Presumably this is the per-socket
 * list that netdev_nl_bind_rx_doit() obtains through genl_sk_priv_get() and
 * adds bindings to - confirm against the family definition.
 */
void netdev_nl_sock_priv_init(struct list_head *priv)
{
	INIT_LIST_HEAD(priv);
}
936 
937 void netdev_nl_sock_priv_destroy(struct list_head *priv)
938 {
939 	struct net_devmem_dmabuf_binding *binding;
940 	struct net_devmem_dmabuf_binding *temp;
941 
942 	list_for_each_entry_safe(binding, temp, priv, list) {
943 		rtnl_lock();
944 		net_devmem_unbind_dmabuf(binding);
945 		rtnl_unlock();
946 	}
947 }
948 
949 static int netdev_genl_netdevice_event(struct notifier_block *nb,
950 				       unsigned long event, void *ptr)
951 {
952 	struct net_device *netdev = netdev_notifier_info_to_dev(ptr);
953 
954 	switch (event) {
955 	case NETDEV_REGISTER:
956 		netdev_genl_dev_notify(netdev, NETDEV_CMD_DEV_ADD_NTF);
957 		break;
958 	case NETDEV_UNREGISTER:
959 		netdev_genl_dev_notify(netdev, NETDEV_CMD_DEV_DEL_NTF);
960 		break;
961 	case NETDEV_XDP_FEAT_CHANGE:
962 		netdev_genl_dev_notify(netdev, NETDEV_CMD_DEV_CHANGE_NTF);
963 		break;
964 	}
965 
966 	return NOTIFY_OK;
967 }
968 
/* Notifier block routing netdevice events to netdev_genl_netdevice_event();
 * registered by netdev_genl_init().
 */
static struct notifier_block netdev_genl_nb = {
	.notifier_call	= netdev_genl_netdevice_event,
};
972 
973 static int __init netdev_genl_init(void)
974 {
975 	int err;
976 
977 	err = register_netdevice_notifier(&netdev_genl_nb);
978 	if (err)
979 		return err;
980 
981 	err = genl_register_family(&netdev_nl_family);
982 	if (err)
983 		goto err_unreg_ntf;
984 
985 	return 0;
986 
987 err_unreg_ntf:
988 	unregister_netdevice_notifier(&netdev_genl_nb);
989 	return err;
990 }
991 
992 subsys_initcall(netdev_genl_init);
993