Skip to content

Commit 3d759e9

Browse files
committed
Merge branch 'devlink-code-split-and-structured-instance-walk'
Jakub Kicinski says: ==================== devlink: code split and structured instance walk Split devlink.c into a handful of files, trying to keep the "core" code away from all the command-specific implementations. The core code has been quite scattered until now. Going forward we can consider using a source file per-subobject, I think that it's quite beneficial to newcomers (based on relative ease with which folks contribute to ethtool vs devlink). But this series doesn't split everything out, yet - partially due to backporting concerns, but mostly due to lack of time. Bulk of the netlink command handling is left in a leftover.c file. Introduce a context structure for dumps, and use it to store the devlink instance ID of the last dumped devlink instance. This means we don't have to restart the walk from 0 each time. Finally - introduce a "structured walk". A centralized dump handler in devlink/netlink.c which walks the devlink instances, deals with refcounting/locking, simplifying the per-object implementations quite a bit. Inspired by the ethtool code. v1: https://lore.kernel.org/all/20230104041636.226398-1-kuba@kernel.org/ RFC: https://lore.kernel.org/all/20221215020155.1619839-1-kuba@kernel.org/ ==================== Link: https://lore.kernel.org/r/20230105040531.353563-1-kuba@kernel.org Signed-off-by: Jakub Kicinski <kuba@kernel.org>
2 parents 0da6855 + 5ce76d7 commit 3d759e9

File tree

10 files changed

+1161
-1106
lines changed

10 files changed

+1161
-1106
lines changed

MAINTAINERS

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6099,7 +6099,7 @@ S: Supported
60996099
F: Documentation/networking/devlink
61006100
F: include/net/devlink.h
61016101
F: include/uapi/linux/devlink.h
6102-
F: net/core/devlink.c
6102+
F: net/devlink/
61036103

61046104
DH ELECTRONICS IMX6 DHCOM/DHCOR BOARD SUPPORT
61056105
M: Christoph Niedermaier <cniedermaier@dh-electronics.com>

include/linux/netlink.h

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -263,6 +263,10 @@ struct netlink_callback {
263263
};
264264
};
265265

266+
/*
 * Build-time check that a dump context of type @type_name is no larger than
 * the ctx field of struct netlink_callback. The check is performed with
 * BUILD_BUG_ON().
 */
#define NL_ASSERT_DUMP_CTX_FITS(type_name)				\
	BUILD_BUG_ON(sizeof(type_name) >				\
		     sizeof_field(struct netlink_callback, ctx))

/*
 * Misspelled name ("ASSET" instead of "ASSERT") under which the check was
 * first introduced; kept as an alias so that any user of the old spelling
 * keeps building.
 */
#define NL_ASSET_DUMP_CTX_FITS(type_name)				\
	NL_ASSERT_DUMP_CTX_FITS(type_name)
269+
266270
struct netlink_notify {
267271
struct net *net;
268272
u32 portid;

net/Makefile

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,7 @@ obj-$(CONFIG_BPFILTER) += bpfilter/
2323
obj-$(CONFIG_PACKET) += packet/
2424
obj-$(CONFIG_NET_KEY) += key/
2525
obj-$(CONFIG_BRIDGE) += bridge/
26+
obj-$(CONFIG_NET_DEVLINK) += devlink/
2627
obj-$(CONFIG_NET_DSA) += dsa/
2728
obj-$(CONFIG_ATALK) += appletalk/
2829
obj-$(CONFIG_X25) += x25/

net/core/Makefile

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,6 @@ obj-$(CONFIG_LWTUNNEL) += lwtunnel.o
3333
obj-$(CONFIG_LWTUNNEL_BPF) += lwt_bpf.o
3434
obj-$(CONFIG_DST_CACHE) += dst_cache.o
3535
obj-$(CONFIG_HWBM) += hwbm.o
36-
obj-$(CONFIG_NET_DEVLINK) += devlink.o
3736
obj-$(CONFIG_GRO_CELLS) += gro_cells.o
3837
obj-$(CONFIG_FAILOVER) += failover.o
3938
obj-$(CONFIG_NET_SOCK_MSG) += skmsg.o

net/devlink/Makefile

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
# SPDX-License-Identifier: GPL-2.0
2+
3+
obj-y := leftover.o core.o netlink.o

net/devlink/core.c

Lines changed: 345 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,345 @@
1+
// SPDX-License-Identifier: GPL-2.0-or-later
2+
/*
3+
* Copyright (c) 2016 Mellanox Technologies. All rights reserved.
4+
* Copyright (c) 2016 Jiri Pirko <jiri@mellanox.com>
5+
*/
6+
7+
#include <net/genetlink.h>
8+
9+
#include "devl_internal.h"
10+
11+
/* Global xarray of devlink instances; entries are stored under devlink->index
 * by devlink_alloc_ns() and erased by devlink_free().
 */
DEFINE_XARRAY_FLAGS(devlinks, XA_FLAGS_ALLOC);
12+
13+
void *devlink_priv(struct devlink *devlink)
14+
{
15+
return &devlink->priv;
16+
}
17+
EXPORT_SYMBOL_GPL(devlink_priv);
18+
19+
struct devlink *priv_to_devlink(void *priv)
20+
{
21+
return container_of(priv, struct devlink, priv);
22+
}
23+
EXPORT_SYMBOL_GPL(priv_to_devlink);
24+
25+
struct device *devlink_to_dev(const struct devlink *devlink)
26+
{
27+
return devlink->dev;
28+
}
29+
EXPORT_SYMBOL_GPL(devlink_to_dev);
30+
31+
struct net *devlink_net(const struct devlink *devlink)
32+
{
33+
return read_pnet(&devlink->_net);
34+
}
35+
EXPORT_SYMBOL_GPL(devlink_net);
36+
37+
void devl_assert_locked(struct devlink *devlink)
38+
{
39+
lockdep_assert_held(&devlink->lock);
40+
}
41+
EXPORT_SYMBOL_GPL(devl_assert_locked);
42+
43+
#ifdef CONFIG_LOCKDEP
44+
/* For use in conjunction with LOCKDEP only e.g. rcu_dereference_protected() */
45+
bool devl_lock_is_held(struct devlink *devlink)
46+
{
47+
return lockdep_is_held(&devlink->lock);
48+
}
49+
EXPORT_SYMBOL_GPL(devl_lock_is_held);
50+
#endif
51+
52+
void devl_lock(struct devlink *devlink)
53+
{
54+
mutex_lock(&devlink->lock);
55+
}
56+
EXPORT_SYMBOL_GPL(devl_lock);
57+
58+
int devl_trylock(struct devlink *devlink)
59+
{
60+
return mutex_trylock(&devlink->lock);
61+
}
62+
EXPORT_SYMBOL_GPL(devl_trylock);
63+
64+
void devl_unlock(struct devlink *devlink)
65+
{
66+
mutex_unlock(&devlink->lock);
67+
}
68+
EXPORT_SYMBOL_GPL(devl_unlock);
69+
70+
/* Take a reference on @devlink unless its refcount has already dropped to
 * zero. Returns @devlink on success and NULL otherwise.
 */
struct devlink *__must_check devlink_try_get(struct devlink *devlink)
{
	return refcount_inc_not_zero(&devlink->refcount) ? devlink : NULL;
}
76+
77+
static void __devlink_put_rcu(struct rcu_head *head)
78+
{
79+
struct devlink *devlink = container_of(head, struct devlink, rcu);
80+
81+
complete(&devlink->comp);
82+
}
83+
84+
void devlink_put(struct devlink *devlink)
85+
{
86+
if (refcount_dec_and_test(&devlink->refcount))
87+
/* Make sure unregister operation that may await the completion
88+
* is unblocked only after all users are after the end of
89+
* RCU grace period.
90+
*/
91+
call_rcu(&devlink->rcu, __devlink_put_rcu);
92+
}
93+
94+
struct devlink *
95+
devlinks_xa_find_get(struct net *net, unsigned long *indexp,
96+
void * (*xa_find_fn)(struct xarray *, unsigned long *,
97+
unsigned long, xa_mark_t))
98+
{
99+
struct devlink *devlink;
100+
101+
rcu_read_lock();
102+
retry:
103+
devlink = xa_find_fn(&devlinks, indexp, ULONG_MAX, DEVLINK_REGISTERED);
104+
if (!devlink)
105+
goto unlock;
106+
107+
/* In case devlink_unregister() was already called and "unregistering"
108+
* mark was set, do not allow to get a devlink reference here.
109+
* This prevents live-lock of devlink_unregister() wait for completion.
110+
*/
111+
if (xa_get_mark(&devlinks, *indexp, DEVLINK_UNREGISTERING))
112+
goto retry;
113+
114+
/* For a possible retry, the xa_find_after() should be always used */
115+
xa_find_fn = xa_find_after;
116+
if (!devlink_try_get(devlink))
117+
goto retry;
118+
if (!net_eq(devlink_net(devlink), net)) {
119+
devlink_put(devlink);
120+
goto retry;
121+
}
122+
unlock:
123+
rcu_read_unlock();
124+
return devlink;
125+
}
126+
127+
struct devlink *
128+
devlinks_xa_find_get_first(struct net *net, unsigned long *indexp)
129+
{
130+
return devlinks_xa_find_get(net, indexp, xa_find);
131+
}
132+
133+
struct devlink *
134+
devlinks_xa_find_get_next(struct net *net, unsigned long *indexp)
135+
{
136+
return devlinks_xa_find_get(net, indexp, xa_find_after);
137+
}
138+
139+
/**
140+
* devlink_set_features - Set devlink supported features
141+
*
142+
* @devlink: devlink
143+
* @features: devlink support features
144+
*
145+
* This interface allows us to set reload ops separatelly from
146+
* the devlink_alloc.
147+
*/
148+
void devlink_set_features(struct devlink *devlink, u64 features)
149+
{
150+
ASSERT_DEVLINK_NOT_REGISTERED(devlink);
151+
152+
WARN_ON(features & DEVLINK_F_RELOAD &&
153+
!devlink_reload_supported(devlink->ops));
154+
devlink->features = features;
155+
}
156+
EXPORT_SYMBOL_GPL(devlink_set_features);
157+
158+
/**
159+
* devlink_register - Register devlink instance
160+
*
161+
* @devlink: devlink
162+
*/
163+
void devlink_register(struct devlink *devlink)
164+
{
165+
ASSERT_DEVLINK_NOT_REGISTERED(devlink);
166+
/* Make sure that we are in .probe() routine */
167+
168+
xa_set_mark(&devlinks, devlink->index, DEVLINK_REGISTERED);
169+
devlink_notify_register(devlink);
170+
}
171+
EXPORT_SYMBOL_GPL(devlink_register);
172+
173+
/**
174+
* devlink_unregister - Unregister devlink instance
175+
*
176+
* @devlink: devlink
177+
*/
178+
void devlink_unregister(struct devlink *devlink)
179+
{
180+
ASSERT_DEVLINK_REGISTERED(devlink);
181+
/* Make sure that we are in .remove() routine */
182+
183+
xa_set_mark(&devlinks, devlink->index, DEVLINK_UNREGISTERING);
184+
devlink_put(devlink);
185+
wait_for_completion(&devlink->comp);
186+
187+
devlink_notify_unregister(devlink);
188+
xa_clear_mark(&devlinks, devlink->index, DEVLINK_REGISTERED);
189+
xa_clear_mark(&devlinks, devlink->index, DEVLINK_UNREGISTERING);
190+
}
191+
EXPORT_SYMBOL_GPL(devlink_unregister);
192+
193+
/**
194+
* devlink_alloc_ns - Allocate new devlink instance resources
195+
* in specific namespace
196+
*
197+
* @ops: ops
198+
* @priv_size: size of user private data
199+
* @net: net namespace
200+
* @dev: parent device
201+
*
202+
* Allocate new devlink instance resources, including devlink index
203+
* and name.
204+
*/
205+
struct devlink *devlink_alloc_ns(const struct devlink_ops *ops,
206+
size_t priv_size, struct net *net,
207+
struct device *dev)
208+
{
209+
struct devlink *devlink;
210+
static u32 last_id;
211+
int ret;
212+
213+
WARN_ON(!ops || !dev);
214+
if (!devlink_reload_actions_valid(ops))
215+
return NULL;
216+
217+
devlink = kzalloc(sizeof(*devlink) + priv_size, GFP_KERNEL);
218+
if (!devlink)
219+
return NULL;
220+
221+
ret = xa_alloc_cyclic(&devlinks, &devlink->index, devlink, xa_limit_31b,
222+
&last_id, GFP_KERNEL);
223+
if (ret < 0)
224+
goto err_xa_alloc;
225+
226+
devlink->netdevice_nb.notifier_call = devlink_port_netdevice_event;
227+
ret = register_netdevice_notifier_net(net, &devlink->netdevice_nb);
228+
if (ret)
229+
goto err_register_netdevice_notifier;
230+
231+
devlink->dev = dev;
232+
devlink->ops = ops;
233+
xa_init_flags(&devlink->ports, XA_FLAGS_ALLOC);
234+
xa_init_flags(&devlink->snapshot_ids, XA_FLAGS_ALLOC);
235+
write_pnet(&devlink->_net, net);
236+
INIT_LIST_HEAD(&devlink->rate_list);
237+
INIT_LIST_HEAD(&devlink->linecard_list);
238+
INIT_LIST_HEAD(&devlink->sb_list);
239+
INIT_LIST_HEAD_RCU(&devlink->dpipe_table_list);
240+
INIT_LIST_HEAD(&devlink->resource_list);
241+
INIT_LIST_HEAD(&devlink->param_list);
242+
INIT_LIST_HEAD(&devlink->region_list);
243+
INIT_LIST_HEAD(&devlink->reporter_list);
244+
INIT_LIST_HEAD(&devlink->trap_list);
245+
INIT_LIST_HEAD(&devlink->trap_group_list);
246+
INIT_LIST_HEAD(&devlink->trap_policer_list);
247+
lockdep_register_key(&devlink->lock_key);
248+
mutex_init(&devlink->lock);
249+
lockdep_set_class(&devlink->lock, &devlink->lock_key);
250+
mutex_init(&devlink->reporters_lock);
251+
mutex_init(&devlink->linecards_lock);
252+
refcount_set(&devlink->refcount, 1);
253+
init_completion(&devlink->comp);
254+
255+
return devlink;
256+
257+
err_register_netdevice_notifier:
258+
xa_erase(&devlinks, devlink->index);
259+
err_xa_alloc:
260+
kfree(devlink);
261+
return NULL;
262+
}
263+
EXPORT_SYMBOL_GPL(devlink_alloc_ns);
264+
265+
/**
266+
* devlink_free - Free devlink instance resources
267+
*
268+
* @devlink: devlink
269+
*/
270+
void devlink_free(struct devlink *devlink)
271+
{
272+
ASSERT_DEVLINK_NOT_REGISTERED(devlink);
273+
274+
mutex_destroy(&devlink->linecards_lock);
275+
mutex_destroy(&devlink->reporters_lock);
276+
mutex_destroy(&devlink->lock);
277+
lockdep_unregister_key(&devlink->lock_key);
278+
WARN_ON(!list_empty(&devlink->trap_policer_list));
279+
WARN_ON(!list_empty(&devlink->trap_group_list));
280+
WARN_ON(!list_empty(&devlink->trap_list));
281+
WARN_ON(!list_empty(&devlink->reporter_list));
282+
WARN_ON(!list_empty(&devlink->region_list));
283+
WARN_ON(!list_empty(&devlink->param_list));
284+
WARN_ON(!list_empty(&devlink->resource_list));
285+
WARN_ON(!list_empty(&devlink->dpipe_table_list));
286+
WARN_ON(!list_empty(&devlink->sb_list));
287+
WARN_ON(!list_empty(&devlink->rate_list));
288+
WARN_ON(!list_empty(&devlink->linecard_list));
289+
WARN_ON(!xa_empty(&devlink->ports));
290+
291+
xa_destroy(&devlink->snapshot_ids);
292+
xa_destroy(&devlink->ports);
293+
294+
WARN_ON_ONCE(unregister_netdevice_notifier_net(devlink_net(devlink),
295+
&devlink->netdevice_nb));
296+
297+
xa_erase(&devlinks, devlink->index);
298+
299+
kfree(devlink);
300+
}
301+
EXPORT_SYMBOL_GPL(devlink_free);
302+
303+
/* pre_exit handler for a network namespace: every registered devlink
 * instance found in @net is reloaded into init_net.
 */
static void __net_exit devlink_pernet_pre_exit(struct net *net)
{
	unsigned long index;
	struct devlink *devlink;
	u32 actions_performed;
	int err;

	/* The iterator hands out each instance with a reference held; it is
	 * dropped at the bottom of the loop body.
	 */
	devlinks_xa_for_each_registered_get(net, index, devlink) {
		WARN_ON(!(devlink->features & DEVLINK_F_RELOAD));

		devl_lock(devlink);
		err = devlink_reload(devlink, &init_net,
				     DEVLINK_RELOAD_ACTION_DRIVER_REINIT,
				     DEVLINK_RELOAD_LIMIT_UNSPEC,
				     &actions_performed, NULL);
		devl_unlock(devlink);

		/* -EOPNOTSUPP is not reported as a failure. */
		if (err && err != -EOPNOTSUPP)
			pr_warn("Failed to reload devlink instance into init_net\n");

		devlink_put(devlink);
	}
}
326+
327+
/* Per-network-namespace operations registered by devlink_init(); only the
 * pre_exit hook is set.
 */
static struct pernet_operations devlink_pernet_ops __net_initdata = {
328+
.pre_exit = devlink_pernet_pre_exit,
329+
};
330+
331+
/* Subsystem init: register the devlink generic netlink family and the
 * per-namespace operations.
 *
 * Returns 0 on success or the error of the step that failed. A failure
 * also triggers a WARN. If the per-namespace registration fails, the
 * already registered netlink family is unregistered again so that no
 * half-initialised state is left behind.
 */
static int __init devlink_init(void)
{
	int err;

	err = genl_register_family(&devlink_nl_family);
	if (err)
		goto out;

	err = register_pernet_subsys(&devlink_pernet_ops);
	if (err)
		goto out_unreg_family;

	return 0;

out_unreg_family:
	genl_unregister_family(&devlink_nl_family);
out:
	WARN_ON(err);
	return err;
}
344+
345+
subsys_initcall(devlink_init);

0 commit comments

Comments
 (0)