xref: /linux/include/net/mctp.h (revision 1771c8c9e65a20128f93df107353a5f4cb91546a)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 /*
3  * Management Component Transport Protocol (MCTP)
4  *
5  * Copyright (c) 2021 Code Construct
6  * Copyright (c) 2021 Google
7  */
8 
9 #ifndef __NET_MCTP_H
10 #define __NET_MCTP_H
11 
12 #include <linux/bits.h>
13 #include <linux/mctp.h>
14 #include <linux/netdevice.h>
15 #include <net/net_namespace.h>
16 #include <net/sock.h>
17 
18 /* MCTP packet definitions */
19 struct mctp_hdr {
20 	u8	ver;
21 	u8	dest;
22 	u8	src;
23 	u8	flags_seq_tag;
24 };
25 
26 #define MCTP_VER_MIN	1
27 #define MCTP_VER_MAX	1
28 
29 /* Definitions for flags_seq_tag field */
30 #define MCTP_HDR_FLAG_SOM	BIT(7)
31 #define MCTP_HDR_FLAG_EOM	BIT(6)
32 #define MCTP_HDR_FLAG_TO	BIT(3)
33 #define MCTP_HDR_FLAGS		GENMASK(5, 3)
34 #define MCTP_HDR_SEQ_SHIFT	4
35 #define MCTP_HDR_SEQ_MASK	GENMASK(1, 0)
36 #define MCTP_HDR_TAG_SHIFT	0
37 #define MCTP_HDR_TAG_MASK	GENMASK(2, 0)
38 
39 #define MCTP_INITIAL_DEFAULT_NET	1
40 
41 static inline bool mctp_address_unicast(mctp_eid_t eid)
42 {
43 	return eid >= 8 && eid < 255;
44 }
45 
46 static inline bool mctp_address_broadcast(mctp_eid_t eid)
47 {
48 	return eid == 255;
49 }
50 
51 static inline bool mctp_address_null(mctp_eid_t eid)
52 {
53 	return eid == 0;
54 }
55 
56 static inline bool mctp_address_matches(mctp_eid_t match, mctp_eid_t eid)
57 {
58 	return match == eid || match == MCTP_ADDR_ANY;
59 }
60 
61 static inline struct mctp_hdr *mctp_hdr(struct sk_buff *skb)
62 {
63 	return (struct mctp_hdr *)skb_network_header(skb);
64 }
65 
66 /* socket implementation */
67 struct mctp_sock {
68 	struct sock	sk;
69 
70 	/* bind() params */
71 	unsigned int	bind_net;
72 	mctp_eid_t	bind_addr;
73 	__u8		bind_type;
74 
75 	/* sendmsg()/recvmsg() uses struct sockaddr_mctp_ext */
76 	bool		addr_ext;
77 
78 	/* list of mctp_sk_key, for incoming tag lookup. updates protected
79 	 * by sk->net->keys_lock
80 	 */
81 	struct hlist_head keys;
82 
83 	/* mechanism for expiring allocated keys; will release an allocated
84 	 * tag, and any netdev state for a request/response pairing
85 	 */
86 	struct timer_list key_expiry;
87 };
88 
89 /* Key for matching incoming packets to sockets or reassembly contexts.
90  * Packets are matched on (src,dest,tag).
91  *
92  * Lifetime / locking requirements:
93  *
94  *  - individual key data (ie, the struct itself) is protected by key->lock;
95  *    changes must be made with that lock held.
96  *
97  *  - the lookup fields: peer_addr, local_addr and tag are set before the
98  *    key is added to lookup lists, and never updated.
99  *
100  *  - A ref to the key must be held (throuh key->refs) if a pointer to the
101  *    key is to be accessed after key->lock is released.
102  *
103  *  - a mctp_sk_key contains a reference to a struct sock; this is valid
104  *    for the life of the key. On sock destruction (through unhash), the key is
105  *    removed from lists (see below), and marked invalid.
106  *
107  * - these mctp_sk_keys appear on two lists:
108  *     1) the struct mctp_sock->keys list
109  *     2) the struct netns_mctp->keys list
110  *
111  *   presences on these lists requires a (single) refcount to be held; both
112  *   lists are updated as a single operation.
113  *
114  *   Updates and lookups in either list are performed under the
115  *   netns_mctp->keys lock. Lookup functions will need to lock the key and
116  *   take a reference before unlocking the keys_lock. Consequently, the list's
117  *   keys_lock *cannot* be acquired with the individual key->lock held.
118  *
119  * - a key may have a sk_buff attached as part of an in-progress message
120  *   reassembly (->reasm_head). The reasm data is protected by the individual
121  *   key->lock.
122  *
123  * - there are two destruction paths for a mctp_sk_key:
124  *
125  *    - through socket unhash (see mctp_sk_unhash). This performs the list
126  *      removal under keys_lock.
127  *
128  *    - where a key is established to receive a reply message: after receiving
129  *      the (complete) reply, or during reassembly errors. Here, we clean up
130  *      the reassembly context (marking reasm_dead, to prevent another from
131  *      starting), and remove the socket from the netns & socket lists.
132  *
133  *    - through an expiry timeout, on a per-socket timer
134  */
135 struct mctp_sk_key {
136 	mctp_eid_t	peer_addr;
137 	mctp_eid_t	local_addr; /* MCTP_ADDR_ANY for local owned tags */
138 	__u8		tag; /* incoming tag match; invert TO for local */
139 
140 	/* we hold a ref to sk when set */
141 	struct sock	*sk;
142 
143 	/* routing lookup list */
144 	struct hlist_node hlist;
145 
146 	/* per-socket list */
147 	struct hlist_node sklist;
148 
149 	/* lock protects against concurrent updates to the reassembly and
150 	 * expiry data below.
151 	 */
152 	spinlock_t	lock;
153 
154 	/* Keys are referenced during the output path, which may sleep */
155 	refcount_t	refs;
156 
157 	/* incoming fragment reassembly context */
158 	struct sk_buff	*reasm_head;
159 	struct sk_buff	**reasm_tailp;
160 	bool		reasm_dead;
161 	u8		last_seq;
162 
163 	/* key validity */
164 	bool		valid;
165 
166 	/* expiry timeout; valid (above) cleared on expiry */
167 	unsigned long	expiry;
168 
169 	/* free to use for device flow state tracking. Initialised to
170 	 * zero on initial key creation
171 	 */
172 	unsigned long	dev_flow_state;
173 	struct mctp_dev	*dev;
174 
175 	/* a tag allocated with SIOCMCTPALLOCTAG ioctl will not expire
176 	 * automatically on timeout or response, instead SIOCMCTPDROPTAG
177 	 * is used.
178 	 */
179 	bool		manual_alloc;
180 };
181 
182 struct mctp_skb_cb {
183 	unsigned int	magic;
184 	unsigned int	net;
185 	int		ifindex; /* extended/direct addressing if set */
186 	mctp_eid_t	src;
187 	unsigned char	halen;
188 	unsigned char	haddr[MAX_ADDR_LEN];
189 };
190 
191 /* skb control-block accessors with a little extra debugging for initial
192  * development.
193  *
194  * TODO: remove checks & mctp_skb_cb->magic; replace callers of __mctp_cb
195  * with mctp_cb().
196  *
197  * __mctp_cb() is only for the initial ingress code; we should see ->magic set
198  * at all times after this.
199  */
200 static inline struct mctp_skb_cb *__mctp_cb(struct sk_buff *skb)
201 {
202 	struct mctp_skb_cb *cb = (void *)skb->cb;
203 
204 	cb->magic = 0x4d435450;
205 	return cb;
206 }
207 
208 static inline struct mctp_skb_cb *mctp_cb(struct sk_buff *skb)
209 {
210 	struct mctp_skb_cb *cb = (void *)skb->cb;
211 
212 	BUILD_BUG_ON(sizeof(struct mctp_skb_cb) > sizeof(skb->cb));
213 	WARN_ON(cb->magic != 0x4d435450);
214 	return (void *)(skb->cb);
215 }
216 
217 /* If CONFIG_MCTP_FLOWS, we may add one of these as a SKB extension,
218  * indicating the flow to the device driver.
219  */
220 struct mctp_flow {
221 	struct mctp_sk_key *key;
222 };
223 
224 /* Route definition.
225  *
226  * These are held in the pernet->mctp.routes list, with RCU protection for
227  * removed routes. We hold a reference to the netdev; routes need to be
228  * dropped on NETDEV_UNREGISTER events.
229  *
230  * Updates to the route table are performed under rtnl; all reads under RCU,
231  * so routes cannot be referenced over a RCU grace period. Specifically: A
232  * caller cannot block between mctp_route_lookup and mctp_route_release()
233  */
234 struct mctp_route {
235 	mctp_eid_t		min, max;
236 
237 	struct mctp_dev		*dev;
238 	unsigned int		mtu;
239 	unsigned char		type;
240 	int			(*output)(struct mctp_route *route,
241 					  struct sk_buff *skb);
242 
243 	struct list_head	list;
244 	refcount_t		refs;
245 	struct rcu_head		rcu;
246 };
247 
248 /* route interfaces */
249 struct mctp_route *mctp_route_lookup(struct net *net, unsigned int dnet,
250 				     mctp_eid_t daddr);
251 
252 int mctp_local_output(struct sock *sk, struct mctp_route *rt,
253 		      struct sk_buff *skb, mctp_eid_t daddr, u8 req_tag);
254 
255 void mctp_key_unref(struct mctp_sk_key *key);
256 struct mctp_sk_key *mctp_alloc_local_tag(struct mctp_sock *msk,
257 					 mctp_eid_t daddr, mctp_eid_t saddr,
258 					 bool manual, u8 *tagp);
259 
260 /* routing <--> device interface */
261 unsigned int mctp_default_net(struct net *net);
262 int mctp_default_net_set(struct net *net, unsigned int index);
263 int mctp_route_add_local(struct mctp_dev *mdev, mctp_eid_t addr);
264 int mctp_route_remove_local(struct mctp_dev *mdev, mctp_eid_t addr);
265 void mctp_route_remove_dev(struct mctp_dev *mdev);
266 
267 /* neighbour definitions */
268 enum mctp_neigh_source {
269 	MCTP_NEIGH_STATIC,
270 	MCTP_NEIGH_DISCOVER,
271 };
272 
273 struct mctp_neigh {
274 	struct mctp_dev		*dev;
275 	mctp_eid_t		eid;
276 	enum mctp_neigh_source	source;
277 
278 	unsigned char		ha[MAX_ADDR_LEN];
279 
280 	struct list_head	list;
281 	struct rcu_head		rcu;
282 };
283 
284 int mctp_neigh_init(void);
285 void mctp_neigh_exit(void);
286 
287 // ret_hwaddr may be NULL, otherwise must have space for MAX_ADDR_LEN
288 int mctp_neigh_lookup(struct mctp_dev *dev, mctp_eid_t eid,
289 		      void *ret_hwaddr);
290 void mctp_neigh_remove_dev(struct mctp_dev *mdev);
291 
292 int mctp_routes_init(void);
293 void mctp_routes_exit(void);
294 
295 void mctp_device_init(void);
296 void mctp_device_exit(void);
297 
298 #endif /* __NET_MCTP_H */
299