Commit | Line | Data |
---|---|---|
a29a194a PM |
1 | /* |
2 | * net/tipc/ib_media.c: Infiniband bearer support for TIPC | |
3 | * | |
4 | * Copyright (c) 2013 Patrick McHardy <kaber@trash.net> | |
5 | * | |
6 | * Based on eth_media.c, which carries the following copyright notice: | |
7 | * | |
8 | * Copyright (c) 2001-2007, Ericsson AB | |
9 | * Copyright (c) 2005-2008, 2011, Wind River Systems | |
10 | * All rights reserved. | |
11 | * | |
12 | * Redistribution and use in source and binary forms, with or without | |
13 | * modification, are permitted provided that the following conditions are met: | |
14 | * | |
15 | * 1. Redistributions of source code must retain the above copyright | |
16 | * notice, this list of conditions and the following disclaimer. | |
17 | * 2. Redistributions in binary form must reproduce the above copyright | |
18 | * notice, this list of conditions and the following disclaimer in the | |
19 | * documentation and/or other materials provided with the distribution. | |
20 | * 3. Neither the names of the copyright holders nor the names of its | |
21 | * contributors may be used to endorse or promote products derived from | |
22 | * this software without specific prior written permission. | |
23 | * | |
24 | * Alternatively, this software may be distributed under the terms of the | |
25 | * GNU General Public License ("GPL") version 2 as published by the Free | |
26 | * Software Foundation. | |
27 | * | |
28 | * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | |
29 | * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | |
30 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | |
31 | * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE | |
32 | * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | |
33 | * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | |
34 | * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | |
35 | * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | |
36 | * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | |
37 | * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | |
38 | * POSSIBILITY OF SUCH DAMAGE. | |
39 | */ | |
40 | ||
41 | #include <linux/if_infiniband.h> | |
42 | #include "core.h" | |
43 | #include "bearer.h" | |
44 | ||
/* Number of slots in the static ib_bearers[] table (same as MAX_BEARERS). */
#define MAX_IB_BEARERS		MAX_BEARERS
46 | ||
47 | /** | |
48 | * struct ib_bearer - Infiniband bearer data structure | |
49 | * @bearer: ptr to associated "generic" bearer structure | |
50 | * @dev: ptr to associated Infiniband network device | |
51 | * @tipc_packet_type: used in binding TIPC to Infiniband driver | |
52 | * @cleanup: work item used when disabling bearer | |
53 | */ | |
54 | ||
55 | struct ib_bearer { | |
56 | struct tipc_bearer *bearer; | |
57 | struct net_device *dev; | |
58 | struct packet_type tipc_packet_type; | |
59 | struct work_struct setup; | |
60 | struct work_struct cleanup; | |
61 | }; | |
62 | ||
63 | static struct tipc_media ib_media_info; | |
64 | static struct ib_bearer ib_bearers[MAX_IB_BEARERS]; | |
65 | static int ib_started; | |
66 | ||
67 | /** | |
68 | * ib_media_addr_set - initialize Infiniband media address structure | |
69 | * | |
70 | * Media-dependent "value" field stores MAC address in first 6 bytes | |
71 | * and zeroes out the remaining bytes. | |
72 | */ | |
73 | static void ib_media_addr_set(const struct tipc_bearer *tb_ptr, | |
74 | struct tipc_media_addr *a, char *mac) | |
75 | { | |
76 | BUILD_BUG_ON(sizeof(a->value) < INFINIBAND_ALEN); | |
77 | memcpy(a->value, mac, INFINIBAND_ALEN); | |
78 | a->media_id = TIPC_MEDIA_TYPE_IB; | |
79 | a->broadcast = !memcmp(mac, tb_ptr->bcast_addr.value, INFINIBAND_ALEN); | |
80 | } | |
81 | ||
82 | /** | |
83 | * send_msg - send a TIPC message out over an InfiniBand interface | |
84 | */ | |
85 | static int send_msg(struct sk_buff *buf, struct tipc_bearer *tb_ptr, | |
86 | struct tipc_media_addr *dest) | |
87 | { | |
88 | struct sk_buff *clone; | |
89 | struct net_device *dev; | |
90 | int delta; | |
91 | ||
92 | clone = skb_clone(buf, GFP_ATOMIC); | |
93 | if (!clone) | |
94 | return 0; | |
95 | ||
96 | dev = ((struct ib_bearer *)(tb_ptr->usr_handle))->dev; | |
97 | delta = dev->hard_header_len - skb_headroom(buf); | |
98 | ||
99 | if ((delta > 0) && | |
100 | pskb_expand_head(clone, SKB_DATA_ALIGN(delta), 0, GFP_ATOMIC)) { | |
101 | kfree_skb(clone); | |
102 | return 0; | |
103 | } | |
104 | ||
105 | skb_reset_network_header(clone); | |
106 | clone->dev = dev; | |
107 | clone->protocol = htons(ETH_P_TIPC); | |
108 | dev_hard_header(clone, dev, ETH_P_TIPC, dest->value, | |
109 | dev->dev_addr, clone->len); | |
110 | dev_queue_xmit(clone); | |
111 | return 0; | |
112 | } | |
113 | ||
114 | /** | |
115 | * recv_msg - handle incoming TIPC message from an InfiniBand interface | |
116 | * | |
117 | * Accept only packets explicitly sent to this node, or broadcast packets; | |
118 | * ignores packets sent using InfiniBand multicast, and traffic sent to other | |
119 | * nodes (which can happen if interface is running in promiscuous mode). | |
120 | */ | |
121 | static int recv_msg(struct sk_buff *buf, struct net_device *dev, | |
122 | struct packet_type *pt, struct net_device *orig_dev) | |
123 | { | |
124 | struct ib_bearer *ib_ptr = (struct ib_bearer *)pt->af_packet_priv; | |
125 | ||
126 | if (!net_eq(dev_net(dev), &init_net)) { | |
127 | kfree_skb(buf); | |
128 | return 0; | |
129 | } | |
130 | ||
131 | if (likely(ib_ptr->bearer)) { | |
132 | if (likely(buf->pkt_type <= PACKET_BROADCAST)) { | |
133 | buf->next = NULL; | |
134 | tipc_recv_msg(buf, ib_ptr->bearer); | |
135 | return 0; | |
136 | } | |
137 | } | |
138 | kfree_skb(buf); | |
139 | return 0; | |
140 | } | |
141 | ||
142 | /** | |
143 | * setup_bearer - setup association between InfiniBand bearer and interface | |
144 | */ | |
145 | static void setup_bearer(struct work_struct *work) | |
146 | { | |
147 | struct ib_bearer *ib_ptr = | |
148 | container_of(work, struct ib_bearer, setup); | |
149 | ||
150 | dev_add_pack(&ib_ptr->tipc_packet_type); | |
151 | } | |
152 | ||
153 | /** | |
154 | * enable_bearer - attach TIPC bearer to an InfiniBand interface | |
155 | */ | |
156 | static int enable_bearer(struct tipc_bearer *tb_ptr) | |
157 | { | |
2537af9d | 158 | struct net_device *dev; |
a29a194a PM |
159 | struct ib_bearer *ib_ptr = &ib_bearers[0]; |
160 | struct ib_bearer *stop = &ib_bearers[MAX_IB_BEARERS]; | |
161 | char *driver_name = strchr((const char *)tb_ptr->name, ':') + 1; | |
162 | int pending_dev = 0; | |
163 | ||
164 | /* Find unused InfiniBand bearer structure */ | |
165 | while (ib_ptr->dev) { | |
166 | if (!ib_ptr->bearer) | |
167 | pending_dev++; | |
168 | if (++ib_ptr == stop) | |
169 | return pending_dev ? -EAGAIN : -EDQUOT; | |
170 | } | |
171 | ||
172 | /* Find device with specified name */ | |
2537af9d | 173 | dev = dev_get_by_name(&init_net, driver_name); |
a29a194a PM |
174 | if (!dev) |
175 | return -ENODEV; | |
176 | ||
177 | /* Create InfiniBand bearer for device */ | |
178 | ib_ptr->dev = dev; | |
179 | ib_ptr->tipc_packet_type.type = htons(ETH_P_TIPC); | |
180 | ib_ptr->tipc_packet_type.dev = dev; | |
181 | ib_ptr->tipc_packet_type.func = recv_msg; | |
182 | ib_ptr->tipc_packet_type.af_packet_priv = ib_ptr; | |
183 | INIT_LIST_HEAD(&(ib_ptr->tipc_packet_type.list)); | |
184 | INIT_WORK(&ib_ptr->setup, setup_bearer); | |
185 | schedule_work(&ib_ptr->setup); | |
186 | ||
187 | /* Associate TIPC bearer with InfiniBand bearer */ | |
188 | ib_ptr->bearer = tb_ptr; | |
189 | tb_ptr->usr_handle = (void *)ib_ptr; | |
190 | memset(tb_ptr->bcast_addr.value, 0, sizeof(tb_ptr->bcast_addr.value)); | |
191 | memcpy(tb_ptr->bcast_addr.value, dev->broadcast, INFINIBAND_ALEN); | |
192 | tb_ptr->bcast_addr.media_id = TIPC_MEDIA_TYPE_IB; | |
193 | tb_ptr->bcast_addr.broadcast = 1; | |
194 | tb_ptr->mtu = dev->mtu; | |
195 | tb_ptr->blocked = 0; | |
196 | ib_media_addr_set(tb_ptr, &tb_ptr->addr, (char *)dev->dev_addr); | |
197 | return 0; | |
198 | } | |
199 | ||
200 | /** | |
201 | * cleanup_bearer - break association between InfiniBand bearer and interface | |
202 | * | |
203 | * This routine must be invoked from a work queue because it can sleep. | |
204 | */ | |
205 | static void cleanup_bearer(struct work_struct *work) | |
206 | { | |
207 | struct ib_bearer *ib_ptr = | |
208 | container_of(work, struct ib_bearer, cleanup); | |
209 | ||
210 | dev_remove_pack(&ib_ptr->tipc_packet_type); | |
211 | dev_put(ib_ptr->dev); | |
212 | ib_ptr->dev = NULL; | |
213 | } | |
214 | ||
215 | /** | |
216 | * disable_bearer - detach TIPC bearer from an InfiniBand interface | |
217 | * | |
218 | * Mark InfiniBand bearer as inactive so that incoming buffers are thrown away, | |
219 | * then get worker thread to complete bearer cleanup. (Can't do cleanup | |
220 | * here because cleanup code needs to sleep and caller holds spinlocks.) | |
221 | */ | |
222 | static void disable_bearer(struct tipc_bearer *tb_ptr) | |
223 | { | |
224 | struct ib_bearer *ib_ptr = (struct ib_bearer *)tb_ptr->usr_handle; | |
225 | ||
226 | ib_ptr->bearer = NULL; | |
227 | INIT_WORK(&ib_ptr->cleanup, cleanup_bearer); | |
228 | schedule_work(&ib_ptr->cleanup); | |
229 | } | |
230 | ||
231 | /** | |
232 | * recv_notification - handle device updates from OS | |
233 | * | |
234 | * Change the state of the InfiniBand bearer (if any) associated with the | |
235 | * specified device. | |
236 | */ | |
237 | static int recv_notification(struct notifier_block *nb, unsigned long evt, | |
351638e7 | 238 | void *ptr) |
a29a194a | 239 | { |
351638e7 | 240 | struct net_device *dev = netdev_notifier_info_to_dev(ptr); |
a29a194a PM |
241 | struct ib_bearer *ib_ptr = &ib_bearers[0]; |
242 | struct ib_bearer *stop = &ib_bearers[MAX_IB_BEARERS]; | |
243 | ||
244 | if (!net_eq(dev_net(dev), &init_net)) | |
245 | return NOTIFY_DONE; | |
246 | ||
247 | while ((ib_ptr->dev != dev)) { | |
248 | if (++ib_ptr == stop) | |
249 | return NOTIFY_DONE; /* couldn't find device */ | |
250 | } | |
251 | if (!ib_ptr->bearer) | |
252 | return NOTIFY_DONE; /* bearer had been disabled */ | |
253 | ||
254 | ib_ptr->bearer->mtu = dev->mtu; | |
255 | ||
256 | switch (evt) { | |
257 | case NETDEV_CHANGE: | |
258 | if (netif_carrier_ok(dev)) | |
259 | tipc_continue(ib_ptr->bearer); | |
260 | else | |
261 | tipc_block_bearer(ib_ptr->bearer->name); | |
262 | break; | |
263 | case NETDEV_UP: | |
264 | tipc_continue(ib_ptr->bearer); | |
265 | break; | |
266 | case NETDEV_DOWN: | |
267 | tipc_block_bearer(ib_ptr->bearer->name); | |
268 | break; | |
269 | case NETDEV_CHANGEMTU: | |
270 | case NETDEV_CHANGEADDR: | |
271 | tipc_block_bearer(ib_ptr->bearer->name); | |
272 | tipc_continue(ib_ptr->bearer); | |
273 | break; | |
274 | case NETDEV_UNREGISTER: | |
275 | case NETDEV_CHANGENAME: | |
276 | tipc_disable_bearer(ib_ptr->bearer->name); | |
277 | break; | |
278 | } | |
279 | return NOTIFY_OK; | |
280 | } | |
281 | ||
282 | static struct notifier_block notifier = { | |
283 | .notifier_call = recv_notification, | |
284 | .priority = 0, | |
285 | }; | |
286 | ||
287 | /** | |
288 | * ib_addr2str - convert InfiniBand address to string | |
289 | */ | |
290 | static int ib_addr2str(struct tipc_media_addr *a, char *str_buf, int str_size) | |
291 | { | |
292 | if (str_size < 60) /* 60 = 19 * strlen("xx:") + strlen("xx\0") */ | |
293 | return 1; | |
294 | ||
295 | sprintf(str_buf, "%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:" | |
296 | "%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x", | |
297 | a->value[0], a->value[1], a->value[2], a->value[3], | |
298 | a->value[4], a->value[5], a->value[6], a->value[7], | |
299 | a->value[8], a->value[9], a->value[10], a->value[11], | |
300 | a->value[12], a->value[13], a->value[14], a->value[15], | |
301 | a->value[16], a->value[17], a->value[18], a->value[19]); | |
302 | ||
303 | return 0; | |
304 | } | |
305 | ||
306 | /** | |
307 | * ib_addr2msg - convert InfiniBand address format to message header format | |
308 | */ | |
309 | static int ib_addr2msg(struct tipc_media_addr *a, char *msg_area) | |
310 | { | |
311 | memset(msg_area, 0, TIPC_MEDIA_ADDR_SIZE); | |
312 | msg_area[TIPC_MEDIA_TYPE_OFFSET] = TIPC_MEDIA_TYPE_IB; | |
313 | memcpy(msg_area, a->value, INFINIBAND_ALEN); | |
314 | return 0; | |
315 | } | |
316 | ||
/**
 * ib_msg2addr - convert message header address format to InfiniBand format
 * @tb_ptr: bearer the address belongs to
 * @a: media address structure to fill in
 * @msg_area: message header area holding the InfiniBand address
 *
 * Thin wrapper around ib_media_addr_set(); always returns 0.
 */
static int ib_msg2addr(const struct tipc_bearer *tb_ptr,
		       struct tipc_media_addr *a, char *msg_area)
{
	ib_media_addr_set(tb_ptr, a, msg_area);

	return 0;
}
326 | ||
327 | /* | |
328 | * InfiniBand media registration info | |
329 | */ | |
330 | static struct tipc_media ib_media_info = { | |
331 | .send_msg = send_msg, | |
332 | .enable_bearer = enable_bearer, | |
333 | .disable_bearer = disable_bearer, | |
334 | .addr2str = ib_addr2str, | |
335 | .addr2msg = ib_addr2msg, | |
336 | .msg2addr = ib_msg2addr, | |
337 | .priority = TIPC_DEF_LINK_PRI, | |
338 | .tolerance = TIPC_DEF_LINK_TOL, | |
339 | .window = TIPC_DEF_LINK_WIN, | |
340 | .type_id = TIPC_MEDIA_TYPE_IB, | |
341 | .name = "ib" | |
342 | }; | |
343 | ||
344 | /** | |
345 | * tipc_ib_media_start - activate InfiniBand bearer support | |
346 | * | |
347 | * Register InfiniBand media type with TIPC bearer code. Also register | |
348 | * with OS for notifications about device state changes. | |
349 | */ | |
350 | int tipc_ib_media_start(void) | |
351 | { | |
352 | int res; | |
353 | ||
354 | if (ib_started) | |
355 | return -EINVAL; | |
356 | ||
357 | res = tipc_register_media(&ib_media_info); | |
358 | if (res) | |
359 | return res; | |
360 | ||
361 | res = register_netdevice_notifier(¬ifier); | |
362 | if (!res) | |
363 | ib_started = 1; | |
364 | return res; | |
365 | } | |
366 | ||
367 | /** | |
368 | * tipc_ib_media_stop - deactivate InfiniBand bearer support | |
369 | */ | |
370 | void tipc_ib_media_stop(void) | |
371 | { | |
372 | if (!ib_started) | |
373 | return; | |
374 | ||
375 | flush_scheduled_work(); | |
376 | unregister_netdevice_notifier(¬ifier); | |
377 | ib_started = 0; | |
378 | } |