2 * Copyright (c) 2005 Voltaire Inc. All rights reserved.
3 * Copyright (c) 2002-2005, Network Appliance, Inc. All rights reserved.
4 * Copyright (c) 1999-2005, Mellanox Technologies, Inc. All rights reserved.
5 * Copyright (c) 2005 Intel Corporation. All rights reserved.
7 * This software is available to you under a choice of one of two
8 * licenses. You may choose to be licensed under the terms of the GNU
9 * General Public License (GPL) Version 2, available from the file
10 * COPYING in the main directory of this source tree, or the
11 * OpenIB.org BSD license below:
13 * Redistribution and use in source and binary forms, with or
14 * without modification, are permitted provided that the following
17 * - Redistributions of source code must retain the above
18 * copyright notice, this list of conditions and the following
21 * - Redistributions in binary form must reproduce the above
22 * copyright notice, this list of conditions and the following
23 * disclaimer in the documentation and/or other materials
24 * provided with the distribution.
26 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
27 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
28 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
29 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
30 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
31 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
32 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
36 #include <linux/mutex.h>
37 #include <linux/inetdevice.h>
38 #include <linux/workqueue.h>
39 #include <linux/if_arp.h>
41 #include <net/neighbour.h>
42 #include <net/route.h>
43 #include <net/netevent.h>
44 #include <net/addrconf.h>
45 #include <net/ip6_route.h>
46 #include <rdma/ib_addr.h>
48 MODULE_AUTHOR("Sean Hefty");
49 MODULE_DESCRIPTION("IB Address Translation");
50 MODULE_LICENSE("Dual BSD/GPL");
53 struct list_head list
;
54 struct sockaddr_storage src_addr
;
55 struct sockaddr_storage dst_addr
;
56 struct rdma_dev_addr
*addr
;
57 struct rdma_addr_client
*client
;
59 void (*callback
)(int status
, struct sockaddr
*src_addr
,
60 struct rdma_dev_addr
*addr
, void *context
);
61 unsigned long timeout
;
65 static void process_req(struct work_struct
*work
);
67 static DEFINE_MUTEX(lock
);
68 static LIST_HEAD(req_list
);
69 static DECLARE_DELAYED_WORK(work
, process_req
);
70 static struct workqueue_struct
*addr_wq
;
72 void rdma_addr_register_client(struct rdma_addr_client
*client
)
74 atomic_set(&client
->refcount
, 1);
75 init_completion(&client
->comp
);
77 EXPORT_SYMBOL(rdma_addr_register_client
);
79 static inline void put_client(struct rdma_addr_client
*client
)
81 if (atomic_dec_and_test(&client
->refcount
))
82 complete(&client
->comp
);
85 void rdma_addr_unregister_client(struct rdma_addr_client
*client
)
88 wait_for_completion(&client
->comp
);
90 EXPORT_SYMBOL(rdma_addr_unregister_client
);
92 int rdma_copy_addr(struct rdma_dev_addr
*dev_addr
, struct net_device
*dev
,
93 const unsigned char *dst_dev_addr
)
96 case ARPHRD_INFINIBAND
:
97 dev_addr
->dev_type
= RDMA_NODE_IB_CA
;
100 dev_addr
->dev_type
= RDMA_NODE_RNIC
;
103 return -EADDRNOTAVAIL
;
106 memcpy(dev_addr
->src_dev_addr
, dev
->dev_addr
, MAX_ADDR_LEN
);
107 memcpy(dev_addr
->broadcast
, dev
->broadcast
, MAX_ADDR_LEN
);
109 memcpy(dev_addr
->dst_dev_addr
, dst_dev_addr
, MAX_ADDR_LEN
);
110 dev_addr
->src_dev
= dev
;
113 EXPORT_SYMBOL(rdma_copy_addr
);
115 int rdma_translate_ip(struct sockaddr
*addr
, struct rdma_dev_addr
*dev_addr
)
117 struct net_device
*dev
;
118 int ret
= -EADDRNOTAVAIL
;
120 switch (addr
->sa_family
) {
122 dev
= ip_dev_find(&init_net
,
123 ((struct sockaddr_in
*) addr
)->sin_addr
.s_addr
);
128 ret
= rdma_copy_addr(dev_addr
, dev
, NULL
);
132 #if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
134 for_each_netdev(&init_net
, dev
) {
135 if (ipv6_chk_addr(&init_net
,
136 &((struct sockaddr_in6
*) addr
)->sin6_addr
,
138 ret
= rdma_copy_addr(dev_addr
, dev
, NULL
);
147 EXPORT_SYMBOL(rdma_translate_ip
);
149 static void set_timeout(unsigned long time
)
153 cancel_delayed_work(&work
);
155 delay
= time
- jiffies
;
156 if ((long)delay
<= 0)
159 queue_delayed_work(addr_wq
, &work
, delay
);
162 static void queue_req(struct addr_req
*req
)
164 struct addr_req
*temp_req
;
167 list_for_each_entry_reverse(temp_req
, &req_list
, list
) {
168 if (time_after_eq(req
->timeout
, temp_req
->timeout
))
172 list_add(&req
->list
, &temp_req
->list
);
174 if (req_list
.next
== &req
->list
)
175 set_timeout(req
->timeout
);
179 static void addr_send_arp(struct sockaddr
*dst_in
)
184 memset(&fl
, 0, sizeof fl
);
186 switch (dst_in
->sa_family
) {
188 fl
.nl_u
.ip4_u
.daddr
=
189 ((struct sockaddr_in
*) dst_in
)->sin_addr
.s_addr
;
191 if (ip_route_output_key(&init_net
, &rt
, &fl
))
194 neigh_event_send(rt
->u
.dst
.neighbour
, NULL
);
198 #if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
201 struct dst_entry
*dst
;
203 fl
.nl_u
.ip6_u
.daddr
=
204 ((struct sockaddr_in6
*) dst_in
)->sin6_addr
;
206 dst
= ip6_route_output(&init_net
, NULL
, &fl
);
210 neigh_event_send(dst
->neighbour
, NULL
);
218 static int addr4_resolve_remote(struct sockaddr_in
*src_in
,
219 struct sockaddr_in
*dst_in
,
220 struct rdma_dev_addr
*addr
)
222 __be32 src_ip
= src_in
->sin_addr
.s_addr
;
223 __be32 dst_ip
= dst_in
->sin_addr
.s_addr
;
226 struct neighbour
*neigh
;
229 memset(&fl
, 0, sizeof fl
);
230 fl
.nl_u
.ip4_u
.daddr
= dst_ip
;
231 fl
.nl_u
.ip4_u
.saddr
= src_ip
;
232 ret
= ip_route_output_key(&init_net
, &rt
, &fl
);
236 /* If the device does ARP internally, return 'done' */
237 if (rt
->idev
->dev
->flags
& IFF_NOARP
) {
238 rdma_copy_addr(addr
, rt
->idev
->dev
, NULL
);
242 neigh
= neigh_lookup(&arp_tbl
, &rt
->rt_gateway
, rt
->idev
->dev
);
248 if (!(neigh
->nud_state
& NUD_VALID
)) {
254 src_in
->sin_family
= dst_in
->sin_family
;
255 src_in
->sin_addr
.s_addr
= rt
->rt_src
;
258 ret
= rdma_copy_addr(addr
, neigh
->dev
, neigh
->ha
);
260 neigh_release(neigh
);
267 #if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
268 static int addr6_resolve_remote(struct sockaddr_in6
*src_in
,
269 struct sockaddr_in6
*dst_in
,
270 struct rdma_dev_addr
*addr
)
273 struct neighbour
*neigh
;
274 struct dst_entry
*dst
;
277 memset(&fl
, 0, sizeof fl
);
278 fl
.nl_u
.ip6_u
.daddr
= dst_in
->sin6_addr
;
279 fl
.nl_u
.ip6_u
.saddr
= src_in
->sin6_addr
;
281 dst
= ip6_route_output(&init_net
, NULL
, &fl
);
285 if (dst
->dev
->flags
& IFF_NOARP
) {
286 ret
= rdma_copy_addr(addr
, dst
->dev
, NULL
);
288 neigh
= dst
->neighbour
;
289 if (neigh
&& (neigh
->nud_state
& NUD_VALID
))
290 ret
= rdma_copy_addr(addr
, neigh
->dev
, neigh
->ha
);
297 static int addr6_resolve_remote(struct sockaddr_in6
*src_in
,
298 struct sockaddr_in6
*dst_in
,
299 struct rdma_dev_addr
*addr
)
301 return -EADDRNOTAVAIL
;
305 static int addr_resolve_remote(struct sockaddr
*src_in
,
306 struct sockaddr
*dst_in
,
307 struct rdma_dev_addr
*addr
)
309 if (src_in
->sa_family
== AF_INET
) {
310 return addr4_resolve_remote((struct sockaddr_in
*) src_in
,
311 (struct sockaddr_in
*) dst_in
, addr
);
313 return addr6_resolve_remote((struct sockaddr_in6
*) src_in
,
314 (struct sockaddr_in6
*) dst_in
, addr
);
317 static void process_req(struct work_struct
*work
)
319 struct addr_req
*req
, *temp_req
;
320 struct sockaddr
*src_in
, *dst_in
;
321 struct list_head done_list
;
323 INIT_LIST_HEAD(&done_list
);
326 list_for_each_entry_safe(req
, temp_req
, &req_list
, list
) {
327 if (req
->status
== -ENODATA
) {
328 src_in
= (struct sockaddr
*) &req
->src_addr
;
329 dst_in
= (struct sockaddr
*) &req
->dst_addr
;
330 req
->status
= addr_resolve_remote(src_in
, dst_in
,
332 if (req
->status
&& time_after_eq(jiffies
, req
->timeout
))
333 req
->status
= -ETIMEDOUT
;
334 else if (req
->status
== -ENODATA
)
337 list_move_tail(&req
->list
, &done_list
);
340 if (!list_empty(&req_list
)) {
341 req
= list_entry(req_list
.next
, struct addr_req
, list
);
342 set_timeout(req
->timeout
);
346 list_for_each_entry_safe(req
, temp_req
, &done_list
, list
) {
347 list_del(&req
->list
);
348 req
->callback(req
->status
, (struct sockaddr
*) &req
->src_addr
,
349 req
->addr
, req
->context
);
350 put_client(req
->client
);
355 static int addr_resolve_local(struct sockaddr
*src_in
,
356 struct sockaddr
*dst_in
,
357 struct rdma_dev_addr
*addr
)
359 struct net_device
*dev
;
362 switch (dst_in
->sa_family
) {
365 __be32 src_ip
= ((struct sockaddr_in
*) src_in
)->sin_addr
.s_addr
;
366 __be32 dst_ip
= ((struct sockaddr_in
*) dst_in
)->sin_addr
.s_addr
;
368 dev
= ip_dev_find(&init_net
, dst_ip
);
370 return -EADDRNOTAVAIL
;
372 if (ipv4_is_zeronet(src_ip
)) {
373 src_in
->sa_family
= dst_in
->sa_family
;
374 ((struct sockaddr_in
*) src_in
)->sin_addr
.s_addr
= dst_ip
;
375 ret
= rdma_copy_addr(addr
, dev
, dev
->dev_addr
);
376 } else if (ipv4_is_loopback(src_ip
)) {
377 ret
= rdma_translate_ip(dst_in
, addr
);
379 memcpy(addr
->dst_dev_addr
, dev
->dev_addr
, MAX_ADDR_LEN
);
381 ret
= rdma_translate_ip(src_in
, addr
);
383 memcpy(addr
->dst_dev_addr
, dev
->dev_addr
, MAX_ADDR_LEN
);
389 #if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
394 for_each_netdev(&init_net
, dev
)
395 if (ipv6_chk_addr(&init_net
,
396 &((struct sockaddr_in6
*) addr
)->sin6_addr
,
401 return -EADDRNOTAVAIL
;
403 a
= &((struct sockaddr_in6
*) src_in
)->sin6_addr
;
405 if (ipv6_addr_any(a
)) {
406 src_in
->sa_family
= dst_in
->sa_family
;
407 ((struct sockaddr_in6
*) src_in
)->sin6_addr
=
408 ((struct sockaddr_in6
*) dst_in
)->sin6_addr
;
409 ret
= rdma_copy_addr(addr
, dev
, dev
->dev_addr
);
410 } else if (ipv6_addr_loopback(a
)) {
411 ret
= rdma_translate_ip(dst_in
, addr
);
413 memcpy(addr
->dst_dev_addr
, dev
->dev_addr
, MAX_ADDR_LEN
);
415 ret
= rdma_translate_ip(src_in
, addr
);
417 memcpy(addr
->dst_dev_addr
, dev
->dev_addr
, MAX_ADDR_LEN
);
424 ret
= -EADDRNOTAVAIL
;
431 int rdma_resolve_ip(struct rdma_addr_client
*client
,
432 struct sockaddr
*src_addr
, struct sockaddr
*dst_addr
,
433 struct rdma_dev_addr
*addr
, int timeout_ms
,
434 void (*callback
)(int status
, struct sockaddr
*src_addr
,
435 struct rdma_dev_addr
*addr
, void *context
),
438 struct sockaddr
*src_in
, *dst_in
;
439 struct addr_req
*req
;
442 req
= kzalloc(sizeof *req
, GFP_KERNEL
);
447 memcpy(&req
->src_addr
, src_addr
, ip_addr_size(src_addr
));
448 memcpy(&req
->dst_addr
, dst_addr
, ip_addr_size(dst_addr
));
450 req
->callback
= callback
;
451 req
->context
= context
;
452 req
->client
= client
;
453 atomic_inc(&client
->refcount
);
455 src_in
= (struct sockaddr
*) &req
->src_addr
;
456 dst_in
= (struct sockaddr
*) &req
->dst_addr
;
458 req
->status
= addr_resolve_local(src_in
, dst_in
, addr
);
459 if (req
->status
== -EADDRNOTAVAIL
)
460 req
->status
= addr_resolve_remote(src_in
, dst_in
, addr
);
462 switch (req
->status
) {
464 req
->timeout
= jiffies
;
468 req
->timeout
= msecs_to_jiffies(timeout_ms
) + jiffies
;
470 addr_send_arp(dst_in
);
474 atomic_dec(&client
->refcount
);
480 EXPORT_SYMBOL(rdma_resolve_ip
);
482 void rdma_addr_cancel(struct rdma_dev_addr
*addr
)
484 struct addr_req
*req
, *temp_req
;
487 list_for_each_entry_safe(req
, temp_req
, &req_list
, list
) {
488 if (req
->addr
== addr
) {
489 req
->status
= -ECANCELED
;
490 req
->timeout
= jiffies
;
491 list_move(&req
->list
, &req_list
);
492 set_timeout(req
->timeout
);
498 EXPORT_SYMBOL(rdma_addr_cancel
);
500 static int netevent_callback(struct notifier_block
*self
, unsigned long event
,
503 if (event
== NETEVENT_NEIGH_UPDATE
) {
504 struct neighbour
*neigh
= ctx
;
506 if (neigh
->nud_state
& NUD_VALID
) {
507 set_timeout(jiffies
);
513 static struct notifier_block nb
= {
514 .notifier_call
= netevent_callback
517 static int addr_init(void)
519 addr_wq
= create_singlethread_workqueue("ib_addr");
523 register_netevent_notifier(&nb
);
527 static void addr_cleanup(void)
529 unregister_netevent_notifier(&nb
);
530 destroy_workqueue(addr_wq
);
533 module_init(addr_init
);
534 module_exit(addr_cleanup
);