// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * inet_diag.c	Module for monitoring INET transport protocols sockets.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 */
8 #include <linux/kernel.h>
9 #include <linux/module.h>
10 #include <linux/types.h>
11 #include <linux/fcntl.h>
12 #include <linux/random.h>
13 #include <linux/slab.h>
14 #include <linux/cache.h>
15 #include <linux/init.h>
16 #include <linux/time.h>
21 #include <net/inet_common.h>
22 #include <net/inet_connection_sock.h>
23 #include <net/inet_hashtables.h>
24 #include <net/inet_timewait_sock.h>
25 #include <net/inet6_hashtables.h>
26 #include <net/netlink.h>
28 #include <linux/inet.h>
29 #include <linux/stddef.h>
31 #include <linux/inet_diag.h>
32 #include <linux/sock_diag.h>
/*
 * Table of registered handlers, indexed by protocol number.  It is allocated
 * with IPPROTO_MAX slots in inet_diag_init() and its entries are set and
 * cleared under inet_diag_table_mutex.
 */
static const struct inet_diag_handler **inet_diag_table;
36 struct inet_diag_entry
{
/*
 * Protects inet_diag_table.  inet_diag_lock_handler() acquires it and
 * inet_diag_unlock_handler() releases it.
 */
static DEFINE_MUTEX(inet_diag_table_mutex);
49 static const struct inet_diag_handler
*inet_diag_lock_handler(int proto
)
51 if (!inet_diag_table
[proto
])
52 sock_load_diag_module(AF_INET
, proto
);
54 mutex_lock(&inet_diag_table_mutex
);
55 if (!inet_diag_table
[proto
])
56 return ERR_PTR(-ENOENT
);
58 return inet_diag_table
[proto
];
61 static void inet_diag_unlock_handler(const struct inet_diag_handler
*handler
)
63 mutex_unlock(&inet_diag_table_mutex
);
66 void inet_diag_msg_common_fill(struct inet_diag_msg
*r
, struct sock
*sk
)
68 r
->idiag_family
= sk
->sk_family
;
70 r
->id
.idiag_sport
= htons(sk
->sk_num
);
71 r
->id
.idiag_dport
= sk
->sk_dport
;
72 r
->id
.idiag_if
= sk
->sk_bound_dev_if
;
73 sock_diag_save_cookie(sk
, r
->id
.idiag_cookie
);
75 #if IS_ENABLED(CONFIG_IPV6)
76 if (sk
->sk_family
== AF_INET6
) {
77 *(struct in6_addr
*)r
->id
.idiag_src
= sk
->sk_v6_rcv_saddr
;
78 *(struct in6_addr
*)r
->id
.idiag_dst
= sk
->sk_v6_daddr
;
82 memset(&r
->id
.idiag_src
, 0, sizeof(r
->id
.idiag_src
));
83 memset(&r
->id
.idiag_dst
, 0, sizeof(r
->id
.idiag_dst
));
85 r
->id
.idiag_src
[0] = sk
->sk_rcv_saddr
;
86 r
->id
.idiag_dst
[0] = sk
->sk_daddr
;
89 EXPORT_SYMBOL_GPL(inet_diag_msg_common_fill
);
91 static size_t inet_sk_attr_size(struct sock
*sk
,
92 const struct inet_diag_req_v2
*req
,
95 const struct inet_diag_handler
*handler
;
98 handler
= inet_diag_table
[req
->sdiag_protocol
];
99 if (handler
&& handler
->idiag_get_aux_size
)
100 aux
= handler
->idiag_get_aux_size(sk
, net_admin
);
102 return nla_total_size(sizeof(struct tcp_info
))
103 + nla_total_size(1) /* INET_DIAG_SHUTDOWN */
104 + nla_total_size(1) /* INET_DIAG_TOS */
105 + nla_total_size(1) /* INET_DIAG_TCLASS */
106 + nla_total_size(4) /* INET_DIAG_MARK */
107 + nla_total_size(4) /* INET_DIAG_CLASS_ID */
108 + nla_total_size(sizeof(struct inet_diag_meminfo
))
109 + nla_total_size(sizeof(struct inet_diag_msg
))
110 + nla_total_size(SK_MEMINFO_VARS
* sizeof(u32
))
111 + nla_total_size(TCP_CA_NAME_MAX
)
112 + nla_total_size(sizeof(struct tcpvegas_info
))
117 int inet_diag_msg_attrs_fill(struct sock
*sk
, struct sk_buff
*skb
,
118 struct inet_diag_msg
*r
, int ext
,
119 struct user_namespace
*user_ns
,
122 const struct inet_sock
*inet
= inet_sk(sk
);
124 if (nla_put_u8(skb
, INET_DIAG_SHUTDOWN
, sk
->sk_shutdown
))
127 /* IPv6 dual-stack sockets use inet->tos for IPv4 connections,
128 * hence this needs to be included regardless of socket family.
130 if (ext
& (1 << (INET_DIAG_TOS
- 1)))
131 if (nla_put_u8(skb
, INET_DIAG_TOS
, inet
->tos
) < 0)
134 #if IS_ENABLED(CONFIG_IPV6)
135 if (r
->idiag_family
== AF_INET6
) {
136 if (ext
& (1 << (INET_DIAG_TCLASS
- 1)))
137 if (nla_put_u8(skb
, INET_DIAG_TCLASS
,
138 inet6_sk(sk
)->tclass
) < 0)
141 if (((1 << sk
->sk_state
) & (TCPF_LISTEN
| TCPF_CLOSE
)) &&
142 nla_put_u8(skb
, INET_DIAG_SKV6ONLY
, ipv6_only_sock(sk
)))
147 if (net_admin
&& nla_put_u32(skb
, INET_DIAG_MARK
, sk
->sk_mark
))
150 r
->idiag_uid
= from_kuid_munged(user_ns
, sock_i_uid(sk
));
151 r
->idiag_inode
= sock_i_ino(sk
);
157 EXPORT_SYMBOL_GPL(inet_diag_msg_attrs_fill
);
159 int inet_sk_diag_fill(struct sock
*sk
, struct inet_connection_sock
*icsk
,
160 struct sk_buff
*skb
, const struct inet_diag_req_v2
*req
,
161 struct user_namespace
*user_ns
,
162 u32 portid
, u32 seq
, u16 nlmsg_flags
,
163 const struct nlmsghdr
*unlh
,
166 const struct tcp_congestion_ops
*ca_ops
;
167 const struct inet_diag_handler
*handler
;
168 int ext
= req
->idiag_ext
;
169 struct inet_diag_msg
*r
;
170 struct nlmsghdr
*nlh
;
174 handler
= inet_diag_table
[req
->sdiag_protocol
];
177 nlh
= nlmsg_put(skb
, portid
, seq
, unlh
->nlmsg_type
, sizeof(*r
),
183 BUG_ON(!sk_fullsock(sk
));
185 inet_diag_msg_common_fill(r
, sk
);
186 r
->idiag_state
= sk
->sk_state
;
188 r
->idiag_retrans
= 0;
190 if (inet_diag_msg_attrs_fill(sk
, skb
, r
, ext
, user_ns
, net_admin
))
193 if (ext
& (1 << (INET_DIAG_MEMINFO
- 1))) {
194 struct inet_diag_meminfo minfo
= {
195 .idiag_rmem
= sk_rmem_alloc_get(sk
),
196 .idiag_wmem
= sk
->sk_wmem_queued
,
197 .idiag_fmem
= sk
->sk_forward_alloc
,
198 .idiag_tmem
= sk_wmem_alloc_get(sk
),
201 if (nla_put(skb
, INET_DIAG_MEMINFO
, sizeof(minfo
), &minfo
) < 0)
205 if (ext
& (1 << (INET_DIAG_SKMEMINFO
- 1)))
206 if (sock_diag_put_meminfo(sk
, skb
, INET_DIAG_SKMEMINFO
))
210 * RAW sockets might have user-defined protocols assigned,
211 * so report the one supplied on socket creation.
213 if (sk
->sk_type
== SOCK_RAW
) {
214 if (nla_put_u8(skb
, INET_DIAG_PROTOCOL
, sk
->sk_protocol
))
219 handler
->idiag_get_info(sk
, r
, NULL
);
223 if (icsk
->icsk_pending
== ICSK_TIME_RETRANS
||
224 icsk
->icsk_pending
== ICSK_TIME_REO_TIMEOUT
||
225 icsk
->icsk_pending
== ICSK_TIME_LOSS_PROBE
) {
227 r
->idiag_retrans
= icsk
->icsk_retransmits
;
229 jiffies_to_msecs(icsk
->icsk_timeout
- jiffies
);
230 } else if (icsk
->icsk_pending
== ICSK_TIME_PROBE0
) {
232 r
->idiag_retrans
= icsk
->icsk_probes_out
;
234 jiffies_to_msecs(icsk
->icsk_timeout
- jiffies
);
235 } else if (timer_pending(&sk
->sk_timer
)) {
237 r
->idiag_retrans
= icsk
->icsk_probes_out
;
239 jiffies_to_msecs(sk
->sk_timer
.expires
- jiffies
);
242 r
->idiag_expires
= 0;
245 if ((ext
& (1 << (INET_DIAG_INFO
- 1))) && handler
->idiag_info_size
) {
246 attr
= nla_reserve_64bit(skb
, INET_DIAG_INFO
,
247 handler
->idiag_info_size
,
252 info
= nla_data(attr
);
255 if (ext
& (1 << (INET_DIAG_CONG
- 1))) {
259 ca_ops
= READ_ONCE(icsk
->icsk_ca_ops
);
261 err
= nla_put_string(skb
, INET_DIAG_CONG
, ca_ops
->name
);
267 handler
->idiag_get_info(sk
, r
, info
);
269 if (ext
& (1 << (INET_DIAG_INFO
- 1)) && handler
->idiag_get_aux
)
270 if (handler
->idiag_get_aux(sk
, net_admin
, skb
) < 0)
273 if (sk
->sk_state
< TCP_TIME_WAIT
) {
274 union tcp_cc_info info
;
279 ca_ops
= READ_ONCE(icsk
->icsk_ca_ops
);
280 if (ca_ops
&& ca_ops
->get_info
)
281 sz
= ca_ops
->get_info(sk
, ext
, &attr
, &info
);
283 if (sz
&& nla_put(skb
, attr
, sz
, &info
) < 0)
287 if (ext
& (1 << (INET_DIAG_CLASS_ID
- 1)) ||
288 ext
& (1 << (INET_DIAG_TCLASS
- 1))) {
291 #ifdef CONFIG_SOCK_CGROUP_DATA
292 classid
= sock_cgroup_classid(&sk
->sk_cgrp_data
);
294 /* Fallback to socket priority if class id isn't set.
295 * Classful qdiscs use it as direct reference to class.
296 * For cgroup2 classid is always zero.
299 classid
= sk
->sk_priority
;
301 if (nla_put_u32(skb
, INET_DIAG_CLASS_ID
, classid
))
310 nlmsg_cancel(skb
, nlh
);
313 EXPORT_SYMBOL_GPL(inet_sk_diag_fill
);
315 static int inet_csk_diag_fill(struct sock
*sk
,
317 const struct inet_diag_req_v2
*req
,
318 struct user_namespace
*user_ns
,
319 u32 portid
, u32 seq
, u16 nlmsg_flags
,
320 const struct nlmsghdr
*unlh
,
323 return inet_sk_diag_fill(sk
, inet_csk(sk
), skb
, req
, user_ns
,
324 portid
, seq
, nlmsg_flags
, unlh
, net_admin
);
327 static int inet_twsk_diag_fill(struct sock
*sk
,
329 u32 portid
, u32 seq
, u16 nlmsg_flags
,
330 const struct nlmsghdr
*unlh
)
332 struct inet_timewait_sock
*tw
= inet_twsk(sk
);
333 struct inet_diag_msg
*r
;
334 struct nlmsghdr
*nlh
;
337 nlh
= nlmsg_put(skb
, portid
, seq
, unlh
->nlmsg_type
, sizeof(*r
),
343 BUG_ON(tw
->tw_state
!= TCP_TIME_WAIT
);
345 tmo
= tw
->tw_timer
.expires
- jiffies
;
349 inet_diag_msg_common_fill(r
, sk
);
350 r
->idiag_retrans
= 0;
352 r
->idiag_state
= tw
->tw_substate
;
354 r
->idiag_expires
= jiffies_to_msecs(tmo
);
364 static int inet_req_diag_fill(struct sock
*sk
, struct sk_buff
*skb
,
365 u32 portid
, u32 seq
, u16 nlmsg_flags
,
366 const struct nlmsghdr
*unlh
, bool net_admin
)
368 struct request_sock
*reqsk
= inet_reqsk(sk
);
369 struct inet_diag_msg
*r
;
370 struct nlmsghdr
*nlh
;
373 nlh
= nlmsg_put(skb
, portid
, seq
, unlh
->nlmsg_type
, sizeof(*r
),
379 inet_diag_msg_common_fill(r
, sk
);
380 r
->idiag_state
= TCP_SYN_RECV
;
382 r
->idiag_retrans
= reqsk
->num_retrans
;
384 BUILD_BUG_ON(offsetof(struct inet_request_sock
, ir_cookie
) !=
385 offsetof(struct sock
, sk_cookie
));
387 tmo
= inet_reqsk(sk
)->rsk_timer
.expires
- jiffies
;
388 r
->idiag_expires
= (tmo
>= 0) ? jiffies_to_msecs(tmo
) : 0;
394 if (net_admin
&& nla_put_u32(skb
, INET_DIAG_MARK
,
395 inet_rsk(reqsk
)->ir_mark
))
402 static int sk_diag_fill(struct sock
*sk
, struct sk_buff
*skb
,
403 const struct inet_diag_req_v2
*r
,
404 struct user_namespace
*user_ns
,
405 u32 portid
, u32 seq
, u16 nlmsg_flags
,
406 const struct nlmsghdr
*unlh
, bool net_admin
)
408 if (sk
->sk_state
== TCP_TIME_WAIT
)
409 return inet_twsk_diag_fill(sk
, skb
, portid
, seq
,
412 if (sk
->sk_state
== TCP_NEW_SYN_RECV
)
413 return inet_req_diag_fill(sk
, skb
, portid
, seq
,
414 nlmsg_flags
, unlh
, net_admin
);
416 return inet_csk_diag_fill(sk
, skb
, r
, user_ns
, portid
, seq
,
417 nlmsg_flags
, unlh
, net_admin
);
420 struct sock
*inet_diag_find_one_icsk(struct net
*net
,
421 struct inet_hashinfo
*hashinfo
,
422 const struct inet_diag_req_v2
*req
)
427 if (req
->sdiag_family
== AF_INET
)
428 sk
= inet_lookup(net
, hashinfo
, NULL
, 0, req
->id
.idiag_dst
[0],
429 req
->id
.idiag_dport
, req
->id
.idiag_src
[0],
430 req
->id
.idiag_sport
, req
->id
.idiag_if
);
431 #if IS_ENABLED(CONFIG_IPV6)
432 else if (req
->sdiag_family
== AF_INET6
) {
433 if (ipv6_addr_v4mapped((struct in6_addr
*)req
->id
.idiag_dst
) &&
434 ipv6_addr_v4mapped((struct in6_addr
*)req
->id
.idiag_src
))
435 sk
= inet_lookup(net
, hashinfo
, NULL
, 0, req
->id
.idiag_dst
[3],
436 req
->id
.idiag_dport
, req
->id
.idiag_src
[3],
437 req
->id
.idiag_sport
, req
->id
.idiag_if
);
439 sk
= inet6_lookup(net
, hashinfo
, NULL
, 0,
440 (struct in6_addr
*)req
->id
.idiag_dst
,
442 (struct in6_addr
*)req
->id
.idiag_src
,
449 return ERR_PTR(-EINVAL
);
453 return ERR_PTR(-ENOENT
);
455 if (sock_diag_check_cookie(sk
, req
->id
.idiag_cookie
)) {
457 return ERR_PTR(-ENOENT
);
462 EXPORT_SYMBOL_GPL(inet_diag_find_one_icsk
);
464 int inet_diag_dump_one_icsk(struct inet_hashinfo
*hashinfo
,
465 struct sk_buff
*in_skb
,
466 const struct nlmsghdr
*nlh
,
467 const struct inet_diag_req_v2
*req
)
469 bool net_admin
= netlink_net_capable(in_skb
, CAP_NET_ADMIN
);
470 struct net
*net
= sock_net(in_skb
->sk
);
475 sk
= inet_diag_find_one_icsk(net
, hashinfo
, req
);
479 rep
= nlmsg_new(inet_sk_attr_size(sk
, req
, net_admin
), GFP_KERNEL
);
485 err
= sk_diag_fill(sk
, rep
, req
,
486 sk_user_ns(NETLINK_CB(in_skb
).sk
),
487 NETLINK_CB(in_skb
).portid
,
488 nlh
->nlmsg_seq
, 0, nlh
, net_admin
);
490 WARN_ON(err
== -EMSGSIZE
);
494 err
= netlink_unicast(net
->diag_nlsk
, rep
, NETLINK_CB(in_skb
).portid
,
505 EXPORT_SYMBOL_GPL(inet_diag_dump_one_icsk
);
507 static int inet_diag_cmd_exact(int cmd
, struct sk_buff
*in_skb
,
508 const struct nlmsghdr
*nlh
,
509 const struct inet_diag_req_v2
*req
)
511 const struct inet_diag_handler
*handler
;
514 handler
= inet_diag_lock_handler(req
->sdiag_protocol
);
516 err
= PTR_ERR(handler
);
517 else if (cmd
== SOCK_DIAG_BY_FAMILY
)
518 err
= handler
->dump_one(in_skb
, nlh
, req
);
519 else if (cmd
== SOCK_DESTROY
&& handler
->destroy
)
520 err
= handler
->destroy(in_skb
, req
);
523 inet_diag_unlock_handler(handler
);
528 static int bitstring_match(const __be32
*a1
, const __be32
*a2
, int bits
)
530 int words
= bits
>> 5;
535 if (memcmp(a1
, a2
, words
<< 2))
545 mask
= htonl((0xffffffff) << (32 - bits
));
547 if ((w1
^ w2
) & mask
)
554 static int inet_diag_bc_run(const struct nlattr
*_bc
,
555 const struct inet_diag_entry
*entry
)
557 const void *bc
= nla_data(_bc
);
558 int len
= nla_len(_bc
);
562 const struct inet_diag_bc_op
*op
= bc
;
565 case INET_DIAG_BC_NOP
:
567 case INET_DIAG_BC_JMP
:
570 case INET_DIAG_BC_S_EQ
:
571 yes
= entry
->sport
== op
[1].no
;
573 case INET_DIAG_BC_S_GE
:
574 yes
= entry
->sport
>= op
[1].no
;
576 case INET_DIAG_BC_S_LE
:
577 yes
= entry
->sport
<= op
[1].no
;
579 case INET_DIAG_BC_D_EQ
:
580 yes
= entry
->dport
== op
[1].no
;
582 case INET_DIAG_BC_D_GE
:
583 yes
= entry
->dport
>= op
[1].no
;
585 case INET_DIAG_BC_D_LE
:
586 yes
= entry
->dport
<= op
[1].no
;
588 case INET_DIAG_BC_AUTO
:
589 yes
= !(entry
->userlocks
& SOCK_BINDPORT_LOCK
);
591 case INET_DIAG_BC_S_COND
:
592 case INET_DIAG_BC_D_COND
: {
593 const struct inet_diag_hostcond
*cond
;
596 cond
= (const struct inet_diag_hostcond
*)(op
+ 1);
597 if (cond
->port
!= -1 &&
598 cond
->port
!= (op
->code
== INET_DIAG_BC_S_COND
?
599 entry
->sport
: entry
->dport
)) {
604 if (op
->code
== INET_DIAG_BC_S_COND
)
609 if (cond
->family
!= AF_UNSPEC
&&
610 cond
->family
!= entry
->family
) {
611 if (entry
->family
== AF_INET6
&&
612 cond
->family
== AF_INET
) {
613 if (addr
[0] == 0 && addr
[1] == 0 &&
614 addr
[2] == htonl(0xffff) &&
615 bitstring_match(addr
+ 3,
624 if (cond
->prefix_len
== 0)
626 if (bitstring_match(addr
, cond
->addr
,
632 case INET_DIAG_BC_DEV_COND
: {
635 ifindex
= *((const u32
*)(op
+ 1));
636 if (ifindex
!= entry
->ifindex
)
640 case INET_DIAG_BC_MARK_COND
: {
641 struct inet_diag_markcond
*cond
;
643 cond
= (struct inet_diag_markcond
*)(op
+ 1);
644 if ((entry
->mark
& cond
->mask
) != cond
->mark
)
661 /* This helper is available for all sockets (ESTABLISH, TIMEWAIT, SYN_RECV)
663 static void entry_fill_addrs(struct inet_diag_entry
*entry
,
664 const struct sock
*sk
)
666 #if IS_ENABLED(CONFIG_IPV6)
667 if (sk
->sk_family
== AF_INET6
) {
668 entry
->saddr
= sk
->sk_v6_rcv_saddr
.s6_addr32
;
669 entry
->daddr
= sk
->sk_v6_daddr
.s6_addr32
;
673 entry
->saddr
= &sk
->sk_rcv_saddr
;
674 entry
->daddr
= &sk
->sk_daddr
;
678 int inet_diag_bc_sk(const struct nlattr
*bc
, struct sock
*sk
)
680 struct inet_sock
*inet
= inet_sk(sk
);
681 struct inet_diag_entry entry
;
686 entry
.family
= sk
->sk_family
;
687 entry_fill_addrs(&entry
, sk
);
688 entry
.sport
= inet
->inet_num
;
689 entry
.dport
= ntohs(inet
->inet_dport
);
690 entry
.ifindex
= sk
->sk_bound_dev_if
;
691 entry
.userlocks
= sk_fullsock(sk
) ? sk
->sk_userlocks
: 0;
693 entry
.mark
= sk
->sk_mark
;
694 else if (sk
->sk_state
== TCP_NEW_SYN_RECV
)
695 entry
.mark
= inet_rsk(inet_reqsk(sk
))->ir_mark
;
699 return inet_diag_bc_run(bc
, &entry
);
701 EXPORT_SYMBOL_GPL(inet_diag_bc_sk
);
703 static int valid_cc(const void *bc
, int len
, int cc
)
706 const struct inet_diag_bc_op
*op
= bc
;
712 if (op
->yes
< 4 || op
->yes
& 3)
720 /* data is u32 ifindex */
721 static bool valid_devcond(const struct inet_diag_bc_op
*op
, int len
,
724 /* Check ifindex space. */
725 *min_len
+= sizeof(u32
);
731 /* Validate an inet_diag_hostcond. */
732 static bool valid_hostcond(const struct inet_diag_bc_op
*op
, int len
,
735 struct inet_diag_hostcond
*cond
;
738 /* Check hostcond space. */
739 *min_len
+= sizeof(struct inet_diag_hostcond
);
742 cond
= (struct inet_diag_hostcond
*)(op
+ 1);
744 /* Check address family and address length. */
745 switch (cond
->family
) {
750 addr_len
= sizeof(struct in_addr
);
753 addr_len
= sizeof(struct in6_addr
);
758 *min_len
+= addr_len
;
762 /* Check prefix length (in bits) vs address length (in bytes). */
763 if (cond
->prefix_len
> 8 * addr_len
)
769 /* Validate a port comparison operator. */
770 static bool valid_port_comparison(const struct inet_diag_bc_op
*op
,
771 int len
, int *min_len
)
773 /* Port comparisons put the port in a follow-on inet_diag_bc_op. */
774 *min_len
+= sizeof(struct inet_diag_bc_op
);
780 static bool valid_markcond(const struct inet_diag_bc_op
*op
, int len
,
783 *min_len
+= sizeof(struct inet_diag_markcond
);
784 return len
>= *min_len
;
787 static int inet_diag_bc_audit(const struct nlattr
*attr
,
788 const struct sk_buff
*skb
)
790 bool net_admin
= netlink_net_capable(skb
, CAP_NET_ADMIN
);
791 const void *bytecode
, *bc
;
792 int bytecode_len
, len
;
794 if (!attr
|| nla_len(attr
) < sizeof(struct inet_diag_bc_op
))
797 bytecode
= bc
= nla_data(attr
);
798 len
= bytecode_len
= nla_len(attr
);
801 int min_len
= sizeof(struct inet_diag_bc_op
);
802 const struct inet_diag_bc_op
*op
= bc
;
805 case INET_DIAG_BC_S_COND
:
806 case INET_DIAG_BC_D_COND
:
807 if (!valid_hostcond(bc
, len
, &min_len
))
810 case INET_DIAG_BC_DEV_COND
:
811 if (!valid_devcond(bc
, len
, &min_len
))
814 case INET_DIAG_BC_S_EQ
:
815 case INET_DIAG_BC_S_GE
:
816 case INET_DIAG_BC_S_LE
:
817 case INET_DIAG_BC_D_EQ
:
818 case INET_DIAG_BC_D_GE
:
819 case INET_DIAG_BC_D_LE
:
820 if (!valid_port_comparison(bc
, len
, &min_len
))
823 case INET_DIAG_BC_MARK_COND
:
826 if (!valid_markcond(bc
, len
, &min_len
))
829 case INET_DIAG_BC_AUTO
:
830 case INET_DIAG_BC_JMP
:
831 case INET_DIAG_BC_NOP
:
837 if (op
->code
!= INET_DIAG_BC_NOP
) {
838 if (op
->no
< min_len
|| op
->no
> len
+ 4 || op
->no
& 3)
841 !valid_cc(bytecode
, bytecode_len
, len
- op
->no
))
845 if (op
->yes
< min_len
|| op
->yes
> len
+ 4 || op
->yes
& 3)
850 return len
== 0 ? 0 : -EINVAL
;
853 static int inet_csk_diag_dump(struct sock
*sk
,
855 struct netlink_callback
*cb
,
856 const struct inet_diag_req_v2
*r
,
857 const struct nlattr
*bc
,
860 if (!inet_diag_bc_sk(bc
, sk
))
863 return inet_csk_diag_fill(sk
, skb
, r
,
864 sk_user_ns(NETLINK_CB(cb
->skb
).sk
),
865 NETLINK_CB(cb
->skb
).portid
,
866 cb
->nlh
->nlmsg_seq
, NLM_F_MULTI
, cb
->nlh
,
870 static void twsk_build_assert(void)
872 BUILD_BUG_ON(offsetof(struct inet_timewait_sock
, tw_family
) !=
873 offsetof(struct sock
, sk_family
));
875 BUILD_BUG_ON(offsetof(struct inet_timewait_sock
, tw_num
) !=
876 offsetof(struct inet_sock
, inet_num
));
878 BUILD_BUG_ON(offsetof(struct inet_timewait_sock
, tw_dport
) !=
879 offsetof(struct inet_sock
, inet_dport
));
881 BUILD_BUG_ON(offsetof(struct inet_timewait_sock
, tw_rcv_saddr
) !=
882 offsetof(struct inet_sock
, inet_rcv_saddr
));
884 BUILD_BUG_ON(offsetof(struct inet_timewait_sock
, tw_daddr
) !=
885 offsetof(struct inet_sock
, inet_daddr
));
887 #if IS_ENABLED(CONFIG_IPV6)
888 BUILD_BUG_ON(offsetof(struct inet_timewait_sock
, tw_v6_rcv_saddr
) !=
889 offsetof(struct sock
, sk_v6_rcv_saddr
));
891 BUILD_BUG_ON(offsetof(struct inet_timewait_sock
, tw_v6_daddr
) !=
892 offsetof(struct sock
, sk_v6_daddr
));
896 void inet_diag_dump_icsk(struct inet_hashinfo
*hashinfo
, struct sk_buff
*skb
,
897 struct netlink_callback
*cb
,
898 const struct inet_diag_req_v2
*r
, struct nlattr
*bc
)
900 bool net_admin
= netlink_net_capable(cb
->skb
, CAP_NET_ADMIN
);
901 struct net
*net
= sock_net(skb
->sk
);
902 u32 idiag_states
= r
->idiag_states
;
903 int i
, num
, s_i
, s_num
;
906 if (idiag_states
& TCPF_SYN_RECV
)
907 idiag_states
|= TCPF_NEW_SYN_RECV
;
909 s_num
= num
= cb
->args
[2];
911 if (cb
->args
[0] == 0) {
912 if (!(idiag_states
& TCPF_LISTEN
) || r
->id
.idiag_dport
)
915 for (i
= s_i
; i
< INET_LHTABLE_SIZE
; i
++) {
916 struct inet_listen_hashbucket
*ilb
;
919 ilb
= &hashinfo
->listening_hash
[i
];
920 spin_lock(&ilb
->lock
);
921 sk_for_each(sk
, &ilb
->head
) {
922 struct inet_sock
*inet
= inet_sk(sk
);
924 if (!net_eq(sock_net(sk
), net
))
932 if (r
->sdiag_family
!= AF_UNSPEC
&&
933 sk
->sk_family
!= r
->sdiag_family
)
936 if (r
->id
.idiag_sport
!= inet
->inet_sport
&&
940 if (inet_csk_diag_dump(sk
, skb
, cb
, r
,
941 bc
, net_admin
) < 0) {
942 spin_unlock(&ilb
->lock
);
949 spin_unlock(&ilb
->lock
);
955 s_i
= num
= s_num
= 0;
958 if (!(idiag_states
& ~TCPF_LISTEN
))
962 for (i
= s_i
; i
<= hashinfo
->ehash_mask
; i
++) {
963 struct inet_ehash_bucket
*head
= &hashinfo
->ehash
[i
];
964 spinlock_t
*lock
= inet_ehash_lockp(hashinfo
, i
);
965 struct hlist_nulls_node
*node
;
966 struct sock
*sk_arr
[SKARR_SZ
];
967 int num_arr
[SKARR_SZ
];
970 if (hlist_nulls_empty(&head
->chain
))
980 sk_nulls_for_each(sk
, node
, &head
->chain
) {
983 if (!net_eq(sock_net(sk
), net
))
987 state
= (sk
->sk_state
== TCP_TIME_WAIT
) ?
988 inet_twsk(sk
)->tw_substate
: sk
->sk_state
;
989 if (!(idiag_states
& (1 << state
)))
991 if (r
->sdiag_family
!= AF_UNSPEC
&&
992 sk
->sk_family
!= r
->sdiag_family
)
994 if (r
->id
.idiag_sport
!= htons(sk
->sk_num
) &&
997 if (r
->id
.idiag_dport
!= sk
->sk_dport
&&
1000 twsk_build_assert();
1002 if (!inet_diag_bc_sk(bc
, sk
))
1005 if (!refcount_inc_not_zero(&sk
->sk_refcnt
))
1008 num_arr
[accum
] = num
;
1010 if (++accum
== SKARR_SZ
)
1015 spin_unlock_bh(lock
);
1017 for (idx
= 0; idx
< accum
; idx
++) {
1019 res
= sk_diag_fill(sk_arr
[idx
], skb
, r
,
1020 sk_user_ns(NETLINK_CB(cb
->skb
).sk
),
1021 NETLINK_CB(cb
->skb
).portid
,
1022 cb
->nlh
->nlmsg_seq
, NLM_F_MULTI
,
1023 cb
->nlh
, net_admin
);
1027 sock_gen_put(sk_arr
[idx
]);
1032 if (accum
== SKARR_SZ
) {
1044 EXPORT_SYMBOL_GPL(inet_diag_dump_icsk
);
1046 static int __inet_diag_dump(struct sk_buff
*skb
, struct netlink_callback
*cb
,
1047 const struct inet_diag_req_v2
*r
,
1050 const struct inet_diag_handler
*handler
;
1053 handler
= inet_diag_lock_handler(r
->sdiag_protocol
);
1054 if (!IS_ERR(handler
))
1055 handler
->dump(skb
, cb
, r
, bc
);
1057 err
= PTR_ERR(handler
);
1058 inet_diag_unlock_handler(handler
);
1060 return err
? : skb
->len
;
1063 static int inet_diag_dump(struct sk_buff
*skb
, struct netlink_callback
*cb
)
1065 int hdrlen
= sizeof(struct inet_diag_req_v2
);
1066 struct nlattr
*bc
= NULL
;
1068 if (nlmsg_attrlen(cb
->nlh
, hdrlen
))
1069 bc
= nlmsg_find_attr(cb
->nlh
, hdrlen
, INET_DIAG_REQ_BYTECODE
);
1071 return __inet_diag_dump(skb
, cb
, nlmsg_data(cb
->nlh
), bc
);
1074 static int inet_diag_type2proto(int type
)
1077 case TCPDIAG_GETSOCK
:
1079 case DCCPDIAG_GETSOCK
:
1080 return IPPROTO_DCCP
;
1086 static int inet_diag_dump_compat(struct sk_buff
*skb
,
1087 struct netlink_callback
*cb
)
1089 struct inet_diag_req
*rc
= nlmsg_data(cb
->nlh
);
1090 int hdrlen
= sizeof(struct inet_diag_req
);
1091 struct inet_diag_req_v2 req
;
1092 struct nlattr
*bc
= NULL
;
1094 req
.sdiag_family
= AF_UNSPEC
; /* compatibility */
1095 req
.sdiag_protocol
= inet_diag_type2proto(cb
->nlh
->nlmsg_type
);
1096 req
.idiag_ext
= rc
->idiag_ext
;
1097 req
.idiag_states
= rc
->idiag_states
;
1100 if (nlmsg_attrlen(cb
->nlh
, hdrlen
))
1101 bc
= nlmsg_find_attr(cb
->nlh
, hdrlen
, INET_DIAG_REQ_BYTECODE
);
1103 return __inet_diag_dump(skb
, cb
, &req
, bc
);
1106 static int inet_diag_get_exact_compat(struct sk_buff
*in_skb
,
1107 const struct nlmsghdr
*nlh
)
1109 struct inet_diag_req
*rc
= nlmsg_data(nlh
);
1110 struct inet_diag_req_v2 req
;
1112 req
.sdiag_family
= rc
->idiag_family
;
1113 req
.sdiag_protocol
= inet_diag_type2proto(nlh
->nlmsg_type
);
1114 req
.idiag_ext
= rc
->idiag_ext
;
1115 req
.idiag_states
= rc
->idiag_states
;
1118 return inet_diag_cmd_exact(SOCK_DIAG_BY_FAMILY
, in_skb
, nlh
, &req
);
1121 static int inet_diag_rcv_msg_compat(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
1123 int hdrlen
= sizeof(struct inet_diag_req
);
1124 struct net
*net
= sock_net(skb
->sk
);
1126 if (nlh
->nlmsg_type
>= INET_DIAG_GETSOCK_MAX
||
1127 nlmsg_len(nlh
) < hdrlen
)
1130 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
1131 if (nlmsg_attrlen(nlh
, hdrlen
)) {
1132 struct nlattr
*attr
;
1135 attr
= nlmsg_find_attr(nlh
, hdrlen
,
1136 INET_DIAG_REQ_BYTECODE
);
1137 err
= inet_diag_bc_audit(attr
, skb
);
1142 struct netlink_dump_control c
= {
1143 .dump
= inet_diag_dump_compat
,
1145 return netlink_dump_start(net
->diag_nlsk
, skb
, nlh
, &c
);
1149 return inet_diag_get_exact_compat(skb
, nlh
);
1152 static int inet_diag_handler_cmd(struct sk_buff
*skb
, struct nlmsghdr
*h
)
1154 int hdrlen
= sizeof(struct inet_diag_req_v2
);
1155 struct net
*net
= sock_net(skb
->sk
);
1157 if (nlmsg_len(h
) < hdrlen
)
1160 if (h
->nlmsg_type
== SOCK_DIAG_BY_FAMILY
&&
1161 h
->nlmsg_flags
& NLM_F_DUMP
) {
1162 if (nlmsg_attrlen(h
, hdrlen
)) {
1163 struct nlattr
*attr
;
1166 attr
= nlmsg_find_attr(h
, hdrlen
,
1167 INET_DIAG_REQ_BYTECODE
);
1168 err
= inet_diag_bc_audit(attr
, skb
);
1173 struct netlink_dump_control c
= {
1174 .dump
= inet_diag_dump
,
1176 return netlink_dump_start(net
->diag_nlsk
, skb
, h
, &c
);
1180 return inet_diag_cmd_exact(h
->nlmsg_type
, skb
, h
, nlmsg_data(h
));
1184 int inet_diag_handler_get_info(struct sk_buff
*skb
, struct sock
*sk
)
1186 const struct inet_diag_handler
*handler
;
1187 struct nlmsghdr
*nlh
;
1188 struct nlattr
*attr
;
1189 struct inet_diag_msg
*r
;
1193 nlh
= nlmsg_put(skb
, 0, 0, SOCK_DIAG_BY_FAMILY
, sizeof(*r
), 0);
1197 r
= nlmsg_data(nlh
);
1198 memset(r
, 0, sizeof(*r
));
1199 inet_diag_msg_common_fill(r
, sk
);
1200 if (sk
->sk_type
== SOCK_DGRAM
|| sk
->sk_type
== SOCK_STREAM
)
1201 r
->id
.idiag_sport
= inet_sk(sk
)->inet_sport
;
1202 r
->idiag_state
= sk
->sk_state
;
1204 if ((err
= nla_put_u8(skb
, INET_DIAG_PROTOCOL
, sk
->sk_protocol
))) {
1205 nlmsg_cancel(skb
, nlh
);
1209 handler
= inet_diag_lock_handler(sk
->sk_protocol
);
1210 if (IS_ERR(handler
)) {
1211 inet_diag_unlock_handler(handler
);
1212 nlmsg_cancel(skb
, nlh
);
1213 return PTR_ERR(handler
);
1216 attr
= handler
->idiag_info_size
1217 ? nla_reserve_64bit(skb
, INET_DIAG_INFO
,
1218 handler
->idiag_info_size
,
1222 info
= nla_data(attr
);
1224 handler
->idiag_get_info(sk
, r
, info
);
1225 inet_diag_unlock_handler(handler
);
1227 nlmsg_end(skb
, nlh
);
1231 static const struct sock_diag_handler inet_diag_handler
= {
1233 .dump
= inet_diag_handler_cmd
,
1234 .get_info
= inet_diag_handler_get_info
,
1235 .destroy
= inet_diag_handler_cmd
,
1238 static const struct sock_diag_handler inet6_diag_handler
= {
1240 .dump
= inet_diag_handler_cmd
,
1241 .get_info
= inet_diag_handler_get_info
,
1242 .destroy
= inet_diag_handler_cmd
,
1245 int inet_diag_register(const struct inet_diag_handler
*h
)
1247 const __u16 type
= h
->idiag_type
;
1250 if (type
>= IPPROTO_MAX
)
1253 mutex_lock(&inet_diag_table_mutex
);
1255 if (!inet_diag_table
[type
]) {
1256 inet_diag_table
[type
] = h
;
1259 mutex_unlock(&inet_diag_table_mutex
);
1263 EXPORT_SYMBOL_GPL(inet_diag_register
);
1265 void inet_diag_unregister(const struct inet_diag_handler
*h
)
1267 const __u16 type
= h
->idiag_type
;
1269 if (type
>= IPPROTO_MAX
)
1272 mutex_lock(&inet_diag_table_mutex
);
1273 inet_diag_table
[type
] = NULL
;
1274 mutex_unlock(&inet_diag_table_mutex
);
1276 EXPORT_SYMBOL_GPL(inet_diag_unregister
);
1278 static int __init
inet_diag_init(void)
1280 const int inet_diag_table_size
= (IPPROTO_MAX
*
1281 sizeof(struct inet_diag_handler
*));
1284 inet_diag_table
= kzalloc(inet_diag_table_size
, GFP_KERNEL
);
1285 if (!inet_diag_table
)
1288 err
= sock_diag_register(&inet_diag_handler
);
1292 err
= sock_diag_register(&inet6_diag_handler
);
1296 sock_diag_register_inet_compat(inet_diag_rcv_msg_compat
);
1301 sock_diag_unregister(&inet_diag_handler
);
1303 kfree(inet_diag_table
);
1307 static void __exit
inet_diag_exit(void)
1309 sock_diag_unregister(&inet6_diag_handler
);
1310 sock_diag_unregister(&inet_diag_handler
);
1311 sock_diag_unregister_inet_compat(inet_diag_rcv_msg_compat
);
1312 kfree(inet_diag_table
);
1315 module_init(inet_diag_init
);
1316 module_exit(inet_diag_exit
);
1317 MODULE_LICENSE("GPL");
1318 MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK
, NETLINK_SOCK_DIAG
, 2 /* AF_INET */);
1319 MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK
, NETLINK_SOCK_DIAG
, 10 /* AF_INET6 */);