2 * Copyright (c) 2004, 2005 Topspin Communications. All rights reserved.
3 * Copyright (c) 2005 Mellanox Technologies Ltd. All rights reserved.
4 * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
6 * This software is available to you under a choice of one of two
7 * licenses. You may choose to be licensed under the terms of the GNU
8 * General Public License (GPL) Version 2, available from the file
9 * COPYING in the main directory of this source tree, or the
10 * OpenIB.org BSD license below:
12 * Redistribution and use in source and binary forms, with or
13 * without modification, are permitted provided that the following
16 * - Redistributions of source code must retain the above
17 * copyright notice, this list of conditions and the following
20 * - Redistributions in binary form must reproduce the above
21 * copyright notice, this list of conditions and the following
22 * disclaimer in the documentation and/or other materials
23 * provided with the distribution.
25 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
26 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
27 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
28 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
29 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
30 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
31 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
35 #include "core_priv.h"
37 #include <linux/slab.h>
38 #include <linux/stat.h>
39 #include <linux/string.h>
40 #include <linux/netdevice.h>
41 #include <linux/ethtool.h>
43 #include <rdma/ib_mad.h>
44 #include <rdma/ib_pma.h>
45 #include <rdma/ib_cache.h>
46 #include <rdma/rdma_counter.h>
50 struct gid_attr_group
{
53 struct attribute_group ndev
;
54 struct attribute_group type
;
58 struct ib_device
*ibdev
;
59 struct gid_attr_group
*gid_attr_group
;
60 struct attribute_group gid_group
;
61 struct attribute_group
*pkey_group
;
62 const struct attribute_group
*pma_table
;
63 struct attribute_group
*hw_stats_ag
;
64 struct rdma_hw_stats
*hw_stats
;
68 struct port_attribute
{
69 struct attribute attr
;
70 ssize_t (*show
)(struct ib_port
*, struct port_attribute
*, char *buf
);
71 ssize_t (*store
)(struct ib_port
*, struct port_attribute
*,
72 const char *buf
, size_t count
);
75 #define PORT_ATTR(_name, _mode, _show, _store) \
76 struct port_attribute port_attr_##_name = __ATTR(_name, _mode, _show, _store)
78 #define PORT_ATTR_RO(_name) \
79 struct port_attribute port_attr_##_name = __ATTR_RO(_name)
81 struct port_table_attribute
{
82 struct port_attribute attr
;
88 struct hw_stats_attribute
{
89 struct attribute attr
;
90 ssize_t (*show
)(struct kobject
*kobj
,
91 struct attribute
*attr
, char *buf
);
92 ssize_t (*store
)(struct kobject
*kobj
,
93 struct attribute
*attr
,
100 static ssize_t
port_attr_show(struct kobject
*kobj
,
101 struct attribute
*attr
, char *buf
)
103 struct port_attribute
*port_attr
=
104 container_of(attr
, struct port_attribute
, attr
);
105 struct ib_port
*p
= container_of(kobj
, struct ib_port
, kobj
);
107 if (!port_attr
->show
)
110 return port_attr
->show(p
, port_attr
, buf
);
113 static ssize_t
port_attr_store(struct kobject
*kobj
,
114 struct attribute
*attr
,
115 const char *buf
, size_t count
)
117 struct port_attribute
*port_attr
=
118 container_of(attr
, struct port_attribute
, attr
);
119 struct ib_port
*p
= container_of(kobj
, struct ib_port
, kobj
);
121 if (!port_attr
->store
)
123 return port_attr
->store(p
, port_attr
, buf
, count
);
126 static const struct sysfs_ops port_sysfs_ops
= {
127 .show
= port_attr_show
,
128 .store
= port_attr_store
131 static ssize_t
gid_attr_show(struct kobject
*kobj
,
132 struct attribute
*attr
, char *buf
)
134 struct port_attribute
*port_attr
=
135 container_of(attr
, struct port_attribute
, attr
);
136 struct ib_port
*p
= container_of(kobj
, struct gid_attr_group
,
139 if (!port_attr
->show
)
142 return port_attr
->show(p
, port_attr
, buf
);
145 static const struct sysfs_ops gid_attr_sysfs_ops
= {
146 .show
= gid_attr_show
149 static ssize_t
state_show(struct ib_port
*p
, struct port_attribute
*unused
,
152 struct ib_port_attr attr
;
155 static const char *state_name
[] = {
156 [IB_PORT_NOP
] = "NOP",
157 [IB_PORT_DOWN
] = "DOWN",
158 [IB_PORT_INIT
] = "INIT",
159 [IB_PORT_ARMED
] = "ARMED",
160 [IB_PORT_ACTIVE
] = "ACTIVE",
161 [IB_PORT_ACTIVE_DEFER
] = "ACTIVE_DEFER"
164 ret
= ib_query_port(p
->ibdev
, p
->port_num
, &attr
);
168 return sysfs_emit(buf
, "%d: %s\n", attr
.state
,
170 attr
.state
< ARRAY_SIZE(state_name
) ?
171 state_name
[attr
.state
] :
175 static ssize_t
lid_show(struct ib_port
*p
, struct port_attribute
*unused
,
178 struct ib_port_attr attr
;
181 ret
= ib_query_port(p
->ibdev
, p
->port_num
, &attr
);
185 return sysfs_emit(buf
, "0x%x\n", attr
.lid
);
188 static ssize_t
lid_mask_count_show(struct ib_port
*p
,
189 struct port_attribute
*unused
,
192 struct ib_port_attr attr
;
195 ret
= ib_query_port(p
->ibdev
, p
->port_num
, &attr
);
199 return sysfs_emit(buf
, "%d\n", attr
.lmc
);
202 static ssize_t
sm_lid_show(struct ib_port
*p
, struct port_attribute
*unused
,
205 struct ib_port_attr attr
;
208 ret
= ib_query_port(p
->ibdev
, p
->port_num
, &attr
);
212 return sysfs_emit(buf
, "0x%x\n", attr
.sm_lid
);
215 static ssize_t
sm_sl_show(struct ib_port
*p
, struct port_attribute
*unused
,
218 struct ib_port_attr attr
;
221 ret
= ib_query_port(p
->ibdev
, p
->port_num
, &attr
);
225 return sysfs_emit(buf
, "%d\n", attr
.sm_sl
);
228 static ssize_t
cap_mask_show(struct ib_port
*p
, struct port_attribute
*unused
,
231 struct ib_port_attr attr
;
234 ret
= ib_query_port(p
->ibdev
, p
->port_num
, &attr
);
238 return sysfs_emit(buf
, "0x%08x\n", attr
.port_cap_flags
);
241 static ssize_t
rate_show(struct ib_port
*p
, struct port_attribute
*unused
,
244 struct ib_port_attr attr
;
246 int rate
; /* in deci-Gb/sec */
249 ret
= ib_query_port(p
->ibdev
, p
->port_num
, &attr
);
253 switch (attr
.active_speed
) {
283 default: /* default to SDR for invalid rates */
289 rate
*= ib_width_enum_to_int(attr
.active_width
);
293 return sysfs_emit(buf
, "%d%s Gb/sec (%dX%s)\n", rate
/ 10,
294 rate
% 10 ? ".5" : "",
295 ib_width_enum_to_int(attr
.active_width
), speed
);
298 static const char *phys_state_to_str(enum ib_port_phys_state phys_state
)
300 static const char * phys_state_str
[] = {
305 "PortConfigurationTraining",
311 if (phys_state
< ARRAY_SIZE(phys_state_str
))
312 return phys_state_str
[phys_state
];
316 static ssize_t
phys_state_show(struct ib_port
*p
, struct port_attribute
*unused
,
319 struct ib_port_attr attr
;
323 ret
= ib_query_port(p
->ibdev
, p
->port_num
, &attr
);
327 return sysfs_emit(buf
, "%d: %s\n", attr
.phys_state
,
328 phys_state_to_str(attr
.phys_state
));
331 static ssize_t
link_layer_show(struct ib_port
*p
, struct port_attribute
*unused
,
336 switch (rdma_port_get_link_layer(p
->ibdev
, p
->port_num
)) {
337 case IB_LINK_LAYER_INFINIBAND
:
338 output
= "InfiniBand";
340 case IB_LINK_LAYER_ETHERNET
:
348 return sysfs_emit(buf
, "%s\n", output
);
351 static PORT_ATTR_RO(state
);
352 static PORT_ATTR_RO(lid
);
353 static PORT_ATTR_RO(lid_mask_count
);
354 static PORT_ATTR_RO(sm_lid
);
355 static PORT_ATTR_RO(sm_sl
);
356 static PORT_ATTR_RO(cap_mask
);
357 static PORT_ATTR_RO(rate
);
358 static PORT_ATTR_RO(phys_state
);
359 static PORT_ATTR_RO(link_layer
);
361 static struct attribute
*port_default_attrs
[] = {
362 &port_attr_state
.attr
,
364 &port_attr_lid_mask_count
.attr
,
365 &port_attr_sm_lid
.attr
,
366 &port_attr_sm_sl
.attr
,
367 &port_attr_cap_mask
.attr
,
368 &port_attr_rate
.attr
,
369 &port_attr_phys_state
.attr
,
370 &port_attr_link_layer
.attr
,
374 static ssize_t
print_ndev(const struct ib_gid_attr
*gid_attr
, char *buf
)
376 struct net_device
*ndev
;
380 ndev
= rcu_dereference(gid_attr
->ndev
);
382 ret
= sysfs_emit(buf
, "%s\n", ndev
->name
);
387 static ssize_t
print_gid_type(const struct ib_gid_attr
*gid_attr
, char *buf
)
389 return sysfs_emit(buf
, "%s\n",
390 ib_cache_gid_type_str(gid_attr
->gid_type
));
393 static ssize_t
_show_port_gid_attr(
394 struct ib_port
*p
, struct port_attribute
*attr
, char *buf
,
395 ssize_t (*print
)(const struct ib_gid_attr
*gid_attr
, char *buf
))
397 struct port_table_attribute
*tab_attr
=
398 container_of(attr
, struct port_table_attribute
, attr
);
399 const struct ib_gid_attr
*gid_attr
;
402 gid_attr
= rdma_get_gid_attr(p
->ibdev
, p
->port_num
, tab_attr
->index
);
403 if (IS_ERR(gid_attr
))
404 /* -EINVAL is returned for user space compatibility reasons. */
407 ret
= print(gid_attr
, buf
);
408 rdma_put_gid_attr(gid_attr
);
412 static ssize_t
show_port_gid(struct ib_port
*p
, struct port_attribute
*attr
,
415 struct port_table_attribute
*tab_attr
=
416 container_of(attr
, struct port_table_attribute
, attr
);
417 const struct ib_gid_attr
*gid_attr
;
420 gid_attr
= rdma_get_gid_attr(p
->ibdev
, p
->port_num
, tab_attr
->index
);
421 if (IS_ERR(gid_attr
)) {
422 const union ib_gid zgid
= {};
424 /* If reading GID fails, it is likely due to GID entry being
425 * empty (invalid) or reserved GID in the table. User space
426 * expects to read GID table entries as long as the given index
427 * is within GID table size. Administrative/debugging tools
428 * fail to query the rest of the GID entries if they hit an error
429 * while querying a GID of the given index. To avoid user
430 * space throwing such an error on failure to read a GID, return zero
431 * GID as before. This maintains backward compatibility.
433 return sysfs_emit(buf
, "%pI6\n", zgid
.raw
);
436 len
= sysfs_emit(buf
, "%pI6\n", gid_attr
->gid
.raw
);
437 rdma_put_gid_attr(gid_attr
);
441 static ssize_t
show_port_gid_attr_ndev(struct ib_port
*p
,
442 struct port_attribute
*attr
, char *buf
)
444 return _show_port_gid_attr(p
, attr
, buf
, print_ndev
);
447 static ssize_t
show_port_gid_attr_gid_type(struct ib_port
*p
,
448 struct port_attribute
*attr
,
451 return _show_port_gid_attr(p
, attr
, buf
, print_gid_type
);
454 static ssize_t
show_port_pkey(struct ib_port
*p
, struct port_attribute
*attr
,
457 struct port_table_attribute
*tab_attr
=
458 container_of(attr
, struct port_table_attribute
, attr
);
462 ret
= ib_query_pkey(p
->ibdev
, p
->port_num
, tab_attr
->index
, &pkey
);
466 return sysfs_emit(buf
, "0x%04x\n", pkey
);
469 #define PORT_PMA_ATTR(_name, _counter, _width, _offset) \
470 struct port_table_attribute port_pma_attr_##_name = { \
471 .attr = __ATTR(_name, S_IRUGO, show_pma_counter, NULL), \
472 .index = (_offset) | ((_width) << 16) | ((_counter) << 24), \
473 .attr_id = IB_PMA_PORT_COUNTERS , \
476 #define PORT_PMA_ATTR_EXT(_name, _width, _offset) \
477 struct port_table_attribute port_pma_attr_ext_##_name = { \
478 .attr = __ATTR(_name, S_IRUGO, show_pma_counter, NULL), \
479 .index = (_offset) | ((_width) << 16), \
480 .attr_id = IB_PMA_PORT_COUNTERS_EXT , \
484 * Get a Perfmgmt MAD block of data.
485 * Returns error code or the number of bytes retrieved.
487 static int get_perf_mad(struct ib_device
*dev
, int port_num
, __be16 attr
,
488 void *data
, int offset
, size_t size
)
490 struct ib_mad
*in_mad
;
491 struct ib_mad
*out_mad
;
492 size_t mad_size
= sizeof(*out_mad
);
493 u16 out_mad_pkey_index
= 0;
496 if (!dev
->ops
.process_mad
)
499 in_mad
= kzalloc(sizeof(*in_mad
), GFP_KERNEL
);
500 out_mad
= kzalloc(sizeof(*out_mad
), GFP_KERNEL
);
501 if (!in_mad
|| !out_mad
) {
506 in_mad
->mad_hdr
.base_version
= 1;
507 in_mad
->mad_hdr
.mgmt_class
= IB_MGMT_CLASS_PERF_MGMT
;
508 in_mad
->mad_hdr
.class_version
= 1;
509 in_mad
->mad_hdr
.method
= IB_MGMT_METHOD_GET
;
510 in_mad
->mad_hdr
.attr_id
= attr
;
512 if (attr
!= IB_PMA_CLASS_PORT_INFO
)
513 in_mad
->data
[41] = port_num
; /* PortSelect field */
515 if ((dev
->ops
.process_mad(dev
, IB_MAD_IGNORE_MKEY
, port_num
, NULL
, NULL
,
516 in_mad
, out_mad
, &mad_size
,
517 &out_mad_pkey_index
) &
518 (IB_MAD_RESULT_SUCCESS
| IB_MAD_RESULT_REPLY
)) !=
519 (IB_MAD_RESULT_SUCCESS
| IB_MAD_RESULT_REPLY
)) {
523 memcpy(data
, out_mad
->data
+ offset
, size
);
531 static ssize_t
show_pma_counter(struct ib_port
*p
, struct port_attribute
*attr
,
534 struct port_table_attribute
*tab_attr
=
535 container_of(attr
, struct port_table_attribute
, attr
);
536 int offset
= tab_attr
->index
& 0xffff;
537 int width
= (tab_attr
->index
>> 16) & 0xff;
542 ret
= get_perf_mad(p
->ibdev
, p
->port_num
, tab_attr
->attr_id
, &data
,
543 40 + offset
/ 8, sizeof(data
));
549 len
= sysfs_emit(buf
, "%u\n",
550 (*data
>> (4 - (offset
% 8))) & 0xf);
553 len
= sysfs_emit(buf
, "%u\n", *data
);
556 len
= sysfs_emit(buf
, "%u\n", be16_to_cpup((__be16
*)data
));
559 len
= sysfs_emit(buf
, "%u\n", be32_to_cpup((__be32
*)data
));
562 len
= sysfs_emit(buf
, "%llu\n", be64_to_cpup((__be64
*)data
));
572 static PORT_PMA_ATTR(symbol_error
, 0, 16, 32);
573 static PORT_PMA_ATTR(link_error_recovery
, 1, 8, 48);
574 static PORT_PMA_ATTR(link_downed
, 2, 8, 56);
575 static PORT_PMA_ATTR(port_rcv_errors
, 3, 16, 64);
576 static PORT_PMA_ATTR(port_rcv_remote_physical_errors
, 4, 16, 80);
577 static PORT_PMA_ATTR(port_rcv_switch_relay_errors
, 5, 16, 96);
578 static PORT_PMA_ATTR(port_xmit_discards
, 6, 16, 112);
579 static PORT_PMA_ATTR(port_xmit_constraint_errors
, 7, 8, 128);
580 static PORT_PMA_ATTR(port_rcv_constraint_errors
, 8, 8, 136);
581 static PORT_PMA_ATTR(local_link_integrity_errors
, 9, 4, 152);
582 static PORT_PMA_ATTR(excessive_buffer_overrun_errors
, 10, 4, 156);
583 static PORT_PMA_ATTR(VL15_dropped
, 11, 16, 176);
584 static PORT_PMA_ATTR(port_xmit_data
, 12, 32, 192);
585 static PORT_PMA_ATTR(port_rcv_data
, 13, 32, 224);
586 static PORT_PMA_ATTR(port_xmit_packets
, 14, 32, 256);
587 static PORT_PMA_ATTR(port_rcv_packets
, 15, 32, 288);
588 static PORT_PMA_ATTR(port_xmit_wait
, 0, 32, 320);
591 * Counters added by extended set
593 static PORT_PMA_ATTR_EXT(port_xmit_data
, 64, 64);
594 static PORT_PMA_ATTR_EXT(port_rcv_data
, 64, 128);
595 static PORT_PMA_ATTR_EXT(port_xmit_packets
, 64, 192);
596 static PORT_PMA_ATTR_EXT(port_rcv_packets
, 64, 256);
597 static PORT_PMA_ATTR_EXT(unicast_xmit_packets
, 64, 320);
598 static PORT_PMA_ATTR_EXT(unicast_rcv_packets
, 64, 384);
599 static PORT_PMA_ATTR_EXT(multicast_xmit_packets
, 64, 448);
600 static PORT_PMA_ATTR_EXT(multicast_rcv_packets
, 64, 512);
602 static struct attribute
*pma_attrs
[] = {
603 &port_pma_attr_symbol_error
.attr
.attr
,
604 &port_pma_attr_link_error_recovery
.attr
.attr
,
605 &port_pma_attr_link_downed
.attr
.attr
,
606 &port_pma_attr_port_rcv_errors
.attr
.attr
,
607 &port_pma_attr_port_rcv_remote_physical_errors
.attr
.attr
,
608 &port_pma_attr_port_rcv_switch_relay_errors
.attr
.attr
,
609 &port_pma_attr_port_xmit_discards
.attr
.attr
,
610 &port_pma_attr_port_xmit_constraint_errors
.attr
.attr
,
611 &port_pma_attr_port_rcv_constraint_errors
.attr
.attr
,
612 &port_pma_attr_local_link_integrity_errors
.attr
.attr
,
613 &port_pma_attr_excessive_buffer_overrun_errors
.attr
.attr
,
614 &port_pma_attr_VL15_dropped
.attr
.attr
,
615 &port_pma_attr_port_xmit_data
.attr
.attr
,
616 &port_pma_attr_port_rcv_data
.attr
.attr
,
617 &port_pma_attr_port_xmit_packets
.attr
.attr
,
618 &port_pma_attr_port_rcv_packets
.attr
.attr
,
619 &port_pma_attr_port_xmit_wait
.attr
.attr
,
623 static struct attribute
*pma_attrs_ext
[] = {
624 &port_pma_attr_symbol_error
.attr
.attr
,
625 &port_pma_attr_link_error_recovery
.attr
.attr
,
626 &port_pma_attr_link_downed
.attr
.attr
,
627 &port_pma_attr_port_rcv_errors
.attr
.attr
,
628 &port_pma_attr_port_rcv_remote_physical_errors
.attr
.attr
,
629 &port_pma_attr_port_rcv_switch_relay_errors
.attr
.attr
,
630 &port_pma_attr_port_xmit_discards
.attr
.attr
,
631 &port_pma_attr_port_xmit_constraint_errors
.attr
.attr
,
632 &port_pma_attr_port_rcv_constraint_errors
.attr
.attr
,
633 &port_pma_attr_local_link_integrity_errors
.attr
.attr
,
634 &port_pma_attr_excessive_buffer_overrun_errors
.attr
.attr
,
635 &port_pma_attr_VL15_dropped
.attr
.attr
,
636 &port_pma_attr_ext_port_xmit_data
.attr
.attr
,
637 &port_pma_attr_ext_port_rcv_data
.attr
.attr
,
638 &port_pma_attr_ext_port_xmit_packets
.attr
.attr
,
639 &port_pma_attr_port_xmit_wait
.attr
.attr
,
640 &port_pma_attr_ext_port_rcv_packets
.attr
.attr
,
641 &port_pma_attr_ext_unicast_rcv_packets
.attr
.attr
,
642 &port_pma_attr_ext_unicast_xmit_packets
.attr
.attr
,
643 &port_pma_attr_ext_multicast_rcv_packets
.attr
.attr
,
644 &port_pma_attr_ext_multicast_xmit_packets
.attr
.attr
,
648 static struct attribute
*pma_attrs_noietf
[] = {
649 &port_pma_attr_symbol_error
.attr
.attr
,
650 &port_pma_attr_link_error_recovery
.attr
.attr
,
651 &port_pma_attr_link_downed
.attr
.attr
,
652 &port_pma_attr_port_rcv_errors
.attr
.attr
,
653 &port_pma_attr_port_rcv_remote_physical_errors
.attr
.attr
,
654 &port_pma_attr_port_rcv_switch_relay_errors
.attr
.attr
,
655 &port_pma_attr_port_xmit_discards
.attr
.attr
,
656 &port_pma_attr_port_xmit_constraint_errors
.attr
.attr
,
657 &port_pma_attr_port_rcv_constraint_errors
.attr
.attr
,
658 &port_pma_attr_local_link_integrity_errors
.attr
.attr
,
659 &port_pma_attr_excessive_buffer_overrun_errors
.attr
.attr
,
660 &port_pma_attr_VL15_dropped
.attr
.attr
,
661 &port_pma_attr_ext_port_xmit_data
.attr
.attr
,
662 &port_pma_attr_ext_port_rcv_data
.attr
.attr
,
663 &port_pma_attr_ext_port_xmit_packets
.attr
.attr
,
664 &port_pma_attr_ext_port_rcv_packets
.attr
.attr
,
665 &port_pma_attr_port_xmit_wait
.attr
.attr
,
669 static const struct attribute_group pma_group
= {
674 static const struct attribute_group pma_group_ext
= {
676 .attrs
= pma_attrs_ext
679 static const struct attribute_group pma_group_noietf
= {
681 .attrs
= pma_attrs_noietf
684 static void ib_port_release(struct kobject
*kobj
)
686 struct ib_port
*p
= container_of(kobj
, struct ib_port
, kobj
);
690 if (p
->gid_group
.attrs
) {
691 for (i
= 0; (a
= p
->gid_group
.attrs
[i
]); ++i
)
694 kfree(p
->gid_group
.attrs
);
698 if (p
->pkey_group
->attrs
) {
699 for (i
= 0; (a
= p
->pkey_group
->attrs
[i
]); ++i
)
702 kfree(p
->pkey_group
->attrs
);
705 kfree(p
->pkey_group
);
706 p
->pkey_group
= NULL
;
712 static void ib_port_gid_attr_release(struct kobject
*kobj
)
714 struct gid_attr_group
*g
= container_of(kobj
, struct gid_attr_group
,
720 for (i
= 0; (a
= g
->ndev
.attrs
[i
]); ++i
)
723 kfree(g
->ndev
.attrs
);
727 for (i
= 0; (a
= g
->type
.attrs
[i
]); ++i
)
730 kfree(g
->type
.attrs
);
736 static struct kobj_type port_type
= {
737 .release
= ib_port_release
,
738 .sysfs_ops
= &port_sysfs_ops
,
739 .default_attrs
= port_default_attrs
742 static struct kobj_type gid_attr_type
= {
743 .sysfs_ops
= &gid_attr_sysfs_ops
,
744 .release
= ib_port_gid_attr_release
747 static struct attribute
**
748 alloc_group_attrs(ssize_t (*show
)(struct ib_port
*,
749 struct port_attribute
*, char *buf
),
752 struct attribute
**tab_attr
;
753 struct port_table_attribute
*element
;
756 tab_attr
= kcalloc(1 + len
, sizeof(struct attribute
*), GFP_KERNEL
);
760 for (i
= 0; i
< len
; i
++) {
761 element
= kzalloc(sizeof(struct port_table_attribute
),
766 if (snprintf(element
->name
, sizeof(element
->name
),
767 "%d", i
) >= sizeof(element
->name
)) {
772 element
->attr
.attr
.name
= element
->name
;
773 element
->attr
.attr
.mode
= S_IRUGO
;
774 element
->attr
.show
= show
;
776 sysfs_attr_init(&element
->attr
.attr
);
778 tab_attr
[i
] = &element
->attr
.attr
;
791 * Figure out which counter table to use depending on
792 * the device capabilities.
794 static const struct attribute_group
*get_counter_table(struct ib_device
*dev
,
797 struct ib_class_port_info cpi
;
799 if (get_perf_mad(dev
, port_num
, IB_PMA_CLASS_PORT_INFO
,
800 &cpi
, 40, sizeof(cpi
)) >= 0) {
801 if (cpi
.capability_mask
& IB_PMA_CLASS_CAP_EXT_WIDTH
)
802 /* We have extended counters */
803 return &pma_group_ext
;
805 if (cpi
.capability_mask
& IB_PMA_CLASS_CAP_EXT_WIDTH_NOIETF
)
806 /* But not the IETF ones */
807 return &pma_group_noietf
;
810 /* Fall back to normal counters */
814 static int update_hw_stats(struct ib_device
*dev
, struct rdma_hw_stats
*stats
,
815 u8 port_num
, int index
)
819 if (time_is_after_eq_jiffies(stats
->timestamp
+ stats
->lifespan
))
821 ret
= dev
->ops
.get_hw_stats(dev
, stats
, port_num
, index
);
824 if (ret
== stats
->num_counters
)
825 stats
->timestamp
= jiffies
;
830 static int print_hw_stat(struct ib_device
*dev
, int port_num
,
831 struct rdma_hw_stats
*stats
, int index
, char *buf
)
833 u64 v
= rdma_counter_get_hwstat_value(dev
, port_num
, index
);
835 return sysfs_emit(buf
, "%llu\n", stats
->value
[index
] + v
);
838 static ssize_t
show_hw_stats(struct kobject
*kobj
, struct attribute
*attr
,
841 struct ib_device
*dev
;
842 struct ib_port
*port
;
843 struct hw_stats_attribute
*hsa
;
844 struct rdma_hw_stats
*stats
;
847 hsa
= container_of(attr
, struct hw_stats_attribute
, attr
);
848 if (!hsa
->port_num
) {
849 dev
= container_of((struct device
*)kobj
,
850 struct ib_device
, dev
);
851 stats
= dev
->hw_stats
;
853 port
= container_of(kobj
, struct ib_port
, kobj
);
855 stats
= port
->hw_stats
;
857 mutex_lock(&stats
->lock
);
858 ret
= update_hw_stats(dev
, stats
, hsa
->port_num
, hsa
->index
);
861 ret
= print_hw_stat(dev
, hsa
->port_num
, stats
, hsa
->index
, buf
);
863 mutex_unlock(&stats
->lock
);
868 static ssize_t
show_stats_lifespan(struct kobject
*kobj
,
869 struct attribute
*attr
,
872 struct hw_stats_attribute
*hsa
;
873 struct rdma_hw_stats
*stats
;
876 hsa
= container_of(attr
, struct hw_stats_attribute
, attr
);
877 if (!hsa
->port_num
) {
878 struct ib_device
*dev
= container_of((struct device
*)kobj
,
879 struct ib_device
, dev
);
881 stats
= dev
->hw_stats
;
883 struct ib_port
*p
= container_of(kobj
, struct ib_port
, kobj
);
888 mutex_lock(&stats
->lock
);
889 msecs
= jiffies_to_msecs(stats
->lifespan
);
890 mutex_unlock(&stats
->lock
);
892 return sysfs_emit(buf
, "%d\n", msecs
);
895 static ssize_t
set_stats_lifespan(struct kobject
*kobj
,
896 struct attribute
*attr
,
897 const char *buf
, size_t count
)
899 struct hw_stats_attribute
*hsa
;
900 struct rdma_hw_stats
*stats
;
905 ret
= kstrtoint(buf
, 10, &msecs
);
908 if (msecs
< 0 || msecs
> 10000)
910 jiffies
= msecs_to_jiffies(msecs
);
911 hsa
= container_of(attr
, struct hw_stats_attribute
, attr
);
912 if (!hsa
->port_num
) {
913 struct ib_device
*dev
= container_of((struct device
*)kobj
,
914 struct ib_device
, dev
);
916 stats
= dev
->hw_stats
;
918 struct ib_port
*p
= container_of(kobj
, struct ib_port
, kobj
);
923 mutex_lock(&stats
->lock
);
924 stats
->lifespan
= jiffies
;
925 mutex_unlock(&stats
->lock
);
930 static void free_hsag(struct kobject
*kobj
, struct attribute_group
*attr_group
)
932 struct attribute
**attr
;
934 sysfs_remove_group(kobj
, attr_group
);
936 for (attr
= attr_group
->attrs
; *attr
; attr
++)
941 static struct attribute
*alloc_hsa(int index
, u8 port_num
, const char *name
)
943 struct hw_stats_attribute
*hsa
;
945 hsa
= kmalloc(sizeof(*hsa
), GFP_KERNEL
);
949 hsa
->attr
.name
= (char *)name
;
950 hsa
->attr
.mode
= S_IRUGO
;
951 hsa
->show
= show_hw_stats
;
954 hsa
->port_num
= port_num
;
959 static struct attribute
*alloc_hsa_lifespan(char *name
, u8 port_num
)
961 struct hw_stats_attribute
*hsa
;
963 hsa
= kmalloc(sizeof(*hsa
), GFP_KERNEL
);
967 hsa
->attr
.name
= name
;
968 hsa
->attr
.mode
= S_IWUSR
| S_IRUGO
;
969 hsa
->show
= show_stats_lifespan
;
970 hsa
->store
= set_stats_lifespan
;
972 hsa
->port_num
= port_num
;
977 static void setup_hw_stats(struct ib_device
*device
, struct ib_port
*port
,
980 struct attribute_group
*hsag
;
981 struct rdma_hw_stats
*stats
;
984 stats
= device
->ops
.alloc_hw_stats(device
, port_num
);
989 if (!stats
->names
|| stats
->num_counters
<= 0)
993 * Two extra attribute elements here, one for the lifespan entry and
994 * one to NULL terminate the list for the sysfs core code
996 hsag
= kzalloc(sizeof(*hsag
) +
997 sizeof(void *) * (stats
->num_counters
+ 2),
1000 goto err_free_stats
;
1002 ret
= device
->ops
.get_hw_stats(device
, stats
, port_num
,
1003 stats
->num_counters
);
1004 if (ret
!= stats
->num_counters
)
1007 stats
->timestamp
= jiffies
;
1009 hsag
->name
= "hw_counters";
1010 hsag
->attrs
= (void *)hsag
+ sizeof(*hsag
);
1012 for (i
= 0; i
< stats
->num_counters
; i
++) {
1013 hsag
->attrs
[i
] = alloc_hsa(i
, port_num
, stats
->names
[i
]);
1014 if (!hsag
->attrs
[i
])
1016 sysfs_attr_init(hsag
->attrs
[i
]);
1019 mutex_init(&stats
->lock
);
1020 /* treat an error here as non-fatal */
1021 hsag
->attrs
[i
] = alloc_hsa_lifespan("lifespan", port_num
);
1023 sysfs_attr_init(hsag
->attrs
[i
]);
1026 struct kobject
*kobj
= &port
->kobj
;
1027 ret
= sysfs_create_group(kobj
, hsag
);
1030 port
->hw_stats_ag
= hsag
;
1031 port
->hw_stats
= stats
;
1032 if (device
->port_data
)
1033 device
->port_data
[port_num
].hw_stats
= stats
;
1035 struct kobject
*kobj
= &device
->dev
.kobj
;
1036 ret
= sysfs_create_group(kobj
, hsag
);
1039 device
->hw_stats_ag
= hsag
;
1040 device
->hw_stats
= stats
;
1047 kfree(hsag
->attrs
[i
]);
1055 static int add_port(struct ib_core_device
*coredev
, int port_num
)
1057 struct ib_device
*device
= rdma_device_to_ibdev(&coredev
->dev
);
1058 bool is_full_dev
= &device
->coredev
== coredev
;
1060 struct ib_port_attr attr
;
1064 ret
= ib_query_port(device
, port_num
, &attr
);
1068 p
= kzalloc(sizeof *p
, GFP_KERNEL
);
1073 p
->port_num
= port_num
;
1075 ret
= kobject_init_and_add(&p
->kobj
, &port_type
,
1076 coredev
->ports_kobj
,
1082 p
->gid_attr_group
= kzalloc(sizeof(*p
->gid_attr_group
), GFP_KERNEL
);
1083 if (!p
->gid_attr_group
) {
1088 p
->gid_attr_group
->port
= p
;
1089 ret
= kobject_init_and_add(&p
->gid_attr_group
->kobj
, &gid_attr_type
,
1090 &p
->kobj
, "gid_attrs");
1092 goto err_put_gid_attrs
;
1095 if (device
->ops
.process_mad
&& is_full_dev
) {
1096 p
->pma_table
= get_counter_table(device
, port_num
);
1097 ret
= sysfs_create_group(&p
->kobj
, p
->pma_table
);
1099 goto err_put_gid_attrs
;
1102 p
->gid_group
.name
= "gids";
1103 p
->gid_group
.attrs
= alloc_group_attrs(show_port_gid
, attr
.gid_tbl_len
);
1104 if (!p
->gid_group
.attrs
) {
1106 goto err_remove_pma
;
1109 ret
= sysfs_create_group(&p
->kobj
, &p
->gid_group
);
1113 p
->gid_attr_group
->ndev
.name
= "ndevs";
1114 p
->gid_attr_group
->ndev
.attrs
= alloc_group_attrs(show_port_gid_attr_ndev
,
1116 if (!p
->gid_attr_group
->ndev
.attrs
) {
1118 goto err_remove_gid
;
1121 ret
= sysfs_create_group(&p
->gid_attr_group
->kobj
,
1122 &p
->gid_attr_group
->ndev
);
1124 goto err_free_gid_ndev
;
1126 p
->gid_attr_group
->type
.name
= "types";
1127 p
->gid_attr_group
->type
.attrs
= alloc_group_attrs(show_port_gid_attr_gid_type
,
1129 if (!p
->gid_attr_group
->type
.attrs
) {
1131 goto err_remove_gid_ndev
;
1134 ret
= sysfs_create_group(&p
->gid_attr_group
->kobj
,
1135 &p
->gid_attr_group
->type
);
1137 goto err_free_gid_type
;
1139 if (attr
.pkey_tbl_len
) {
1140 p
->pkey_group
= kzalloc(sizeof(*p
->pkey_group
), GFP_KERNEL
);
1141 if (!p
->pkey_group
) {
1143 goto err_remove_gid_type
;
1146 p
->pkey_group
->name
= "pkeys";
1147 p
->pkey_group
->attrs
= alloc_group_attrs(show_port_pkey
,
1149 if (!p
->pkey_group
->attrs
) {
1151 goto err_free_pkey_group
;
1154 ret
= sysfs_create_group(&p
->kobj
, p
->pkey_group
);
1160 if (device
->ops
.init_port
&& is_full_dev
) {
1161 ret
= device
->ops
.init_port(device
, port_num
, &p
->kobj
);
1163 goto err_remove_pkey
;
1167 * If port == 0, it means hw_counters are per device and not per
1168 * port, so holder should be device. Therefore skip per port counter
1171 if (device
->ops
.alloc_hw_stats
&& port_num
&& is_full_dev
)
1172 setup_hw_stats(device
, p
, port_num
);
1174 list_add_tail(&p
->kobj
.entry
, &coredev
->port_list
);
1176 kobject_uevent(&p
->kobj
, KOBJ_ADD
);
1181 sysfs_remove_group(&p
->kobj
, p
->pkey_group
);
1184 if (p
->pkey_group
) {
1185 for (i
= 0; i
< attr
.pkey_tbl_len
; ++i
)
1186 kfree(p
->pkey_group
->attrs
[i
]);
1188 kfree(p
->pkey_group
->attrs
);
1189 p
->pkey_group
->attrs
= NULL
;
1192 err_free_pkey_group
:
1193 kfree(p
->pkey_group
);
1195 err_remove_gid_type
:
1196 sysfs_remove_group(&p
->gid_attr_group
->kobj
,
1197 &p
->gid_attr_group
->type
);
1200 for (i
= 0; i
< attr
.gid_tbl_len
; ++i
)
1201 kfree(p
->gid_attr_group
->type
.attrs
[i
]);
1203 kfree(p
->gid_attr_group
->type
.attrs
);
1204 p
->gid_attr_group
->type
.attrs
= NULL
;
1206 err_remove_gid_ndev
:
1207 sysfs_remove_group(&p
->gid_attr_group
->kobj
,
1208 &p
->gid_attr_group
->ndev
);
1211 for (i
= 0; i
< attr
.gid_tbl_len
; ++i
)
1212 kfree(p
->gid_attr_group
->ndev
.attrs
[i
]);
1214 kfree(p
->gid_attr_group
->ndev
.attrs
);
1215 p
->gid_attr_group
->ndev
.attrs
= NULL
;
1218 sysfs_remove_group(&p
->kobj
, &p
->gid_group
);
1221 for (i
= 0; i
< attr
.gid_tbl_len
; ++i
)
1222 kfree(p
->gid_group
.attrs
[i
]);
1224 kfree(p
->gid_group
.attrs
);
1225 p
->gid_group
.attrs
= NULL
;
1229 sysfs_remove_group(&p
->kobj
, p
->pma_table
);
1232 kobject_put(&p
->gid_attr_group
->kobj
);
1235 kobject_put(&p
->kobj
);
1239 static const char *node_type_string(int node_type
)
1241 switch (node_type
) {
1242 case RDMA_NODE_IB_CA
:
1244 case RDMA_NODE_IB_SWITCH
:
1246 case RDMA_NODE_IB_ROUTER
:
1248 case RDMA_NODE_RNIC
:
1250 case RDMA_NODE_USNIC
:
1252 case RDMA_NODE_USNIC_UDP
:
1254 case RDMA_NODE_UNSPECIFIED
:
1255 return "unspecified";
1260 static ssize_t
node_type_show(struct device
*device
,
1261 struct device_attribute
*attr
, char *buf
)
1263 struct ib_device
*dev
= rdma_device_to_ibdev(device
);
1265 return sysfs_emit(buf
, "%d: %s\n", dev
->node_type
,
1266 node_type_string(dev
->node_type
));
1268 static DEVICE_ATTR_RO(node_type
);
1270 static ssize_t
sys_image_guid_show(struct device
*device
,
1271 struct device_attribute
*dev_attr
, char *buf
)
1273 struct ib_device
*dev
= rdma_device_to_ibdev(device
);
1274 __be16
*guid
= (__be16
*)&dev
->attrs
.sys_image_guid
;
1276 return sysfs_emit(buf
, "%04x:%04x:%04x:%04x\n",
1277 be16_to_cpu(guid
[0]),
1278 be16_to_cpu(guid
[1]),
1279 be16_to_cpu(guid
[2]),
1280 be16_to_cpu(guid
[3]));
1282 static DEVICE_ATTR_RO(sys_image_guid
);
1284 static ssize_t
node_guid_show(struct device
*device
,
1285 struct device_attribute
*attr
, char *buf
)
1287 struct ib_device
*dev
= rdma_device_to_ibdev(device
);
1288 __be16
*node_guid
= (__be16
*)&dev
->node_guid
;
1290 return sysfs_emit(buf
, "%04x:%04x:%04x:%04x\n",
1291 be16_to_cpu(node_guid
[0]),
1292 be16_to_cpu(node_guid
[1]),
1293 be16_to_cpu(node_guid
[2]),
1294 be16_to_cpu(node_guid
[3]));
1296 static DEVICE_ATTR_RO(node_guid
);
1298 static ssize_t
node_desc_show(struct device
*device
,
1299 struct device_attribute
*attr
, char *buf
)
1301 struct ib_device
*dev
= rdma_device_to_ibdev(device
);
1303 return sysfs_emit(buf
, "%.64s\n", dev
->node_desc
);
1306 static ssize_t
node_desc_store(struct device
*device
,
1307 struct device_attribute
*attr
,
1308 const char *buf
, size_t count
)
1310 struct ib_device
*dev
= rdma_device_to_ibdev(device
);
1311 struct ib_device_modify desc
= {};
1314 if (!dev
->ops
.modify_device
)
1317 memcpy(desc
.node_desc
, buf
, min_t(int, count
, IB_DEVICE_NODE_DESC_MAX
));
1318 ret
= ib_modify_device(dev
, IB_DEVICE_MODIFY_NODE_DESC
, &desc
);
1324 static DEVICE_ATTR_RW(node_desc
);
1326 static ssize_t
fw_ver_show(struct device
*device
, struct device_attribute
*attr
,
1329 struct ib_device
*dev
= rdma_device_to_ibdev(device
);
1330 char version
[IB_FW_VERSION_NAME_MAX
] = {};
1332 ib_get_device_fw_str(dev
, version
);
1334 return sysfs_emit(buf
, "%s\n", version
);
1336 static DEVICE_ATTR_RO(fw_ver
);
1338 static struct attribute
*ib_dev_attrs
[] = {
1339 &dev_attr_node_type
.attr
,
1340 &dev_attr_node_guid
.attr
,
1341 &dev_attr_sys_image_guid
.attr
,
1342 &dev_attr_fw_ver
.attr
,
1343 &dev_attr_node_desc
.attr
,
1347 const struct attribute_group ib_dev_attr_group
= {
1348 .attrs
= ib_dev_attrs
,
1351 void ib_free_port_attrs(struct ib_core_device
*coredev
)
1353 struct ib_device
*device
= rdma_device_to_ibdev(&coredev
->dev
);
1354 bool is_full_dev
= &device
->coredev
== coredev
;
1355 struct kobject
*p
, *t
;
1357 list_for_each_entry_safe(p
, t
, &coredev
->port_list
, entry
) {
1358 struct ib_port
*port
= container_of(p
, struct ib_port
, kobj
);
1360 list_del(&p
->entry
);
1361 if (port
->hw_stats_ag
)
1362 free_hsag(&port
->kobj
, port
->hw_stats_ag
);
1363 kfree(port
->hw_stats
);
1364 if (device
->port_data
&& is_full_dev
)
1365 device
->port_data
[port
->port_num
].hw_stats
= NULL
;
1367 if (port
->pma_table
)
1368 sysfs_remove_group(p
, port
->pma_table
);
1369 if (port
->pkey_group
)
1370 sysfs_remove_group(p
, port
->pkey_group
);
1371 sysfs_remove_group(p
, &port
->gid_group
);
1372 sysfs_remove_group(&port
->gid_attr_group
->kobj
,
1373 &port
->gid_attr_group
->ndev
);
1374 sysfs_remove_group(&port
->gid_attr_group
->kobj
,
1375 &port
->gid_attr_group
->type
);
1376 kobject_put(&port
->gid_attr_group
->kobj
);
1380 kobject_put(coredev
->ports_kobj
);
1383 int ib_setup_port_attrs(struct ib_core_device
*coredev
)
1385 struct ib_device
*device
= rdma_device_to_ibdev(&coredev
->dev
);
1389 coredev
->ports_kobj
= kobject_create_and_add("ports",
1390 &coredev
->dev
.kobj
);
1391 if (!coredev
->ports_kobj
)
1394 rdma_for_each_port (device
, port
) {
1395 ret
= add_port(coredev
, port
);
1403 ib_free_port_attrs(coredev
);
1407 int ib_device_register_sysfs(struct ib_device
*device
)
1411 ret
= ib_setup_port_attrs(&device
->coredev
);
1415 if (device
->ops
.alloc_hw_stats
)
1416 setup_hw_stats(device
, NULL
, 0);
1421 void ib_device_unregister_sysfs(struct ib_device
*device
)
1423 if (device
->hw_stats_ag
)
1424 free_hsag(&device
->dev
.kobj
, device
->hw_stats_ag
);
1425 kfree(device
->hw_stats
);
1427 ib_free_port_attrs(&device
->coredev
);
1431 * ib_port_register_module_stat - add module counters under relevant port
1434 * @device: IB device to add counters
1435 * @port_num: valid port number
1436 * @kobj: pointer to the kobject to initialize
1437 * @ktype: pointer to the ktype for this kobject.
1438 * @name: the name of the kobject
1440 int ib_port_register_module_stat(struct ib_device
*device
, u8 port_num
,
1441 struct kobject
*kobj
, struct kobj_type
*ktype
,
1444 struct kobject
*p
, *t
;
1447 list_for_each_entry_safe(p
, t
, &device
->coredev
.port_list
, entry
) {
1448 struct ib_port
*port
= container_of(p
, struct ib_port
, kobj
);
1450 if (port
->port_num
!= port_num
)
1453 ret
= kobject_init_and_add(kobj
, ktype
, &port
->kobj
, "%s",
1463 EXPORT_SYMBOL(ib_port_register_module_stat
);
1466 * ib_port_unregister_module_stat - release module counters
1467 * @kobj: pointer to the kobject to release
1469 void ib_port_unregister_module_stat(struct kobject
*kobj
)
1473 EXPORT_SYMBOL(ib_port_unregister_module_stat
);