1 // SPDX-License-Identifier: GPL-2.0
3 * Networking over Thunderbolt cable using Apple ThunderboltIP protocol
5 * Copyright (C) 2017, Intel Corporation
6 * Authors: Amir Levy <amir.jer.levy@intel.com>
7 * Michael Jamet <michael.jamet@intel.com>
8 * Mika Westerberg <mika.westerberg@linux.intel.com>
11 #include <linux/atomic.h>
12 #include <linux/highmem.h>
13 #include <linux/if_vlan.h>
14 #include <linux/jhash.h>
15 #include <linux/module.h>
16 #include <linux/etherdevice.h>
17 #include <linux/rtnetlink.h>
18 #include <linux/sizes.h>
19 #include <linux/thunderbolt.h>
20 #include <linux/uuid.h>
21 #include <linux/workqueue.h>
23 #include <net/ip6_checksum.h>
25 /* Protocol timeouts in ms */
26 #define TBNET_LOGIN_DELAY 4500
27 #define TBNET_LOGIN_TIMEOUT 500
28 #define TBNET_LOGOUT_TIMEOUT 100
30 #define TBNET_RING_SIZE 256
31 #define TBNET_LOCAL_PATH 0xf
32 #define TBNET_LOGIN_RETRIES 60
33 #define TBNET_LOGOUT_RETRIES 5
34 #define TBNET_MATCH_FRAGS_ID BIT(1)
35 #define TBNET_MAX_MTU SZ_64K
36 #define TBNET_FRAME_SIZE SZ_4K
37 #define TBNET_MAX_PAYLOAD_SIZE \
38 (TBNET_FRAME_SIZE - sizeof(struct thunderbolt_ip_frame_header))
39 /* Rx packets need to hold space for skb_shared_info */
40 #define TBNET_RX_MAX_SIZE \
41 (TBNET_FRAME_SIZE + SKB_DATA_ALIGN(sizeof(struct skb_shared_info)))
42 #define TBNET_RX_PAGE_ORDER get_order(TBNET_RX_MAX_SIZE)
43 #define TBNET_RX_PAGE_SIZE (PAGE_SIZE << TBNET_RX_PAGE_ORDER)
45 #define TBNET_L0_PORT_NUM(route) ((route) & GENMASK(5, 0))
48 * struct thunderbolt_ip_frame_header - Header for each Thunderbolt frame
49 * @frame_size: size of the data within the frame
50 * @frame_index: running index on the frames
51 * @frame_id: ID of the frame to match frames to specific packet
52 * @frame_count: how many frames assemble a full packet
54 * Each data frame passed to the high-speed DMA ring has this header. If
55 * the XDomain network directory announces that %TBNET_MATCH_FRAGS_ID is
56 * supported then @frame_id is filled, otherwise it stays %0.
58 struct thunderbolt_ip_frame_header
{
65 enum thunderbolt_ip_frame_pdf
{
66 TBIP_PDF_FRAME_START
= 1,
70 enum thunderbolt_ip_type
{
77 struct thunderbolt_ip_header
{
82 uuid_t initiator_uuid
;
88 #define TBIP_HDR_LENGTH_MASK GENMASK(5, 0)
89 #define TBIP_HDR_SN_MASK GENMASK(28, 27)
90 #define TBIP_HDR_SN_SHIFT 27
92 struct thunderbolt_ip_login
{
93 struct thunderbolt_ip_header hdr
;
99 #define TBIP_LOGIN_PROTO_VERSION 1
101 struct thunderbolt_ip_login_response
{
102 struct thunderbolt_ip_header hdr
;
105 u32 receiver_mac_len
;
109 struct thunderbolt_ip_logout
{
110 struct thunderbolt_ip_header hdr
;
113 struct thunderbolt_ip_status
{
114 struct thunderbolt_ip_header hdr
;
125 u64 rx_length_errors
;
128 u64 rx_missed_errors
;
132 struct net_device
*dev
;
134 struct ring_frame frame
;
138 struct tbnet_frame frames
[TBNET_RING_SIZE
];
141 struct tb_ring
*ring
;
145 * struct tbnet - ThunderboltIP network driver private data
146 * @svc: XDomain service the driver is bound to
147 * @xd: XDomain the service belongs to
148 * @handler: ThunderboltIP configuration protocol handler
149 * @dev: Networking device
150 * @napi: NAPI structure for Rx polling
151 * @stats: Network statistics
152 * @skb: Network packet that is currently processed on Rx path
153 * @command_id: ID used for next configuration protocol packet
154 * @login_sent: ThunderboltIP login message successfully sent
155 * @login_received: ThunderboltIP login message received from the remote
157 * @transmit_path: HopID the other end needs to use building the
158 * opposite side path.
159 * @connection_lock: Lock serializing access to @login_sent,
160 * @login_received and @transmit_path.
161 * @login_retries: Number of login retries currently done
162 * @login_work: Worker to send ThunderboltIP login packets
163 * @connected_work: Worker that finalizes the ThunderboltIP connection
164 * setup and enables DMA paths for high speed data
166 * @disconnect_work: Worker that handles tearing down the ThunderboltIP
168 * @rx_hdr: Copy of the currently processed Rx frame. Used when a
169 * network packet consists of multiple Thunderbolt frames.
170 * In host byte order.
171 * @rx_ring: Software ring holding Rx frames
172 * @frame_id: Frame ID used for next Tx packet
173 * (if %TBNET_MATCH_FRAGS_ID is supported in both ends)
174 * @tx_ring: Software ring holding Tx frames
177 const struct tb_service
*svc
;
178 struct tb_xdomain
*xd
;
179 struct tb_protocol_handler handler
;
180 struct net_device
*dev
;
181 struct napi_struct napi
;
182 struct tbnet_stats stats
;
188 struct mutex connection_lock
;
190 struct delayed_work login_work
;
191 struct work_struct connected_work
;
192 struct work_struct disconnect_work
;
193 struct thunderbolt_ip_frame_header rx_hdr
;
194 struct tbnet_ring rx_ring
;
196 struct tbnet_ring tx_ring
;
199 /* Network property directory UUID: c66189ca-1cce-4195-bdb8-49592e5f5a4f */
200 static const uuid_t tbnet_dir_uuid
=
201 UUID_INIT(0xc66189ca, 0x1cce, 0x4195,
202 0xbd, 0xb8, 0x49, 0x59, 0x2e, 0x5f, 0x5a, 0x4f);
204 /* ThunderboltIP protocol UUID: 798f589e-3616-8a47-97c6-5664a920c8dd */
205 static const uuid_t tbnet_svc_uuid
=
206 UUID_INIT(0x798f589e, 0x3616, 0x8a47,
207 0x97, 0xc6, 0x56, 0x64, 0xa9, 0x20, 0xc8, 0xdd);
209 static struct tb_property_dir
*tbnet_dir
;
211 static void tbnet_fill_header(struct thunderbolt_ip_header
*hdr
, u64 route
,
212 u8 sequence
, const uuid_t
*initiator_uuid
, const uuid_t
*target_uuid
,
213 enum thunderbolt_ip_type type
, size_t size
, u32 command_id
)
217 /* Length does not include route_hi/lo and length_sn fields */
218 length_sn
= (size
- 3 * 4) / 4;
219 length_sn
|= (sequence
<< TBIP_HDR_SN_SHIFT
) & TBIP_HDR_SN_MASK
;
221 hdr
->route_hi
= upper_32_bits(route
);
222 hdr
->route_lo
= lower_32_bits(route
);
223 hdr
->length_sn
= length_sn
;
224 uuid_copy(&hdr
->uuid
, &tbnet_svc_uuid
);
225 uuid_copy(&hdr
->initiator_uuid
, initiator_uuid
);
226 uuid_copy(&hdr
->target_uuid
, target_uuid
);
228 hdr
->command_id
= command_id
;
231 static int tbnet_login_response(struct tbnet
*net
, u64 route
, u8 sequence
,
234 struct thunderbolt_ip_login_response reply
;
235 struct tb_xdomain
*xd
= net
->xd
;
237 memset(&reply
, 0, sizeof(reply
));
238 tbnet_fill_header(&reply
.hdr
, route
, sequence
, xd
->local_uuid
,
239 xd
->remote_uuid
, TBIP_LOGIN_RESPONSE
, sizeof(reply
),
241 memcpy(reply
.receiver_mac
, net
->dev
->dev_addr
, ETH_ALEN
);
242 reply
.receiver_mac_len
= ETH_ALEN
;
244 return tb_xdomain_response(xd
, &reply
, sizeof(reply
),
245 TB_CFG_PKG_XDOMAIN_RESP
);
248 static int tbnet_login_request(struct tbnet
*net
, u8 sequence
)
250 struct thunderbolt_ip_login_response reply
;
251 struct thunderbolt_ip_login request
;
252 struct tb_xdomain
*xd
= net
->xd
;
254 memset(&request
, 0, sizeof(request
));
255 tbnet_fill_header(&request
.hdr
, xd
->route
, sequence
, xd
->local_uuid
,
256 xd
->remote_uuid
, TBIP_LOGIN
, sizeof(request
),
257 atomic_inc_return(&net
->command_id
));
259 request
.proto_version
= TBIP_LOGIN_PROTO_VERSION
;
260 request
.transmit_path
= TBNET_LOCAL_PATH
;
262 return tb_xdomain_request(xd
, &request
, sizeof(request
),
263 TB_CFG_PKG_XDOMAIN_RESP
, &reply
,
264 sizeof(reply
), TB_CFG_PKG_XDOMAIN_RESP
,
265 TBNET_LOGIN_TIMEOUT
);
268 static int tbnet_logout_response(struct tbnet
*net
, u64 route
, u8 sequence
,
271 struct thunderbolt_ip_status reply
;
272 struct tb_xdomain
*xd
= net
->xd
;
274 memset(&reply
, 0, sizeof(reply
));
275 tbnet_fill_header(&reply
.hdr
, route
, sequence
, xd
->local_uuid
,
276 xd
->remote_uuid
, TBIP_STATUS
, sizeof(reply
),
277 atomic_inc_return(&net
->command_id
));
278 return tb_xdomain_response(xd
, &reply
, sizeof(reply
),
279 TB_CFG_PKG_XDOMAIN_RESP
);
282 static int tbnet_logout_request(struct tbnet
*net
)
284 struct thunderbolt_ip_logout request
;
285 struct thunderbolt_ip_status reply
;
286 struct tb_xdomain
*xd
= net
->xd
;
288 memset(&request
, 0, sizeof(request
));
289 tbnet_fill_header(&request
.hdr
, xd
->route
, 0, xd
->local_uuid
,
290 xd
->remote_uuid
, TBIP_LOGOUT
, sizeof(request
),
291 atomic_inc_return(&net
->command_id
));
293 return tb_xdomain_request(xd
, &request
, sizeof(request
),
294 TB_CFG_PKG_XDOMAIN_RESP
, &reply
,
295 sizeof(reply
), TB_CFG_PKG_XDOMAIN_RESP
,
296 TBNET_LOGOUT_TIMEOUT
);
299 static void start_login(struct tbnet
*net
)
301 mutex_lock(&net
->connection_lock
);
302 net
->login_sent
= false;
303 net
->login_received
= false;
304 mutex_unlock(&net
->connection_lock
);
306 queue_delayed_work(system_long_wq
, &net
->login_work
,
307 msecs_to_jiffies(1000));
310 static void stop_login(struct tbnet
*net
)
312 cancel_delayed_work_sync(&net
->login_work
);
313 cancel_work_sync(&net
->connected_work
);
316 static inline unsigned int tbnet_frame_size(const struct tbnet_frame
*tf
)
318 return tf
->frame
.size
? : TBNET_FRAME_SIZE
;
321 static void tbnet_free_buffers(struct tbnet_ring
*ring
)
325 for (i
= 0; i
< TBNET_RING_SIZE
; i
++) {
326 struct device
*dma_dev
= tb_ring_dma_device(ring
->ring
);
327 struct tbnet_frame
*tf
= &ring
->frames
[i
];
328 enum dma_data_direction dir
;
335 if (ring
->ring
->is_tx
) {
338 size
= TBNET_FRAME_SIZE
;
340 dir
= DMA_FROM_DEVICE
;
341 order
= TBNET_RX_PAGE_ORDER
;
342 size
= TBNET_RX_PAGE_SIZE
;
345 if (tf
->frame
.buffer_phy
)
346 dma_unmap_page(dma_dev
, tf
->frame
.buffer_phy
, size
,
349 __free_pages(tf
->page
, order
);
357 static void tbnet_tear_down(struct tbnet
*net
, bool send_logout
)
359 netif_carrier_off(net
->dev
);
360 netif_stop_queue(net
->dev
);
364 mutex_lock(&net
->connection_lock
);
366 if (net
->login_sent
&& net
->login_received
) {
367 int retries
= TBNET_LOGOUT_RETRIES
;
369 while (send_logout
&& retries
-- > 0) {
370 int ret
= tbnet_logout_request(net
);
371 if (ret
!= -ETIMEDOUT
)
375 tb_ring_stop(net
->rx_ring
.ring
);
376 tb_ring_stop(net
->tx_ring
.ring
);
377 tbnet_free_buffers(&net
->rx_ring
);
378 tbnet_free_buffers(&net
->tx_ring
);
380 if (tb_xdomain_disable_paths(net
->xd
))
381 netdev_warn(net
->dev
, "failed to disable DMA paths\n");
384 net
->login_retries
= 0;
385 net
->login_sent
= false;
386 net
->login_received
= false;
388 mutex_unlock(&net
->connection_lock
);
391 static int tbnet_handle_packet(const void *buf
, size_t size
, void *data
)
393 const struct thunderbolt_ip_login
*pkg
= buf
;
394 struct tbnet
*net
= data
;
400 /* Make sure the packet is for us */
401 if (size
< sizeof(struct thunderbolt_ip_header
))
403 if (!uuid_equal(&pkg
->hdr
.initiator_uuid
, net
->xd
->remote_uuid
))
405 if (!uuid_equal(&pkg
->hdr
.target_uuid
, net
->xd
->local_uuid
))
408 route
= ((u64
)pkg
->hdr
.route_hi
<< 32) | pkg
->hdr
.route_lo
;
409 route
&= ~BIT_ULL(63);
410 if (route
!= net
->xd
->route
)
413 sequence
= pkg
->hdr
.length_sn
& TBIP_HDR_SN_MASK
;
414 sequence
>>= TBIP_HDR_SN_SHIFT
;
415 command_id
= pkg
->hdr
.command_id
;
417 switch (pkg
->hdr
.type
) {
419 if (!netif_running(net
->dev
))
422 ret
= tbnet_login_response(net
, route
, sequence
,
423 pkg
->hdr
.command_id
);
425 mutex_lock(&net
->connection_lock
);
426 net
->login_received
= true;
427 net
->transmit_path
= pkg
->transmit_path
;
429 /* If we reached the number of max retries or
430 * previous logout, schedule another round of
433 if (net
->login_retries
>= TBNET_LOGIN_RETRIES
||
435 net
->login_retries
= 0;
436 queue_delayed_work(system_long_wq
,
437 &net
->login_work
, 0);
439 mutex_unlock(&net
->connection_lock
);
441 queue_work(system_long_wq
, &net
->connected_work
);
446 ret
= tbnet_logout_response(net
, route
, sequence
, command_id
);
448 queue_work(system_long_wq
, &net
->disconnect_work
);
456 netdev_warn(net
->dev
, "failed to send ThunderboltIP response\n");
461 static unsigned int tbnet_available_buffers(const struct tbnet_ring
*ring
)
463 return ring
->prod
- ring
->cons
;
466 static int tbnet_alloc_rx_buffers(struct tbnet
*net
, unsigned int nbuffers
)
468 struct tbnet_ring
*ring
= &net
->rx_ring
;
472 struct device
*dma_dev
= tb_ring_dma_device(ring
->ring
);
473 unsigned int index
= ring
->prod
& (TBNET_RING_SIZE
- 1);
474 struct tbnet_frame
*tf
= &ring
->frames
[index
];
480 /* Allocate page (order > 0) so that it can hold maximum
481 * ThunderboltIP frame (4kB) and the additional room for
482 * SKB shared info required by build_skb().
484 tf
->page
= dev_alloc_pages(TBNET_RX_PAGE_ORDER
);
490 dma_addr
= dma_map_page(dma_dev
, tf
->page
, 0,
491 TBNET_RX_PAGE_SIZE
, DMA_FROM_DEVICE
);
492 if (dma_mapping_error(dma_dev
, dma_addr
)) {
497 tf
->frame
.buffer_phy
= dma_addr
;
500 tb_ring_rx(ring
->ring
, &tf
->frame
);
508 tbnet_free_buffers(ring
);
512 static struct tbnet_frame
*tbnet_get_tx_buffer(struct tbnet
*net
)
514 struct tbnet_ring
*ring
= &net
->tx_ring
;
515 struct device
*dma_dev
= tb_ring_dma_device(ring
->ring
);
516 struct tbnet_frame
*tf
;
519 if (!tbnet_available_buffers(ring
))
522 index
= ring
->cons
++ & (TBNET_RING_SIZE
- 1);
524 tf
= &ring
->frames
[index
];
527 dma_sync_single_for_cpu(dma_dev
, tf
->frame
.buffer_phy
,
528 tbnet_frame_size(tf
), DMA_TO_DEVICE
);
533 static void tbnet_tx_callback(struct tb_ring
*ring
, struct ring_frame
*frame
,
536 struct tbnet_frame
*tf
= container_of(frame
, typeof(*tf
), frame
);
537 struct tbnet
*net
= netdev_priv(tf
->dev
);
539 /* Return buffer to the ring */
542 if (tbnet_available_buffers(&net
->tx_ring
) >= TBNET_RING_SIZE
/ 2)
543 netif_wake_queue(net
->dev
);
546 static int tbnet_alloc_tx_buffers(struct tbnet
*net
)
548 struct tbnet_ring
*ring
= &net
->tx_ring
;
549 struct device
*dma_dev
= tb_ring_dma_device(ring
->ring
);
552 for (i
= 0; i
< TBNET_RING_SIZE
; i
++) {
553 struct tbnet_frame
*tf
= &ring
->frames
[i
];
556 tf
->page
= alloc_page(GFP_KERNEL
);
558 tbnet_free_buffers(ring
);
562 dma_addr
= dma_map_page(dma_dev
, tf
->page
, 0, TBNET_FRAME_SIZE
,
564 if (dma_mapping_error(dma_dev
, dma_addr
)) {
565 __free_page(tf
->page
);
567 tbnet_free_buffers(ring
);
572 tf
->frame
.buffer_phy
= dma_addr
;
573 tf
->frame
.callback
= tbnet_tx_callback
;
574 tf
->frame
.sof
= TBIP_PDF_FRAME_START
;
575 tf
->frame
.eof
= TBIP_PDF_FRAME_END
;
579 ring
->prod
= TBNET_RING_SIZE
- 1;
584 static void tbnet_connected_work(struct work_struct
*work
)
586 struct tbnet
*net
= container_of(work
, typeof(*net
), connected_work
);
590 if (netif_carrier_ok(net
->dev
))
593 mutex_lock(&net
->connection_lock
);
594 connected
= net
->login_sent
&& net
->login_received
;
595 mutex_unlock(&net
->connection_lock
);
600 /* Both logins successful so enable the high-speed DMA paths and
601 * start the network device queue.
603 ret
= tb_xdomain_enable_paths(net
->xd
, TBNET_LOCAL_PATH
,
604 net
->rx_ring
.ring
->hop
,
606 net
->tx_ring
.ring
->hop
);
608 netdev_err(net
->dev
, "failed to enable DMA paths\n");
612 tb_ring_start(net
->tx_ring
.ring
);
613 tb_ring_start(net
->rx_ring
.ring
);
615 ret
= tbnet_alloc_rx_buffers(net
, TBNET_RING_SIZE
);
619 ret
= tbnet_alloc_tx_buffers(net
);
621 goto err_free_rx_buffers
;
623 netif_carrier_on(net
->dev
);
624 netif_start_queue(net
->dev
);
628 tbnet_free_buffers(&net
->rx_ring
);
630 tb_ring_stop(net
->rx_ring
.ring
);
631 tb_ring_stop(net
->tx_ring
.ring
);
634 static void tbnet_login_work(struct work_struct
*work
)
636 struct tbnet
*net
= container_of(work
, typeof(*net
), login_work
.work
);
637 unsigned long delay
= msecs_to_jiffies(TBNET_LOGIN_DELAY
);
640 if (netif_carrier_ok(net
->dev
))
643 ret
= tbnet_login_request(net
, net
->login_retries
% 4);
645 if (net
->login_retries
++ < TBNET_LOGIN_RETRIES
) {
646 queue_delayed_work(system_long_wq
, &net
->login_work
,
649 netdev_info(net
->dev
, "ThunderboltIP login timed out\n");
652 net
->login_retries
= 0;
654 mutex_lock(&net
->connection_lock
);
655 net
->login_sent
= true;
656 mutex_unlock(&net
->connection_lock
);
658 queue_work(system_long_wq
, &net
->connected_work
);
662 static void tbnet_disconnect_work(struct work_struct
*work
)
664 struct tbnet
*net
= container_of(work
, typeof(*net
), disconnect_work
);
666 tbnet_tear_down(net
, false);
669 static bool tbnet_check_frame(struct tbnet
*net
, const struct tbnet_frame
*tf
,
670 const struct thunderbolt_ip_frame_header
*hdr
)
672 u32 frame_id
, frame_count
, frame_size
, frame_index
;
675 if (tf
->frame
.flags
& RING_DESC_CRC_ERROR
) {
676 net
->stats
.rx_crc_errors
++;
678 } else if (tf
->frame
.flags
& RING_DESC_BUFFER_OVERRUN
) {
679 net
->stats
.rx_over_errors
++;
683 /* Should be greater than just header i.e. contains data */
684 size
= tbnet_frame_size(tf
);
685 if (size
<= sizeof(*hdr
)) {
686 net
->stats
.rx_length_errors
++;
690 frame_count
= le32_to_cpu(hdr
->frame_count
);
691 frame_size
= le32_to_cpu(hdr
->frame_size
);
692 frame_index
= le16_to_cpu(hdr
->frame_index
);
693 frame_id
= le16_to_cpu(hdr
->frame_id
);
695 if ((frame_size
> size
- sizeof(*hdr
)) || !frame_size
) {
696 net
->stats
.rx_length_errors
++;
700 /* In case we're in the middle of packet, validate the frame
701 * header based on first fragment of the packet.
703 if (net
->skb
&& net
->rx_hdr
.frame_count
) {
704 /* Check the frame count fits the count field */
705 if (frame_count
!= net
->rx_hdr
.frame_count
) {
706 net
->stats
.rx_length_errors
++;
710 /* Check the frame identifiers are incremented correctly,
711 * and id is matching.
713 if (frame_index
!= net
->rx_hdr
.frame_index
+ 1 ||
714 frame_id
!= net
->rx_hdr
.frame_id
) {
715 net
->stats
.rx_missed_errors
++;
719 if (net
->skb
->len
+ frame_size
> TBNET_MAX_MTU
) {
720 net
->stats
.rx_length_errors
++;
727 /* Start of packet, validate the frame header */
728 if (frame_count
== 0 || frame_count
> TBNET_RING_SIZE
/ 4) {
729 net
->stats
.rx_length_errors
++;
732 if (frame_index
!= 0) {
733 net
->stats
.rx_missed_errors
++;
740 static int tbnet_poll(struct napi_struct
*napi
, int budget
)
742 struct tbnet
*net
= container_of(napi
, struct tbnet
, napi
);
743 unsigned int cleaned_count
= tbnet_available_buffers(&net
->rx_ring
);
744 struct device
*dma_dev
= tb_ring_dma_device(net
->rx_ring
.ring
);
745 unsigned int rx_packets
= 0;
747 while (rx_packets
< budget
) {
748 const struct thunderbolt_ip_frame_header
*hdr
;
749 unsigned int hdr_size
= sizeof(*hdr
);
750 struct sk_buff
*skb
= NULL
;
751 struct ring_frame
*frame
;
752 struct tbnet_frame
*tf
;
757 /* Return some buffers to hardware, one at a time is too
758 * slow so allocate MAX_SKB_FRAGS buffers at the same
761 if (cleaned_count
>= MAX_SKB_FRAGS
) {
762 tbnet_alloc_rx_buffers(net
, cleaned_count
);
766 frame
= tb_ring_poll(net
->rx_ring
.ring
);
770 dma_unmap_page(dma_dev
, frame
->buffer_phy
,
771 TBNET_RX_PAGE_SIZE
, DMA_FROM_DEVICE
);
773 tf
= container_of(frame
, typeof(*tf
), frame
);
780 hdr
= page_address(page
);
781 if (!tbnet_check_frame(net
, tf
, hdr
)) {
782 __free_pages(page
, TBNET_RX_PAGE_ORDER
);
783 dev_kfree_skb_any(net
->skb
);
788 frame_size
= le32_to_cpu(hdr
->frame_size
);
792 skb
= build_skb(page_address(page
),
795 __free_pages(page
, TBNET_RX_PAGE_ORDER
);
796 net
->stats
.rx_errors
++;
800 skb_reserve(skb
, hdr_size
);
801 skb_put(skb
, frame_size
);
805 skb_add_rx_frag(skb
, skb_shinfo(skb
)->nr_frags
,
806 page
, hdr_size
, frame_size
,
807 TBNET_RX_PAGE_SIZE
- hdr_size
);
810 net
->rx_hdr
.frame_size
= frame_size
;
811 net
->rx_hdr
.frame_count
= le32_to_cpu(hdr
->frame_count
);
812 net
->rx_hdr
.frame_index
= le16_to_cpu(hdr
->frame_index
);
813 net
->rx_hdr
.frame_id
= le16_to_cpu(hdr
->frame_id
);
814 last
= net
->rx_hdr
.frame_index
== net
->rx_hdr
.frame_count
- 1;
817 net
->stats
.rx_bytes
+= frame_size
;
820 skb
->protocol
= eth_type_trans(skb
, net
->dev
);
821 napi_gro_receive(&net
->napi
, skb
);
826 net
->stats
.rx_packets
+= rx_packets
;
829 tbnet_alloc_rx_buffers(net
, cleaned_count
);
831 if (rx_packets
>= budget
)
834 napi_complete_done(napi
, rx_packets
);
835 /* Re-enable the ring interrupt */
836 tb_ring_poll_complete(net
->rx_ring
.ring
);
841 static void tbnet_start_poll(void *data
)
843 struct tbnet
*net
= data
;
845 napi_schedule(&net
->napi
);
848 static int tbnet_open(struct net_device
*dev
)
850 struct tbnet
*net
= netdev_priv(dev
);
851 struct tb_xdomain
*xd
= net
->xd
;
852 u16 sof_mask
, eof_mask
;
853 struct tb_ring
*ring
;
855 netif_carrier_off(dev
);
857 ring
= tb_ring_alloc_tx(xd
->tb
->nhi
, -1, TBNET_RING_SIZE
,
860 netdev_err(dev
, "failed to allocate Tx ring\n");
863 net
->tx_ring
.ring
= ring
;
865 sof_mask
= BIT(TBIP_PDF_FRAME_START
);
866 eof_mask
= BIT(TBIP_PDF_FRAME_END
);
868 ring
= tb_ring_alloc_rx(xd
->tb
->nhi
, -1, TBNET_RING_SIZE
,
869 RING_FLAG_FRAME
| RING_FLAG_E2E
, sof_mask
,
870 eof_mask
, tbnet_start_poll
, net
);
872 netdev_err(dev
, "failed to allocate Rx ring\n");
873 tb_ring_free(net
->tx_ring
.ring
);
874 net
->tx_ring
.ring
= NULL
;
877 net
->rx_ring
.ring
= ring
;
879 napi_enable(&net
->napi
);
885 static int tbnet_stop(struct net_device
*dev
)
887 struct tbnet
*net
= netdev_priv(dev
);
889 napi_disable(&net
->napi
);
891 cancel_work_sync(&net
->disconnect_work
);
892 tbnet_tear_down(net
, true);
894 tb_ring_free(net
->rx_ring
.ring
);
895 net
->rx_ring
.ring
= NULL
;
896 tb_ring_free(net
->tx_ring
.ring
);
897 net
->tx_ring
.ring
= NULL
;
902 static bool tbnet_xmit_csum_and_map(struct tbnet
*net
, struct sk_buff
*skb
,
903 struct tbnet_frame
**frames
, u32 frame_count
)
905 struct thunderbolt_ip_frame_header
*hdr
= page_address(frames
[0]->page
);
906 struct device
*dma_dev
= tb_ring_dma_device(net
->tx_ring
.ring
);
907 __wsum wsum
= htonl(skb
->len
- skb_transport_offset(skb
));
908 unsigned int i
, len
, offset
= skb_transport_offset(skb
);
909 __be16 protocol
= skb
->protocol
;
910 void *data
= skb
->data
;
911 void *dest
= hdr
+ 1;
914 if (skb
->ip_summed
!= CHECKSUM_PARTIAL
) {
915 /* No need to calculate checksum so we just update the
916 * total frame count and sync the frames for DMA.
918 for (i
= 0; i
< frame_count
; i
++) {
919 hdr
= page_address(frames
[i
]->page
);
920 hdr
->frame_count
= cpu_to_le32(frame_count
);
921 dma_sync_single_for_device(dma_dev
,
922 frames
[i
]->frame
.buffer_phy
,
923 tbnet_frame_size(frames
[i
]), DMA_TO_DEVICE
);
929 if (protocol
== htons(ETH_P_8021Q
)) {
930 struct vlan_hdr
*vhdr
, vh
;
932 vhdr
= skb_header_pointer(skb
, ETH_HLEN
, sizeof(vh
), &vh
);
936 protocol
= vhdr
->h_vlan_encapsulated_proto
;
939 /* Data points on the beginning of packet.
940 * Check is the checksum absolute place in the packet.
941 * ipcso will update IP checksum.
942 * tucso will update TCP/UDP checksum.
944 if (protocol
== htons(ETH_P_IP
)) {
945 __sum16
*ipcso
= dest
+ ((void *)&(ip_hdr(skb
)->check
) - data
);
948 *ipcso
= ip_fast_csum(dest
+ skb_network_offset(skb
),
951 if (ip_hdr(skb
)->protocol
== IPPROTO_TCP
)
952 tucso
= dest
+ ((void *)&(tcp_hdr(skb
)->check
) - data
);
953 else if (ip_hdr(skb
)->protocol
== IPPROTO_UDP
)
954 tucso
= dest
+ ((void *)&(udp_hdr(skb
)->check
) - data
);
958 *tucso
= ~csum_tcpudp_magic(ip_hdr(skb
)->saddr
,
959 ip_hdr(skb
)->daddr
, 0,
960 ip_hdr(skb
)->protocol
, 0);
961 } else if (skb_is_gso_v6(skb
)) {
962 tucso
= dest
+ ((void *)&(tcp_hdr(skb
)->check
) - data
);
963 *tucso
= ~csum_ipv6_magic(&ipv6_hdr(skb
)->saddr
,
964 &ipv6_hdr(skb
)->daddr
, 0,
967 } else if (protocol
== htons(ETH_P_IPV6
)) {
968 tucso
= dest
+ skb_checksum_start_offset(skb
) + skb
->csum_offset
;
969 *tucso
= ~csum_ipv6_magic(&ipv6_hdr(skb
)->saddr
,
970 &ipv6_hdr(skb
)->daddr
, 0,
971 ipv6_hdr(skb
)->nexthdr
, 0);
976 /* First frame was headers, rest of the frames contain data.
977 * Calculate checksum over each frame.
979 for (i
= 0; i
< frame_count
; i
++) {
980 hdr
= page_address(frames
[i
]->page
);
981 dest
= (void *)(hdr
+ 1) + offset
;
982 len
= le32_to_cpu(hdr
->frame_size
) - offset
;
983 wsum
= csum_partial(dest
, len
, wsum
);
984 hdr
->frame_count
= cpu_to_le32(frame_count
);
989 *tucso
= csum_fold(wsum
);
991 /* Checksum is finally calculated and we don't touch the memory
992 * anymore, so DMA sync the frames now.
994 for (i
= 0; i
< frame_count
; i
++) {
995 dma_sync_single_for_device(dma_dev
, frames
[i
]->frame
.buffer_phy
,
996 tbnet_frame_size(frames
[i
]), DMA_TO_DEVICE
);
1002 static void *tbnet_kmap_frag(struct sk_buff
*skb
, unsigned int frag_num
,
1005 const skb_frag_t
*frag
= &skb_shinfo(skb
)->frags
[frag_num
];
1007 *len
= skb_frag_size(frag
);
1008 return kmap_atomic(skb_frag_page(frag
)) + frag
->page_offset
;
1011 static netdev_tx_t
tbnet_start_xmit(struct sk_buff
*skb
,
1012 struct net_device
*dev
)
1014 struct tbnet
*net
= netdev_priv(dev
);
1015 struct tbnet_frame
*frames
[MAX_SKB_FRAGS
];
1016 u16 frame_id
= atomic_read(&net
->frame_id
);
1017 struct thunderbolt_ip_frame_header
*hdr
;
1018 unsigned int len
= skb_headlen(skb
);
1019 unsigned int data_len
= skb
->len
;
1020 unsigned int nframes
, i
;
1021 unsigned int frag
= 0;
1022 void *src
= skb
->data
;
1023 u32 frame_index
= 0;
1027 nframes
= DIV_ROUND_UP(data_len
, TBNET_MAX_PAYLOAD_SIZE
);
1028 if (tbnet_available_buffers(&net
->tx_ring
) < nframes
) {
1029 netif_stop_queue(net
->dev
);
1030 return NETDEV_TX_BUSY
;
1033 frames
[frame_index
] = tbnet_get_tx_buffer(net
);
1034 if (!frames
[frame_index
])
1037 hdr
= page_address(frames
[frame_index
]->page
);
1040 /* If overall packet is bigger than the frame data size */
1041 while (data_len
> TBNET_MAX_PAYLOAD_SIZE
) {
1042 unsigned int size_left
= TBNET_MAX_PAYLOAD_SIZE
;
1044 hdr
->frame_size
= cpu_to_le32(TBNET_MAX_PAYLOAD_SIZE
);
1045 hdr
->frame_index
= cpu_to_le16(frame_index
);
1046 hdr
->frame_id
= cpu_to_le16(frame_id
);
1049 if (len
> size_left
) {
1050 /* Copy data onto Tx buffer data with
1051 * full frame size then break and go to
1054 memcpy(dest
, src
, size_left
);
1061 memcpy(dest
, src
, len
);
1070 /* Ensure all fragments have been processed */
1071 if (frag
< skb_shinfo(skb
)->nr_frags
) {
1072 /* Map and then unmap quickly */
1073 src
= tbnet_kmap_frag(skb
, frag
++, &len
);
1075 } else if (unlikely(size_left
> 0)) {
1078 } while (size_left
> 0);
1080 data_len
-= TBNET_MAX_PAYLOAD_SIZE
;
1083 frames
[frame_index
] = tbnet_get_tx_buffer(net
);
1084 if (!frames
[frame_index
])
1087 hdr
= page_address(frames
[frame_index
]->page
);
1091 hdr
->frame_size
= cpu_to_le32(data_len
);
1092 hdr
->frame_index
= cpu_to_le16(frame_index
);
1093 hdr
->frame_id
= cpu_to_le16(frame_id
);
1095 frames
[frame_index
]->frame
.size
= data_len
+ sizeof(*hdr
);
1097 /* In case the remaining data_len is smaller than a frame */
1098 while (len
< data_len
) {
1099 memcpy(dest
, src
, len
);
1108 if (frag
< skb_shinfo(skb
)->nr_frags
) {
1109 src
= tbnet_kmap_frag(skb
, frag
++, &len
);
1111 } else if (unlikely(data_len
> 0)) {
1116 memcpy(dest
, src
, data_len
);
1121 if (!tbnet_xmit_csum_and_map(net
, skb
, frames
, frame_index
+ 1))
1124 for (i
= 0; i
< frame_index
+ 1; i
++)
1125 tb_ring_tx(net
->tx_ring
.ring
, &frames
[i
]->frame
);
1127 if (net
->svc
->prtcstns
& TBNET_MATCH_FRAGS_ID
)
1128 atomic_inc(&net
->frame_id
);
1130 net
->stats
.tx_packets
++;
1131 net
->stats
.tx_bytes
+= skb
->len
;
1133 dev_consume_skb_any(skb
);
1135 return NETDEV_TX_OK
;
1138 /* We can re-use the buffers */
1139 net
->tx_ring
.cons
-= frame_index
;
1141 dev_kfree_skb_any(skb
);
1142 net
->stats
.tx_errors
++;
1144 return NETDEV_TX_OK
;
1147 static void tbnet_get_stats64(struct net_device
*dev
,
1148 struct rtnl_link_stats64
*stats
)
1150 struct tbnet
*net
= netdev_priv(dev
);
1152 stats
->tx_packets
= net
->stats
.tx_packets
;
1153 stats
->rx_packets
= net
->stats
.rx_packets
;
1154 stats
->tx_bytes
= net
->stats
.tx_bytes
;
1155 stats
->rx_bytes
= net
->stats
.rx_bytes
;
1156 stats
->rx_errors
= net
->stats
.rx_errors
+ net
->stats
.rx_length_errors
+
1157 net
->stats
.rx_over_errors
+ net
->stats
.rx_crc_errors
+
1158 net
->stats
.rx_missed_errors
;
1159 stats
->tx_errors
= net
->stats
.tx_errors
;
1160 stats
->rx_length_errors
= net
->stats
.rx_length_errors
;
1161 stats
->rx_over_errors
= net
->stats
.rx_over_errors
;
1162 stats
->rx_crc_errors
= net
->stats
.rx_crc_errors
;
1163 stats
->rx_missed_errors
= net
->stats
.rx_missed_errors
;
1166 static const struct net_device_ops tbnet_netdev_ops
= {
1167 .ndo_open
= tbnet_open
,
1168 .ndo_stop
= tbnet_stop
,
1169 .ndo_start_xmit
= tbnet_start_xmit
,
1170 .ndo_get_stats64
= tbnet_get_stats64
,
1173 static void tbnet_generate_mac(struct net_device
*dev
)
1175 const struct tbnet
*net
= netdev_priv(dev
);
1176 const struct tb_xdomain
*xd
= net
->xd
;
1180 phy_port
= tb_phy_port_from_link(TBNET_L0_PORT_NUM(xd
->route
));
1182 /* Unicast and locally administered MAC */
1183 dev
->dev_addr
[0] = phy_port
<< 4 | 0x02;
1184 hash
= jhash2((u32
*)xd
->local_uuid
, 4, 0);
1185 memcpy(dev
->dev_addr
+ 1, &hash
, sizeof(hash
));
1186 hash
= jhash2((u32
*)xd
->local_uuid
, 4, hash
);
1187 dev
->dev_addr
[5] = hash
& 0xff;
1190 static int tbnet_probe(struct tb_service
*svc
, const struct tb_service_id
*id
)
1192 struct tb_xdomain
*xd
= tb_service_parent(svc
);
1193 struct net_device
*dev
;
1197 dev
= alloc_etherdev(sizeof(*net
));
1201 SET_NETDEV_DEV(dev
, &svc
->dev
);
1203 net
= netdev_priv(dev
);
1204 INIT_DELAYED_WORK(&net
->login_work
, tbnet_login_work
);
1205 INIT_WORK(&net
->connected_work
, tbnet_connected_work
);
1206 INIT_WORK(&net
->disconnect_work
, tbnet_disconnect_work
);
1207 mutex_init(&net
->connection_lock
);
1208 atomic_set(&net
->command_id
, 0);
1209 atomic_set(&net
->frame_id
, 0);
1214 tbnet_generate_mac(dev
);
1216 strcpy(dev
->name
, "thunderbolt%d");
1217 dev
->netdev_ops
= &tbnet_netdev_ops
;
1219 /* ThunderboltIP takes advantage of TSO packets but instead of
1220 * segmenting them we just split the packet into Thunderbolt
1221 * frames (maximum payload size of each frame is 4084 bytes) and
1222 * calculate checksum over the whole packet here.
1224 * The receiving side does the opposite if the host OS supports
1225 * LRO, otherwise it needs to split the large packet into MTU
1226 * sized smaller packets.
1228 * In order to receive large packets from the networking stack,
1229 * we need to announce support for most of the offloading
1232 dev
->hw_features
= NETIF_F_SG
| NETIF_F_ALL_TSO
| NETIF_F_GRO
|
1233 NETIF_F_IP_CSUM
| NETIF_F_IPV6_CSUM
;
1234 dev
->features
= dev
->hw_features
| NETIF_F_HIGHDMA
;
1235 dev
->hard_header_len
+= sizeof(struct thunderbolt_ip_frame_header
);
1237 netif_napi_add(dev
, &net
->napi
, tbnet_poll
, NAPI_POLL_WEIGHT
);
1239 /* MTU range: 68 - 65522 */
1240 dev
->min_mtu
= ETH_MIN_MTU
;
1241 dev
->max_mtu
= TBNET_MAX_MTU
- ETH_HLEN
;
1243 net
->handler
.uuid
= &tbnet_svc_uuid
;
1244 net
->handler
.callback
= tbnet_handle_packet
,
1245 net
->handler
.data
= net
;
1246 tb_register_protocol_handler(&net
->handler
);
1248 tb_service_set_drvdata(svc
, net
);
1250 ret
= register_netdev(dev
);
1252 tb_unregister_protocol_handler(&net
->handler
);
1260 static void tbnet_remove(struct tb_service
*svc
)
1262 struct tbnet
*net
= tb_service_get_drvdata(svc
);
1264 unregister_netdev(net
->dev
);
1265 tb_unregister_protocol_handler(&net
->handler
);
1266 free_netdev(net
->dev
);
1269 static void tbnet_shutdown(struct tb_service
*svc
)
1271 tbnet_tear_down(tb_service_get_drvdata(svc
), true);
1274 static int __maybe_unused
tbnet_suspend(struct device
*dev
)
1276 struct tb_service
*svc
= tb_to_service(dev
);
1277 struct tbnet
*net
= tb_service_get_drvdata(svc
);
1280 if (netif_running(net
->dev
)) {
1281 netif_device_detach(net
->dev
);
1282 tbnet_tear_down(net
, true);
1285 tb_unregister_protocol_handler(&net
->handler
);
1289 static int __maybe_unused
tbnet_resume(struct device
*dev
)
1291 struct tb_service
*svc
= tb_to_service(dev
);
1292 struct tbnet
*net
= tb_service_get_drvdata(svc
);
1294 tb_register_protocol_handler(&net
->handler
);
1296 netif_carrier_off(net
->dev
);
1297 if (netif_running(net
->dev
)) {
1298 netif_device_attach(net
->dev
);
1305 static const struct dev_pm_ops tbnet_pm_ops
= {
1306 SET_SYSTEM_SLEEP_PM_OPS(tbnet_suspend
, tbnet_resume
)
1309 static const struct tb_service_id tbnet_ids
[] = {
1310 { TB_SERVICE("network", 1) },
1313 MODULE_DEVICE_TABLE(tbsvc
, tbnet_ids
);
1315 static struct tb_service_driver tbnet_driver
= {
1317 .owner
= THIS_MODULE
,
1318 .name
= "thunderbolt-net",
1319 .pm
= &tbnet_pm_ops
,
1321 .probe
= tbnet_probe
,
1322 .remove
= tbnet_remove
,
1323 .shutdown
= tbnet_shutdown
,
1324 .id_table
= tbnet_ids
,
1327 static int __init
tbnet_init(void)
1331 tbnet_dir
= tb_property_create_dir(&tbnet_dir_uuid
);
1335 tb_property_add_immediate(tbnet_dir
, "prtcid", 1);
1336 tb_property_add_immediate(tbnet_dir
, "prtcvers", 1);
1337 tb_property_add_immediate(tbnet_dir
, "prtcrevs", 1);
1338 tb_property_add_immediate(tbnet_dir
, "prtcstns",
1339 TBNET_MATCH_FRAGS_ID
);
1341 ret
= tb_register_property_dir("network", tbnet_dir
);
1343 tb_property_free_dir(tbnet_dir
);
1347 return tb_register_service_driver(&tbnet_driver
);
1349 module_init(tbnet_init
);
1351 static void __exit
tbnet_exit(void)
1353 tb_unregister_service_driver(&tbnet_driver
);
1354 tb_unregister_property_dir("network", tbnet_dir
);
1355 tb_property_free_dir(tbnet_dir
);
1357 module_exit(tbnet_exit
);
1359 MODULE_AUTHOR("Amir Levy <amir.jer.levy@intel.com>");
1360 MODULE_AUTHOR("Michael Jamet <michael.jamet@intel.com>");
1361 MODULE_AUTHOR("Mika Westerberg <mika.westerberg@linux.intel.com>");
1362 MODULE_DESCRIPTION("Thunderbolt network driver");
1363 MODULE_LICENSE("GPL v2");