2 * Intel MIC Platform Software Stack (MPSS)
4 * Copyright(c) 2015 Intel Corporation.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License, version 2, as
8 * published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License for more details.
15 * The full GNU General Public License is included in this distribution in
16 * the file called "COPYING".
18 * Intel MIC Coprocessor State Management (COSM) Driver
21 #include <linux/kthread.h>
22 #include "cosm_main.h"
25 * The COSM driver uses SCIF to communicate between the management node and the
26 * MIC cards. SCIF is used to (a) Send a shutdown command to the card (b)
27 * receive a shutdown status back from the card upon completion of shutdown and
28 * (c) receive periodic heartbeat messages from the card used to deduce if the card has crashed.
31 * A COSM server consisting of a SCIF listening endpoint waits for incoming
32 * connections from the card. Upon acceptance of the connection, a separate
33 * work-item is scheduled to handle SCIF message processing for that card. The
34 * life-time of this work-item is therefore the time from which the connection
35 * from a card is accepted to the time at which the connection is closed. A new
36 * work-item starts each time the card boots and is alive till the card (a)
37 * shuts down (b) is reset (c) crashes (d) cosm_client driver on the card is unloaded.
40 * The COSM interactions with SCIF during card shutdown, reset and crash
41 * are as follows:
45 * 1. COSM client on the card invokes orderly_poweroff() in response to SHUTDOWN
46 * message from the host.
47 * 2. Card driver shutdown callback invokes scif_unregister_device(..) resulting
48 * in scif_remove(..) getting called on the card
49 * 3. scif_remove -> scif_stop -> scif_handle_remove_node ->
50 * scif_peer_unregister_device -> device_unregister for the host peer device
51 * 4. During device_unregister remove(..) method of cosm_client is invoked which
52 * closes the COSM SCIF endpoint on the card. This results in a SCIF_DISCNCT
53 * message being sent to host SCIF. SCIF_DISCNCT message processing on the
54 * host SCIF sets the host COSM SCIF endpoint state to DISCONNECTED and wakes
55 * up the host COSM thread blocked in scif_poll(..) resulting in
56 * scif_poll(..) returning POLLHUP.
57 * 5. On the card, scif_peer_release_dev is next called which results in an
58 * SCIF_EXIT message being sent to the host and after receiving the
59 * SCIF_EXIT_ACK from the host the peer device teardown on the card is complete.
61 * 6. As part of the SCIF_EXIT message processing on the host, host sends a
62 * SCIF_REMOVE_NODE to itself corresponding to the card being removed. This
63 * starts a similar SCIF peer device teardown sequence on the host
64 * corresponding to the card being shut down.
68 * The case of interest here is when the card has not been previously shut down
69 * since most of the steps below are skipped in that case:
71 * 1. cosm_stop(..) invokes hw_ops->stop(..) method of the base PCIe driver
72 * which unregisters the SCIF HW device resulting in scif_remove(..) being called on the host.
74 * 2. scif_remove(..) calls scif_disconnect_node(..) which results in a
75 * SCIF_EXIT message being sent to the card.
76 * 3. The card executes scif_stop() as part of SCIF_EXIT message
77 * processing. This results in the COSM endpoint on the card being closed and
78 * the SCIF host peer device on the card getting unregistered similar to
79 * steps 3, 4 and 5 for the card shutdown case above. scif_poll(..) on the
80 * host returns POLLHUP as a result.
81 * 4. On the host, card peer device unregister and SCIF HW remove(..) also
82 * subsequently complete.
86 * If a reset is issued after the card has crashed, there is no SCIF_DISCNCT
87 * message from the card which would result in scif_poll(..) returning
88 * POLLHUP. In this case when the host SCIF driver sends a SCIF_REMOVE_NODE
89 * message to itself resulting in the card SCIF peer device being unregistered,
90 * this results in a scif_peer_release_dev -> scif_cleanup_scifdev ->
91 * scif_invalidate_ep call sequence which sets the endpoint state to
92 * DISCONNECTED and results in scif_poll(..) returning POLLHUP.
/*
 * Tunables for the COSM SCIF server. COSM_SCIF_BACKLOG is the backlog passed
 * to scif_listen() in cosm_scif_listen(). The heartbeat timeout, expressed in
 * seconds and then in milliseconds, is the scif_poll() timeout used by
 * cosm_scif_work(). COSM_HEARTBEAT_SEND_SEC is not defined in the visible
 * part of this file; presumably it comes from cosm_main.h - TODO confirm.
 */
95 #define COSM_SCIF_BACKLOG 16
96 #define COSM_HEARTBEAT_CHECK_DELTA_SEC 10
97 #define COSM_HEARTBEAT_TIMEOUT_SEC \
98 (COSM_HEARTBEAT_SEND_SEC + COSM_HEARTBEAT_CHECK_DELTA_SEC)
99 #define COSM_HEARTBEAT_TIMEOUT_MSEC (COSM_HEARTBEAT_TIMEOUT_SEC * MSEC_PER_SEC)
/* Task created by kthread_run() in cosm_scif_init(); runs cosm_scif_server() */
101 static struct task_struct
*server_thread
;
/* Endpoint opened in cosm_scif_listen() and passed to scif_accept() */
102 static scif_epd_t listen_epd
;
104 /* Publish MIC card's shutdown status to user space MIC daemon */
/*
 * When cdev->shutdown_status_int is not MIC_NOP, hand it to
 * cosm_set_shutdown_status() and then reset the internal copy to MIC_NOP, so
 * a later call finds nothing pending.
 * NOTE(review): lines holding only braces seem to be absent from this
 * listing; confirm the block structure against the original file.
 */
105 static void cosm_update_mic_status(struct cosm_device
*cdev
)
107 if (cdev
->shutdown_status_int
!= MIC_NOP
) {
108 cosm_set_shutdown_status(cdev
, cdev
->shutdown_status_int
);
109 cdev
->shutdown_status_int
= MIC_NOP
;
113 /* Store MIC card's shutdown status internally when it is received */
/*
 * Records shutdown_status in cdev->shutdown_status_int, clears
 * cdev->heartbeat_watchdog_enable and, unless the device is already in
 * MIC_SHUTTING_DOWN, moves it there through cosm_set_state(). A value the
 * switch does not expect is reported with dev_err().
 * NOTE(review): the case labels of the switch and whatever follows the
 * dev_err() call are not visible in this listing, so which values count as
 * expected, and whether the unexpected path returns early, must be confirmed
 * against the original file.
 */
114 static void cosm_shutdown_status_int(struct cosm_device
*cdev
,
115 enum mic_status shutdown_status
)
117 switch (shutdown_status
) {
124 dev_err(&cdev
->dev
, "%s %d Unexpected shutdown_status %d\n",
125 __func__
, __LINE__
, shutdown_status
);
128 cdev
->shutdown_status_int
= shutdown_status
;
129 cdev
->heartbeat_watchdog_enable
= false;
131 if (cdev
->state
!= MIC_SHUTTING_DOWN
)
132 cosm_set_state(cdev
, MIC_SHUTTING_DOWN
);
135 /* Non-blocking recv. Read and process all available messages */
/*
 * Reads sizeof(msg) bytes from cdev->epd with scif_recv() and flags 0, then
 * handles the message: COSM_MSG_SHUTDOWN_STATUS forwards msg.shutdown_status
 * to cosm_shutdown_status_int(), COSM_MSG_HEARTBEAT needs no handling, and
 * anything else is logged with dev_err() as an unknown msg.id.
 * NOTE(review): the local declarations, the loop, the checks on rc and the
 * switch head are missing from this listing. Presumably the switch is on
 * msg.id and the first dev_dbg() is the receive-error path; confirm against
 * the original file.
 */
136 static void cosm_scif_recv(struct cosm_device
*cdev
)
142 rc
= scif_recv(cdev
->epd
, &msg
, sizeof(msg
), 0);
146 dev_dbg(&cdev
->dev
, "%s: %d rc %d\n",
147 __func__
, __LINE__
, rc
);
150 dev_dbg(&cdev
->dev
, "%s: %d rc %d id 0x%llx\n",
151 __func__
, __LINE__
, rc
, msg
.id
);
154 case COSM_MSG_SHUTDOWN_STATUS
:
155 cosm_shutdown_status_int(cdev
, msg
.shutdown_status
);
157 case COSM_MSG_HEARTBEAT
:
158 /* Nothing to do, heartbeat only unblocks scif_poll */
161 dev_err(&cdev
->dev
, "%s: %d unknown msg.id %lld\n",
162 __func__
, __LINE__
, msg
.id
);
168 /* Publish crashed status for this MIC card */
/*
 * Logs a node alive timeout error, records MIC_CRASHED through
 * cosm_shutdown_status_int() and publishes it immediately with
 * cosm_update_mic_status(). cosm_scif_work() calls this when scif_poll()
 * returns 0 while cdev->heartbeat_watchdog_enable is set.
 */
169 static void cosm_set_crashed(struct cosm_device
*cdev
)
171 dev_err(&cdev
->dev
, "node alive timeout\n");
172 cosm_shutdown_status_int(cdev
, MIC_CRASHED
);
173 cosm_update_mic_status(cdev
);
176 /* Send host time to the MIC card to sync system time between host and MIC */
/*
 * Builds a COSM_MSG_SYNC_TIME message, fills msg.timespec using
 * getnstimeofday64() and sends it on cdev->epd with scif_send() and the
 * SCIF_SEND_BLOCK flag. The result is only logged; the function returns void.
 * NOTE(review): the declaration of rc and the condition guarding the
 * dev_err() call are not visible in this listing; presumably the error is
 * logged only when scif_send() fails - confirm.
 */
177 static void cosm_send_time(struct cosm_device
*cdev
)
179 struct cosm_msg msg
= { .id
= COSM_MSG_SYNC_TIME
};
182 getnstimeofday64(&msg
.timespec
);
183 rc
= scif_send(cdev
->epd
, &msg
, sizeof(msg
), SCIF_SEND_BLOCK
);
185 dev_err(&cdev
->dev
, "%s %d scif_send failed rc %d\n",
186 __func__
, __LINE__
, rc
);
190 * Close this cosm_device's endpoint after its peer endpoint on the card has
191 * been closed. In all cases except MIC card crash POLLHUP on the host is
192 * triggered by the client's endpoint being closed.
/*
 * Publishes any pending shutdown status with cosm_update_mic_status() and
 * then closes cdev->epd with scif_close(). cosm_scif_work() calls this when
 * scif_poll() reports POLLHUP.
 * NOTE(review): a line between the scif_close() call and the dev_dbg() call
 * is missing from this listing; check the original for what happens to
 * cdev->epd after the close.
 */
194 static void cosm_scif_close(struct cosm_device
*cdev
)
197 * Because SHUTDOWN_STATUS message is sent by the MIC cards in the
198 * reboot notifier when shutdown is still not complete, we notify mpssd
199 * to reset the card when SCIF endpoint is closed.
201 cosm_update_mic_status(cdev
);
202 scif_close(cdev
->epd
);
204 dev_dbg(&cdev
->dev
, "%s %d\n", __func__
, __LINE__
);
208 * Set card state to ONLINE when a new SCIF connection from a MIC card is
209 * received. Normally the state is BOOTING when the connection comes in, but can
210 * be ONLINE if cosm_client driver on the card was unloaded and then reloaded.
/*
 * When cdev->state is MIC_BOOTING or MIC_ONLINE: copies
 * cdev->sysfs_heartbeat_enable into cdev->heartbeat_watchdog_enable, adopts
 * cdev->newepd as cdev->epd, moves a MIC_BOOTING device to MIC_ONLINE through
 * cosm_set_state() and sends the host time with cosm_send_time(). The
 * dev_warn() naming the current state is presumably the else branch for any
 * other state. put_device() is called on cdev->dev afterwards.
 * NOTE(review): the else line, the local declarations and the return
 * statements are missing from this listing, so the exact return values cannot
 * be stated from here; cosm_scif_work() tests the result for non-zero.
 */
212 static int cosm_set_online(struct cosm_device
*cdev
)
216 if (MIC_BOOTING
== cdev
->state
|| MIC_ONLINE
== cdev
->state
) {
217 cdev
->heartbeat_watchdog_enable
= cdev
->sysfs_heartbeat_enable
;
218 cdev
->epd
= cdev
->newepd
;
219 if (cdev
->state
== MIC_BOOTING
)
220 cosm_set_state(cdev
, MIC_ONLINE
);
221 cosm_send_time(cdev
);
222 dev_dbg(&cdev
->dev
, "%s %d\n", __func__
, __LINE__
);
224 dev_warn(&cdev
->dev
, "%s %d not going online in state: %s\n",
225 __func__
, __LINE__
, cosm_state_string
[cdev
->state
]);
228 /* Drop reference acquired by bus_find_device in the server thread */
229 put_device(&cdev
->dev
);
234 * Work function for handling work for a SCIF connection from a particular MIC
235 * card. It first sets the card state to ONLINE and then calls scif_poll to
236 * block on activity such as incoming messages on the SCIF endpoint. When the
237 * endpoint is closed, the work function exits, completing its life cycle, from
238 * MIC card boot to card shutdown/reset/crash.
/*
 * Takes cdev->cosm_mutex, calls cosm_set_online(), then polls cdev->epd for
 * POLLIN with scif_poll() using COSM_HEARTBEAT_TIMEOUT_MSEC as the timeout.
 * The mutex is released just before the blocking poll and retaken right after
 * it. POLLIN leads to cosm_scif_recv(), POLLHUP to cosm_scif_close(), and a
 * poll result of 0 with cdev->heartbeat_watchdog_enable set leads to
 * cosm_set_crashed(). The mutex is released again before the function ends.
 * NOTE(review): the loop construct, the remainder of the container_of()
 * expression, the check that guards the scif_poll error message and the exit
 * paths are missing from this listing; confirm them against the original
 * file before changing the lock ordering here.
 */
240 void cosm_scif_work(struct work_struct
*work
)
242 struct cosm_device
*cdev
= container_of(work
, struct cosm_device
,
244 struct scif_pollepd pollepd
;
247 mutex_lock(&cdev
->cosm_mutex
);
248 if (cosm_set_online(cdev
))
252 pollepd
.epd
= cdev
->epd
;
253 pollepd
.events
= POLLIN
;
255 /* Drop the mutex before blocking in scif_poll(..) */
256 mutex_unlock(&cdev
->cosm_mutex
);
257 /* poll(..) with timeout on our endpoint */
258 rc
= scif_poll(&pollepd
, 1, COSM_HEARTBEAT_TIMEOUT_MSEC
);
259 mutex_lock(&cdev
->cosm_mutex
);
261 dev_err(&cdev
->dev
, "%s %d scif_poll rc %d\n",
262 __func__
, __LINE__
, rc
);
266 /* There is a message from the card */
267 if (pollepd
.revents
& POLLIN
)
268 cosm_scif_recv(cdev
);
270 /* The peer endpoint is closed or this endpoint disconnected */
271 if (pollepd
.revents
& POLLHUP
) {
272 cosm_scif_close(cdev
);
276 /* Did we timeout from poll? */
277 if (!rc
&& cdev
->heartbeat_watchdog_enable
)
278 cosm_set_crashed(cdev
);
281 dev_dbg(&cdev
->dev
, "%s %d exiting\n", __func__
, __LINE__
);
282 mutex_unlock(&cdev
->cosm_mutex
);
286 * COSM SCIF server thread function. Accepts incoming SCIF connections from MIC
287 * cards, finds the correct cosm_device to associate that connection with and
288 * schedules individual work items for each MIC card.
/*
 * Allows SIGKILL for this thread and loops until kthread_should_stop().
 * Each iteration accepts a connection on listen_epd with scif_accept(), maps
 * the peer to a device with cosm_find_cdev_by_id(port_id.node - 1), stores
 * the accepted endpoint in cdev->newepd and schedules cdev->scif_work.
 * A scif_accept() result other than -ERESTARTSYS is logged with pr_err().
 * NOTE(review): the remaining scif_accept() arguments, the check on rc and
 * any NULL check on the result of cosm_find_cdev_by_id() are not visible in
 * this listing; confirm that cdev is validated before it is dereferenced.
 */
290 static int cosm_scif_server(void *unused
)
292 struct cosm_device
*cdev
;
294 struct scif_port_id port_id
;
297 allow_signal(SIGKILL
);
299 while (!kthread_should_stop()) {
300 rc
= scif_accept(listen_epd
, &port_id
, &newepd
,
303 if (-ERESTARTSYS
!= rc
)
304 pr_err("%s %d rc %d\n", __func__
, __LINE__
, rc
);
309 * Associate the incoming connection with a particular
310 * cosm_device, COSM device ID == SCIF node ID - 1
312 cdev
= cosm_find_cdev_by_id(port_id
.node
- 1);
315 cdev
->newepd
= newepd
;
316 schedule_work(&cdev
->scif_work
);
319 pr_debug("%s %d Server thread stopped\n", __func__
, __LINE__
);
/*
 * Sets up the listening endpoint: opens listen_epd with scif_open(), binds it
 * to SCIF_COSM_LISTEN_PORT with scif_bind() and starts listening with
 * scif_listen() and a backlog of COSM_SCIF_BACKLOG. Each step has a pr_err()
 * message for its failure, and success is noted with pr_debug().
 * NOTE(review): the failure conditions, labels and return statements are
 * missing from this listing. The trailing scif_close(listen_epd) is
 * presumably the error-unwind path only; confirm against the original file.
 */
323 static int cosm_scif_listen(void)
327 listen_epd
= scif_open();
329 pr_err("%s %d scif_open failed\n", __func__
, __LINE__
);
333 rc
= scif_bind(listen_epd
, SCIF_COSM_LISTEN_PORT
);
335 pr_err("%s %d scif_bind failed rc %d\n",
336 __func__
, __LINE__
, rc
);
340 rc
= scif_listen(listen_epd
, COSM_SCIF_BACKLOG
);
342 pr_err("%s %d scif_listen rc %d\n", __func__
, __LINE__
, rc
);
345 pr_debug("%s %d listen_epd set up\n", __func__
, __LINE__
);
348 scif_close(listen_epd
);
/*
 * Logs a debug message and closes listen_epd with scif_close(). Called from
 * cosm_scif_init() and cosm_scif_exit().
 * NOTE(review): a line between the pr_debug() and scif_close() calls is
 * missing from this listing, so a guard around the close may exist; confirm.
 */
353 static void cosm_scif_listen_exit(void)
355 pr_debug("%s %d closing listen_epd\n", __func__
, __LINE__
);
357 scif_close(listen_epd
);
363 * Create a listening SCIF endpoint and a server kthread which accepts incoming
364 * SCIF connections from MIC cards
/*
 * Calls cosm_scif_listen() first, then starts cosm_scif_server() in a kthread
 * named cosm_server through kthread_run(). When kthread_run() returns an
 * error pointer, rc is taken from PTR_ERR() and logged with pr_err().
 * NOTE(review): the condition on the cosm_scif_listen() result, the labels
 * and the return statements are missing from this listing.
 * cosm_scif_listen_exit() is presumably reached only when kthread_run()
 * fails; confirm against the original file.
 */
366 int cosm_scif_init(void)
368 int rc
= cosm_scif_listen();
371 pr_err("%s %d cosm_scif_listen rc %d\n",
372 __func__
, __LINE__
, rc
);
376 server_thread
= kthread_run(cosm_scif_server
, NULL
, "cosm_server");
377 if (IS_ERR(server_thread
)) {
378 rc
= PTR_ERR(server_thread
);
379 pr_err("%s %d kthread_run rc %d\n", __func__
, __LINE__
, rc
);
384 cosm_scif_listen_exit();
389 /* Stop the running server thread and close the listening SCIF endpoint */
/*
 * When server_thread is neither NULL nor an error pointer, sends it SIGKILL
 * with send_sig() and then calls kthread_stop() on it. The signal presumably
 * interrupts a blocked scif_accept(), which cosm_scif_server() treats
 * specially through its -ERESTARTSYS check. cosm_scif_listen_exit() is called
 * last.
 * NOTE(review): the declaration of rc and the condition guarding the pr_err()
 * call are not visible in this listing.
 */
390 void cosm_scif_exit(void)
394 if (!IS_ERR_OR_NULL(server_thread
)) {
395 rc
= send_sig(SIGKILL
, server_thread
, 0);
397 pr_err("%s %d send_sig rc %d\n",
398 __func__
, __LINE__
, rc
);
401 kthread_stop(server_thread
);
404 cosm_scif_listen_exit();