1 // SPDX-License-Identifier: GPL-2.0-only
3 * An implementation of host initiated guest snapshot.
5 * Copyright (C) 2013, Microsoft, Inc.
6 * Author : K. Y. Srinivasan <kys@microsoft.com>
8 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
10 #include <linux/net.h>
11 #include <linux/nls.h>
12 #include <linux/connector.h>
13 #include <linux/workqueue.h>
14 #include <linux/hyperv.h>
15 #include <asm/hyperv-tlfs.h>
17 #include "hyperv_vmbus.h"
18 #include "hv_utils_transport.h"
22 #define VSS_VERSION (VSS_MAJOR << 16 | VSS_MINOR)
24 #define VSS_VER_COUNT 1
25 static const int vss_versions
[] = {
29 #define FW_VER_COUNT 1
30 static const int fw_versions
[] = {
34 /* See comment with struct hv_vss_msg regarding the max VMbus packet size */
35 #define VSS_MAX_PKT_SIZE (HV_HYP_PAGE_SIZE * 2)
38 * Timeout values are based on expectations from host
40 #define VSS_FREEZE_TIMEOUT (15 * 60)
43 * Global state maintained for transaction that is being processed. For a class
44 * of integration services, including the "VSS service", the specified protocol
45 * is a "request/response" protocol which means that there can only be single
46 * outstanding transaction from the host at any given point in time. We use
47 * this to simplify memory management in this driver - we cache and process
48 * only one message at a time.
50 * While the request/response protocol is guaranteed by the host, we further
51 * ensure this by serializing packet processing in this driver - we do not
52 * read additional packets from the VMBus until the current packet is fully handled.
57 int state
; /* hvutil_device_state */
58 int recv_len
; /* number of bytes received. */
59 struct vmbus_channel
*recv_channel
; /* chn we got the request */
60 u64 recv_req_id
; /* request ID. */
61 struct hv_vss_msg
*msg
; /* current message */
65 static void vss_respond_to_host(int error
);
68 * This state maintains the version number registered by the daemon.
70 static int dm_reg_value
;
72 static const char vss_devname
[] = "vmbus/hv_vss";
73 static __u8
*recv_buffer
;
74 static struct hvutil_transport
*hvt
;
76 static void vss_timeout_func(struct work_struct
*dummy
);
77 static void vss_handle_request(struct work_struct
*dummy
);
79 static DECLARE_DELAYED_WORK(vss_timeout_work
, vss_timeout_func
);
80 static DECLARE_WORK(vss_handle_request_work
, vss_handle_request
);
82 static void vss_poll_wrapper(void *channel
)
84 /* Transaction is finished, reset the state here to avoid races. */
85 vss_transaction
.state
= HVUTIL_READY
;
86 tasklet_schedule(&((struct vmbus_channel
*)channel
)->callback_event
);
90 * Callback when data is received from user mode.
93 static void vss_timeout_func(struct work_struct
*dummy
)
96 * Timeout waiting for userspace component to reply happened.
98 pr_warn("VSS: timeout waiting for daemon to reply\n");
99 vss_respond_to_host(HV_E_FAIL
);
101 hv_poll_channel(vss_transaction
.recv_channel
, vss_poll_wrapper
);
104 static void vss_register_done(void)
106 hv_poll_channel(vss_transaction
.recv_channel
, vss_poll_wrapper
);
107 pr_debug("VSS: userspace daemon registered\n");
110 static int vss_handle_handshake(struct hv_vss_msg
*vss_msg
)
112 u32 our_ver
= VSS_OP_REGISTER1
;
114 switch (vss_msg
->vss_hdr
.operation
) {
115 case VSS_OP_REGISTER
:
116 /* Daemon doesn't expect us to reply */
117 dm_reg_value
= VSS_OP_REGISTER
;
119 case VSS_OP_REGISTER1
:
120 /* Daemon expects us to reply with our own version */
121 if (hvutil_transport_send(hvt
, &our_ver
, sizeof(our_ver
),
124 dm_reg_value
= VSS_OP_REGISTER1
;
129 pr_info("VSS: userspace daemon ver. %d connected\n", dm_reg_value
);
133 static int vss_on_msg(void *msg
, int len
)
135 struct hv_vss_msg
*vss_msg
= (struct hv_vss_msg
*)msg
;
137 if (len
!= sizeof(*vss_msg
)) {
138 pr_debug("VSS: Message size does not match length\n");
142 if (vss_msg
->vss_hdr
.operation
== VSS_OP_REGISTER
||
143 vss_msg
->vss_hdr
.operation
== VSS_OP_REGISTER1
) {
145 * Don't process registration messages if we're in the middle
146 * of a transaction processing.
148 if (vss_transaction
.state
> HVUTIL_READY
) {
149 pr_debug("VSS: Got unexpected registration request\n");
153 return vss_handle_handshake(vss_msg
);
154 } else if (vss_transaction
.state
== HVUTIL_USERSPACE_REQ
) {
155 vss_transaction
.state
= HVUTIL_USERSPACE_RECV
;
157 if (vss_msg
->vss_hdr
.operation
== VSS_OP_HOT_BACKUP
)
158 vss_transaction
.msg
->vss_cf
.flags
=
159 VSS_HBU_NO_AUTO_RECOVERY
;
161 if (cancel_delayed_work_sync(&vss_timeout_work
)) {
162 vss_respond_to_host(vss_msg
->error
);
163 /* Transaction is finished, reset the state. */
164 hv_poll_channel(vss_transaction
.recv_channel
,
168 /* This is a spurious call! */
169 pr_debug("VSS: Transaction not active\n");
175 static void vss_send_op(void)
177 int op
= vss_transaction
.msg
->vss_hdr
.operation
;
179 struct hv_vss_msg
*vss_msg
;
181 /* The transaction state is wrong. */
182 if (vss_transaction
.state
!= HVUTIL_HOSTMSG_RECEIVED
) {
183 pr_debug("VSS: Unexpected attempt to send to daemon\n");
187 vss_msg
= kzalloc(sizeof(*vss_msg
), GFP_KERNEL
);
191 vss_msg
->vss_hdr
.operation
= op
;
193 vss_transaction
.state
= HVUTIL_USERSPACE_REQ
;
195 schedule_delayed_work(&vss_timeout_work
, op
== VSS_OP_FREEZE
?
196 VSS_FREEZE_TIMEOUT
* HZ
: HV_UTIL_TIMEOUT
* HZ
);
198 rc
= hvutil_transport_send(hvt
, vss_msg
, sizeof(*vss_msg
), NULL
);
200 pr_warn("VSS: failed to communicate to the daemon: %d\n", rc
);
201 if (cancel_delayed_work_sync(&vss_timeout_work
)) {
202 vss_respond_to_host(HV_E_FAIL
);
203 vss_transaction
.state
= HVUTIL_READY
;
210 static void vss_handle_request(struct work_struct
*dummy
)
212 switch (vss_transaction
.msg
->vss_hdr
.operation
) {
214 * Initiate a "freeze/thaw" operation in the guest.
215 * We respond to the host once the operation is complete.
217 * We send the message to the user space daemon and the operation is
218 * performed in the daemon.
222 case VSS_OP_HOT_BACKUP
:
223 if (vss_transaction
.state
< HVUTIL_READY
) {
224 /* Userspace is not registered yet */
225 pr_debug("VSS: Not ready for request.\n");
226 vss_respond_to_host(HV_E_FAIL
);
230 pr_debug("VSS: Received request for op code: %d\n",
231 vss_transaction
.msg
->vss_hdr
.operation
);
232 vss_transaction
.state
= HVUTIL_HOSTMSG_RECEIVED
;
235 case VSS_OP_GET_DM_INFO
:
236 vss_transaction
.msg
->dm_info
.flags
= 0;
242 vss_respond_to_host(0);
243 hv_poll_channel(vss_transaction
.recv_channel
, vss_poll_wrapper
);
247 * Send a response back to the host.
251 vss_respond_to_host(int error
)
253 struct icmsg_hdr
*icmsghdrp
;
255 struct vmbus_channel
*channel
;
259 * Copy the global state for completing the transaction. Note that
260 * only one transaction can be active at a time.
263 buf_len
= vss_transaction
.recv_len
;
264 channel
= vss_transaction
.recv_channel
;
265 req_id
= vss_transaction
.recv_req_id
;
267 icmsghdrp
= (struct icmsg_hdr
*)
268 &recv_buffer
[sizeof(struct vmbuspipe_hdr
)];
270 if (channel
->onchannel_callback
== NULL
)
272 * We have raced with util driver being unloaded;
277 icmsghdrp
->status
= error
;
279 icmsghdrp
->icflags
= ICMSGHDRFLAG_TRANSACTION
| ICMSGHDRFLAG_RESPONSE
;
281 vmbus_sendpacket(channel
, recv_buffer
, buf_len
, req_id
,
282 VM_PKT_DATA_INBAND
, 0);
287 * This callback is invoked when we get a VSS message from the host.
288 * The host ensures that only one VSS transaction can be active at a time.
291 void hv_vss_onchannelcallback(void *context
)
293 struct vmbus_channel
*channel
= context
;
296 struct hv_vss_msg
*vss_msg
;
299 struct icmsg_hdr
*icmsghdrp
;
301 if (vss_transaction
.state
> HVUTIL_READY
)
304 if (vmbus_recvpacket(channel
, recv_buffer
, VSS_MAX_PKT_SIZE
, &recvlen
, &requestid
)) {
305 pr_err_ratelimited("VSS request received. Could not read into recv buf\n");
312 /* Ensure recvlen is big enough to read header data */
313 if (recvlen
< ICMSG_HDR
) {
314 pr_err_ratelimited("VSS request received. Packet length too small: %d\n",
319 icmsghdrp
= (struct icmsg_hdr
*)&recv_buffer
[sizeof(struct vmbuspipe_hdr
)];
321 if (icmsghdrp
->icmsgtype
== ICMSGTYPE_NEGOTIATE
) {
322 if (vmbus_prep_negotiate_resp(icmsghdrp
,
323 recv_buffer
, recvlen
,
324 fw_versions
, FW_VER_COUNT
,
325 vss_versions
, VSS_VER_COUNT
,
326 NULL
, &vss_srv_version
)) {
328 pr_info("VSS IC version %d.%d\n",
329 vss_srv_version
>> 16,
330 vss_srv_version
& 0xFFFF);
332 } else if (icmsghdrp
->icmsgtype
== ICMSGTYPE_VSS
) {
333 /* Ensure recvlen is big enough to contain hv_vss_msg */
334 if (recvlen
< ICMSG_HDR
+ sizeof(struct hv_vss_msg
)) {
335 pr_err_ratelimited("Invalid VSS msg. Packet length too small: %u\n",
339 vss_msg
= (struct hv_vss_msg
*)&recv_buffer
[ICMSG_HDR
];
342 * Stash away this global state for completing the
343 * transaction; note transactions are serialized.
346 vss_transaction
.recv_len
= recvlen
;
347 vss_transaction
.recv_req_id
= requestid
;
348 vss_transaction
.msg
= (struct hv_vss_msg
*)vss_msg
;
350 schedule_work(&vss_handle_request_work
);
353 pr_err_ratelimited("VSS request received. Invalid msg type: %d\n",
354 icmsghdrp
->icmsgtype
);
358 icmsghdrp
->icflags
= ICMSGHDRFLAG_TRANSACTION
|
359 ICMSGHDRFLAG_RESPONSE
;
360 vmbus_sendpacket(channel
, recv_buffer
, recvlen
, requestid
,
361 VM_PKT_DATA_INBAND
, 0);
364 static void vss_on_reset(void)
366 if (cancel_delayed_work_sync(&vss_timeout_work
))
367 vss_respond_to_host(HV_E_FAIL
);
368 vss_transaction
.state
= HVUTIL_DEVICE_INIT
;
372 hv_vss_init(struct hv_util_service
*srv
)
374 if (vmbus_proto_version
< VERSION_WIN8_1
) {
375 pr_warn("Integration service 'Backup (volume snapshot)'"
376 " not supported on this host version.\n");
379 recv_buffer
= srv
->recv_buffer
;
380 vss_transaction
.recv_channel
= srv
->channel
;
381 vss_transaction
.recv_channel
->max_pkt_size
= VSS_MAX_PKT_SIZE
;
384 * When this driver loads, the user level daemon that
385 * processes the host requests may not yet be running.
386 * Defer processing channel callbacks until the daemon
389 vss_transaction
.state
= HVUTIL_DEVICE_INIT
;
391 hvt
= hvutil_transport_init(vss_devname
, CN_VSS_IDX
, CN_VSS_VAL
,
392 vss_on_msg
, vss_on_reset
);
394 pr_warn("VSS: Failed to initialize transport\n");
401 static void hv_vss_cancel_work(void)
403 cancel_delayed_work_sync(&vss_timeout_work
);
404 cancel_work_sync(&vss_handle_request_work
);
407 int hv_vss_pre_suspend(void)
409 struct vmbus_channel
*channel
= vss_transaction
.recv_channel
;
410 struct hv_vss_msg
*vss_msg
;
413 * Fake a THAW message for the user space daemon in case the daemon
414 * has frozen the file systems. It doesn't matter if there is already
415 * a message pending to be delivered to the user space since we force
416 * vss_transaction.state to be HVUTIL_READY, so the user space daemon's
417 * write() will fail with EINVAL (see vss_on_msg()), and the daemon
418 * will reset the device by closing and re-opening it.
420 vss_msg
= kzalloc(sizeof(*vss_msg
), GFP_KERNEL
);
424 tasklet_disable(&channel
->callback_event
);
426 vss_msg
->vss_hdr
.operation
= VSS_OP_THAW
;
428 /* Cancel any possible pending work. */
429 hv_vss_cancel_work();
431 /* We don't care about the return value. */
432 hvutil_transport_send(hvt
, vss_msg
, sizeof(*vss_msg
), NULL
);
436 vss_transaction
.state
= HVUTIL_READY
;
438 /* tasklet_enable() will be called in hv_vss_pre_resume(). */
442 int hv_vss_pre_resume(void)
444 struct vmbus_channel
*channel
= vss_transaction
.recv_channel
;
446 tasklet_enable(&channel
->callback_event
);
451 void hv_vss_deinit(void)
453 vss_transaction
.state
= HVUTIL_DEVICE_DYING
;
455 hv_vss_cancel_work();
457 hvutil_transport_destroy(hvt
);