/*
 * Copyright (c) 2010, Microsoft Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
 * Place - Suite 330, Boston, MA 02111-1307 USA.
 *
 * Authors:
 *   Haiyang Zhang <haiyangz@microsoft.com>
 *   Hank Janssen  <hjanssen@microsoft.com>
 */
21 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
23 #include <linux/kernel.h>
24 #include <linux/init.h>
25 #include <linux/module.h>
26 #include <linux/slab.h>
27 #include <linux/sysctl.h>
28 #include <linux/reboot.h>
29 #include <linux/hyperv.h>
30 #include <linux/clockchips.h>
31 #include <linux/ptp_clock_kernel.h>
32 #include <asm/mshyperv.h>
34 #include "hyperv_vmbus.h"
/*
 * Protocol versions of the shutdown (SD), time-sync (TS) and heartbeat (HB)
 * services.  A version is packed as (major << 16) | minor, which is the same
 * layout the channel callbacks unpack when they log the negotiated version.
 *
 * NOTE(review): the *_MAJOR / *_MINOR values are not visible in this excerpt
 * and were restored from the upstream driver - confirm before merging.
 */
#define SD_MAJOR	3
#define SD_MINOR	0
#define SD_VERSION	((SD_MAJOR << 16) | SD_MINOR)

#define SD_MAJOR_1	1
#define SD_VERSION_1	((SD_MAJOR_1 << 16) | SD_MINOR)

#define TS_MAJOR	4
#define TS_MINOR	0
#define TS_VERSION	((TS_MAJOR << 16) | TS_MINOR)

#define TS_MAJOR_1	1
#define TS_VERSION_1	((TS_MAJOR_1 << 16) | TS_MINOR)

#define TS_MAJOR_3	3
#define TS_VERSION_3	((TS_MAJOR_3 << 16) | TS_MINOR)

#define HB_MAJOR	3
#define HB_MINOR	0
#define HB_VERSION	((HB_MAJOR << 16) | HB_MINOR)

#define HB_MAJOR_1	1
#define HB_VERSION_1	((HB_MAJOR_1 << 16) | HB_MINOR)
60 static int sd_srv_version
;
61 static int ts_srv_version
;
62 static int hb_srv_version
;
64 #define SD_VER_COUNT 2
65 static const int sd_versions
[] = {
70 #define TS_VER_COUNT 3
71 static const int ts_versions
[] = {
77 #define HB_VER_COUNT 2
78 static const int hb_versions
[] = {
83 #define FW_VER_COUNT 2
84 static const int fw_versions
[] = {
89 static void shutdown_onchannelcallback(void *context
);
90 static struct hv_util_service util_shutdown
= {
91 .util_cb
= shutdown_onchannelcallback
,
94 static int hv_timesync_init(struct hv_util_service
*srv
);
95 static void hv_timesync_deinit(void);
97 static void timesync_onchannelcallback(void *context
);
98 static struct hv_util_service util_timesynch
= {
99 .util_cb
= timesync_onchannelcallback
,
100 .util_init
= hv_timesync_init
,
101 .util_deinit
= hv_timesync_deinit
,
104 static void heartbeat_onchannelcallback(void *context
);
105 static struct hv_util_service util_heartbeat
= {
106 .util_cb
= heartbeat_onchannelcallback
,
109 static struct hv_util_service util_kvp
= {
110 .util_cb
= hv_kvp_onchannelcallback
,
111 .util_init
= hv_kvp_init
,
112 .util_deinit
= hv_kvp_deinit
,
115 static struct hv_util_service util_vss
= {
116 .util_cb
= hv_vss_onchannelcallback
,
117 .util_init
= hv_vss_init
,
118 .util_deinit
= hv_vss_deinit
,
121 static struct hv_util_service util_fcopy
= {
122 .util_cb
= hv_fcopy_onchannelcallback
,
123 .util_init
= hv_fcopy_init
,
124 .util_deinit
= hv_fcopy_deinit
,
127 static void perform_shutdown(struct work_struct
*dummy
)
129 orderly_poweroff(true);
/*
 * Perform the shutdown operation in a thread context: the channel callback
 * only schedules this work item, and perform_shutdown() does the rest.
 */
static DECLARE_WORK(shutdown_work, perform_shutdown);
137 static void shutdown_onchannelcallback(void *context
)
139 struct vmbus_channel
*channel
= context
;
142 bool execute_shutdown
= false;
143 u8
*shut_txf_buf
= util_shutdown
.recv_buffer
;
145 struct shutdown_msg_data
*shutdown_msg
;
147 struct icmsg_hdr
*icmsghdrp
;
149 vmbus_recvpacket(channel
, shut_txf_buf
,
150 PAGE_SIZE
, &recvlen
, &requestid
);
153 icmsghdrp
= (struct icmsg_hdr
*)&shut_txf_buf
[
154 sizeof(struct vmbuspipe_hdr
)];
156 if (icmsghdrp
->icmsgtype
== ICMSGTYPE_NEGOTIATE
) {
157 if (vmbus_prep_negotiate_resp(icmsghdrp
, shut_txf_buf
,
158 fw_versions
, FW_VER_COUNT
,
159 sd_versions
, SD_VER_COUNT
,
160 NULL
, &sd_srv_version
)) {
161 pr_info("Shutdown IC version %d.%d\n",
162 sd_srv_version
>> 16,
163 sd_srv_version
& 0xFFFF);
167 (struct shutdown_msg_data
*)&shut_txf_buf
[
168 sizeof(struct vmbuspipe_hdr
) +
169 sizeof(struct icmsg_hdr
)];
171 switch (shutdown_msg
->flags
) {
174 icmsghdrp
->status
= HV_S_OK
;
175 execute_shutdown
= true;
177 pr_info("Shutdown request received -"
178 " graceful shutdown initiated\n");
181 icmsghdrp
->status
= HV_E_FAIL
;
182 execute_shutdown
= false;
184 pr_info("Shutdown request received -"
185 " Invalid request\n");
190 icmsghdrp
->icflags
= ICMSGHDRFLAG_TRANSACTION
191 | ICMSGHDRFLAG_RESPONSE
;
193 vmbus_sendpacket(channel
, shut_txf_buf
,
195 VM_PKT_DATA_INBAND
, 0);
198 if (execute_shutdown
== true)
199 schedule_work(&shutdown_work
);
203 * Set the host time in a process context.
205 static struct work_struct adj_time_work
;
208 * The last time sample, received from the host. PTP device responds to
209 * requests by using this data and the current partition-wide time reference
218 static struct timespec64
hv_get_adj_host_time(void)
220 struct timespec64 ts
;
221 u64 newtime
, reftime
;
224 spin_lock_irqsave(&host_ts
.lock
, flags
);
225 reftime
= hyperv_cs
->read(hyperv_cs
);
226 newtime
= host_ts
.host_time
+ (reftime
- host_ts
.ref_time
);
227 ts
= ns_to_timespec64((newtime
- WLTIMEDELTA
) * 100);
228 spin_unlock_irqrestore(&host_ts
.lock
, flags
);
233 static void hv_set_host_time(struct work_struct
*work
)
235 struct timespec64 ts
= hv_get_adj_host_time();
237 do_settimeofday64(&ts
);
241 * Synchronize time with host after reboot, restore, etc.
243 * ICTIMESYNCFLAG_SYNC flag bit indicates reboot, restore events of the VM.
244 * After reboot the flag ICTIMESYNCFLAG_SYNC is included in the first time
245 * message after the timesync channel is opened. Since the hv_utils module is
246 * loaded after hv_vmbus, the first message is usually missed. This bit is
247 * considered a hard request to discipline the clock.
249 * ICTIMESYNCFLAG_SAMPLE bit indicates a time sample from host. This is
250 * typically used as a hint to the guest. The guest is under no obligation
251 * to discipline the clock.
253 static inline void adj_guesttime(u64 hosttime
, u64 reftime
, u8 adj_flags
)
259 * Save the adjusted time sample from the host and the snapshot
260 * of the current system time.
262 spin_lock_irqsave(&host_ts
.lock
, flags
);
264 cur_reftime
= hyperv_cs
->read(hyperv_cs
);
265 host_ts
.host_time
= hosttime
;
266 host_ts
.ref_time
= cur_reftime
;
269 * TimeSync v4 messages contain reference time (guest's Hyper-V
270 * clocksource read when the time sample was generated), we can
271 * improve the precision by adding the delta between now and the
272 * time of generation. For older protocols we set
273 * reftime == cur_reftime on call.
275 host_ts
.host_time
+= (cur_reftime
- reftime
);
277 spin_unlock_irqrestore(&host_ts
.lock
, flags
);
279 /* Schedule work to do do_settimeofday64() */
280 if (adj_flags
& ICTIMESYNCFLAG_SYNC
)
281 schedule_work(&adj_time_work
);
285 * Time Sync Channel message handler.
287 static void timesync_onchannelcallback(void *context
)
289 struct vmbus_channel
*channel
= context
;
292 struct icmsg_hdr
*icmsghdrp
;
293 struct ictimesync_data
*timedatap
;
294 struct ictimesync_ref_data
*refdata
;
295 u8
*time_txf_buf
= util_timesynch
.recv_buffer
;
297 vmbus_recvpacket(channel
, time_txf_buf
,
298 PAGE_SIZE
, &recvlen
, &requestid
);
301 icmsghdrp
= (struct icmsg_hdr
*)&time_txf_buf
[
302 sizeof(struct vmbuspipe_hdr
)];
304 if (icmsghdrp
->icmsgtype
== ICMSGTYPE_NEGOTIATE
) {
305 if (vmbus_prep_negotiate_resp(icmsghdrp
, time_txf_buf
,
306 fw_versions
, FW_VER_COUNT
,
307 ts_versions
, TS_VER_COUNT
,
308 NULL
, &ts_srv_version
)) {
309 pr_info("TimeSync IC version %d.%d\n",
310 ts_srv_version
>> 16,
311 ts_srv_version
& 0xFFFF);
314 if (ts_srv_version
> TS_VERSION_3
) {
315 refdata
= (struct ictimesync_ref_data
*)
317 sizeof(struct vmbuspipe_hdr
) +
318 sizeof(struct icmsg_hdr
)];
320 adj_guesttime(refdata
->parenttime
,
321 refdata
->vmreferencetime
,
324 timedatap
= (struct ictimesync_data
*)
326 sizeof(struct vmbuspipe_hdr
) +
327 sizeof(struct icmsg_hdr
)];
328 adj_guesttime(timedatap
->parenttime
,
329 hyperv_cs
->read(hyperv_cs
),
334 icmsghdrp
->icflags
= ICMSGHDRFLAG_TRANSACTION
335 | ICMSGHDRFLAG_RESPONSE
;
337 vmbus_sendpacket(channel
, time_txf_buf
,
339 VM_PKT_DATA_INBAND
, 0);
344 * Heartbeat functionality.
345 * Every two seconds, Hyper-V send us a heartbeat request message.
346 * we respond to this message, and Hyper-V knows we are alive.
348 static void heartbeat_onchannelcallback(void *context
)
350 struct vmbus_channel
*channel
= context
;
353 struct icmsg_hdr
*icmsghdrp
;
354 struct heartbeat_msg_data
*heartbeat_msg
;
355 u8
*hbeat_txf_buf
= util_heartbeat
.recv_buffer
;
359 vmbus_recvpacket(channel
, hbeat_txf_buf
,
360 PAGE_SIZE
, &recvlen
, &requestid
);
365 icmsghdrp
= (struct icmsg_hdr
*)&hbeat_txf_buf
[
366 sizeof(struct vmbuspipe_hdr
)];
368 if (icmsghdrp
->icmsgtype
== ICMSGTYPE_NEGOTIATE
) {
369 if (vmbus_prep_negotiate_resp(icmsghdrp
,
371 fw_versions
, FW_VER_COUNT
,
372 hb_versions
, HB_VER_COUNT
,
373 NULL
, &hb_srv_version
)) {
375 pr_info("Heartbeat IC version %d.%d\n",
376 hb_srv_version
>> 16,
377 hb_srv_version
& 0xFFFF);
381 (struct heartbeat_msg_data
*)&hbeat_txf_buf
[
382 sizeof(struct vmbuspipe_hdr
) +
383 sizeof(struct icmsg_hdr
)];
385 heartbeat_msg
->seq_num
+= 1;
388 icmsghdrp
->icflags
= ICMSGHDRFLAG_TRANSACTION
389 | ICMSGHDRFLAG_RESPONSE
;
391 vmbus_sendpacket(channel
, hbeat_txf_buf
,
393 VM_PKT_DATA_INBAND
, 0);
397 static int util_probe(struct hv_device
*dev
,
398 const struct hv_vmbus_device_id
*dev_id
)
400 struct hv_util_service
*srv
=
401 (struct hv_util_service
*)dev_id
->driver_data
;
404 srv
->recv_buffer
= kmalloc(PAGE_SIZE
* 4, GFP_KERNEL
);
405 if (!srv
->recv_buffer
)
407 srv
->channel
= dev
->channel
;
408 if (srv
->util_init
) {
409 ret
= srv
->util_init(srv
);
417 * The set of services managed by the util driver are not performance
418 * critical and do not need batched reading. Furthermore, some services
419 * such as KVP can only handle one message from the host at a time.
420 * Turn off batched reading for all util drivers before we open the
423 set_channel_read_mode(dev
->channel
, HV_CALL_DIRECT
);
425 hv_set_drvdata(dev
, srv
);
427 ret
= vmbus_open(dev
->channel
, 4 * PAGE_SIZE
, 4 * PAGE_SIZE
, NULL
, 0,
428 srv
->util_cb
, dev
->channel
);
435 if (srv
->util_deinit
)
438 kfree(srv
->recv_buffer
);
442 static int util_remove(struct hv_device
*dev
)
444 struct hv_util_service
*srv
= hv_get_drvdata(dev
);
446 if (srv
->util_deinit
)
448 vmbus_close(dev
->channel
);
449 kfree(srv
->recv_buffer
);
454 static const struct hv_vmbus_device_id id_table
[] = {
457 .driver_data
= (unsigned long)&util_shutdown
459 /* Time synch guid */
461 .driver_data
= (unsigned long)&util_timesynch
464 { HV_HEART_BEAT_GUID
,
465 .driver_data
= (unsigned long)&util_heartbeat
469 .driver_data
= (unsigned long)&util_kvp
473 .driver_data
= (unsigned long)&util_vss
477 .driver_data
= (unsigned long)&util_fcopy
482 MODULE_DEVICE_TABLE(vmbus
, id_table
);
484 /* The one and only one */
485 static struct hv_driver util_drv
= {
487 .id_table
= id_table
,
489 .remove
= util_remove
,
491 .probe_type
= PROBE_PREFER_ASYNCHRONOUS
,
495 static int hv_ptp_enable(struct ptp_clock_info
*info
,
496 struct ptp_clock_request
*request
, int on
)
501 static int hv_ptp_settime(struct ptp_clock_info
*p
, const struct timespec64
*ts
)
506 static int hv_ptp_adjfreq(struct ptp_clock_info
*ptp
, s32 delta
)
510 static int hv_ptp_adjtime(struct ptp_clock_info
*ptp
, s64 delta
)
515 static int hv_ptp_gettime(struct ptp_clock_info
*info
, struct timespec64
*ts
)
517 *ts
= hv_get_adj_host_time();
522 static struct ptp_clock_info ptp_hyperv_info
= {
524 .enable
= hv_ptp_enable
,
525 .adjtime
= hv_ptp_adjtime
,
526 .adjfreq
= hv_ptp_adjfreq
,
527 .gettime64
= hv_ptp_gettime
,
528 .settime64
= hv_ptp_settime
,
529 .owner
= THIS_MODULE
,
532 static struct ptp_clock
*hv_ptp_clock
;
534 static int hv_timesync_init(struct hv_util_service
*srv
)
536 /* TimeSync requires Hyper-V clocksource. */
540 spin_lock_init(&host_ts
.lock
);
542 INIT_WORK(&adj_time_work
, hv_set_host_time
);
545 * ptp_clock_register() returns NULL when CONFIG_PTP_1588_CLOCK is
546 * disabled but the driver is still useful without the PTP device
547 * as it still handles the ICTIMESYNCFLAG_SYNC case.
549 hv_ptp_clock
= ptp_clock_register(&ptp_hyperv_info
, NULL
);
550 if (IS_ERR_OR_NULL(hv_ptp_clock
)) {
551 pr_err("cannot register PTP clock: %ld\n",
552 PTR_ERR(hv_ptp_clock
));
559 static void hv_timesync_deinit(void)
562 ptp_clock_unregister(hv_ptp_clock
);
563 cancel_work_sync(&adj_time_work
);
566 static int __init
init_hyperv_utils(void)
568 pr_info("Registering HyperV Utility Driver\n");
570 return vmbus_driver_register(&util_drv
);
573 static void exit_hyperv_utils(void)
575 pr_info("De-Registered HyperV Utility Driver\n");
577 vmbus_driver_unregister(&util_drv
);
580 module_init(init_hyperv_utils
);
581 module_exit(exit_hyperv_utils
);
583 MODULE_DESCRIPTION("Hyper-V Utilities");
584 MODULE_LICENSE("GPL");