Linux kernel mirror (for testing)
git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel
os
linux
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Copyright (c) 2010, Microsoft Corporation.
4 *
5 * Authors:
6 * Haiyang Zhang <haiyangz@microsoft.com>
7 * Hank Janssen <hjanssen@microsoft.com>
8 */
9#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
10
11#include <linux/kernel.h>
12#include <linux/init.h>
13#include <linux/module.h>
14#include <linux/slab.h>
15#include <linux/sysctl.h>
16#include <linux/reboot.h>
17#include <linux/hyperv.h>
18#include <linux/clockchips.h>
19#include <linux/ptp_clock_kernel.h>
20#include <clocksource/hyperv_timer.h>
21#include <asm/mshyperv.h>
22
23#include "hyperv_vmbus.h"
24
25#define SD_MAJOR 3
26#define SD_MINOR 0
27#define SD_MINOR_1 1
28#define SD_MINOR_2 2
29#define SD_VERSION_3_1 (SD_MAJOR << 16 | SD_MINOR_1)
30#define SD_VERSION_3_2 (SD_MAJOR << 16 | SD_MINOR_2)
31#define SD_VERSION (SD_MAJOR << 16 | SD_MINOR)
32
33#define SD_MAJOR_1 1
34#define SD_VERSION_1 (SD_MAJOR_1 << 16 | SD_MINOR)
35
36#define TS_MAJOR 4
37#define TS_MINOR 0
38#define TS_VERSION (TS_MAJOR << 16 | TS_MINOR)
39
40#define TS_MAJOR_1 1
41#define TS_VERSION_1 (TS_MAJOR_1 << 16 | TS_MINOR)
42
43#define TS_MAJOR_3 3
44#define TS_VERSION_3 (TS_MAJOR_3 << 16 | TS_MINOR)
45
46#define HB_MAJOR 3
47#define HB_MINOR 0
48#define HB_VERSION (HB_MAJOR << 16 | HB_MINOR)
49
50#define HB_MAJOR_1 1
51#define HB_VERSION_1 (HB_MAJOR_1 << 16 | HB_MINOR)
52
53static int sd_srv_version;
54static int ts_srv_version;
55static int hb_srv_version;
56
57#define SD_VER_COUNT 4
58static const int sd_versions[] = {
59 SD_VERSION_3_2,
60 SD_VERSION_3_1,
61 SD_VERSION,
62 SD_VERSION_1
63};
64
65#define TS_VER_COUNT 3
66static const int ts_versions[] = {
67 TS_VERSION,
68 TS_VERSION_3,
69 TS_VERSION_1
70};
71
72#define HB_VER_COUNT 2
73static const int hb_versions[] = {
74 HB_VERSION,
75 HB_VERSION_1
76};
77
78#define FW_VER_COUNT 2
79static const int fw_versions[] = {
80 UTIL_FW_VERSION,
81 UTIL_WS2K8_FW_VERSION
82};
83
84/*
85 * Send the "hibernate" udev event in a thread context.
86 */
87struct hibernate_work_context {
88 struct work_struct work;
89 struct hv_device *dev;
90};
91
92static struct hibernate_work_context hibernate_context;
93static bool hibernation_supported;
94
95static void send_hibernate_uevent(struct work_struct *work)
96{
97 char *uevent_env[2] = { "EVENT=hibernate", NULL };
98 struct hibernate_work_context *ctx;
99
100 ctx = container_of(work, struct hibernate_work_context, work);
101
102 kobject_uevent_env(&ctx->dev->device.kobj, KOBJ_CHANGE, uevent_env);
103
104 pr_info("Sent hibernation uevent\n");
105}
106
107static int hv_shutdown_init(struct hv_util_service *srv)
108{
109 struct vmbus_channel *channel = srv->channel;
110
111 INIT_WORK(&hibernate_context.work, send_hibernate_uevent);
112 hibernate_context.dev = channel->device_obj;
113
114 hibernation_supported = hv_is_hibernation_supported();
115
116 return 0;
117}
118
119static void shutdown_onchannelcallback(void *context);
120static struct hv_util_service util_shutdown = {
121 .util_cb = shutdown_onchannelcallback,
122 .util_init = hv_shutdown_init,
123};
124
125static int hv_timesync_init(struct hv_util_service *srv);
126static int hv_timesync_pre_suspend(void);
127static void hv_timesync_deinit(void);
128
129static void timesync_onchannelcallback(void *context);
130static struct hv_util_service util_timesynch = {
131 .util_cb = timesync_onchannelcallback,
132 .util_init = hv_timesync_init,
133 .util_pre_suspend = hv_timesync_pre_suspend,
134 .util_deinit = hv_timesync_deinit,
135};
136
137static void heartbeat_onchannelcallback(void *context);
138static struct hv_util_service util_heartbeat = {
139 .util_cb = heartbeat_onchannelcallback,
140};
141
142static struct hv_util_service util_kvp = {
143 .util_cb = hv_kvp_onchannelcallback,
144 .util_init = hv_kvp_init,
145 .util_pre_suspend = hv_kvp_pre_suspend,
146 .util_pre_resume = hv_kvp_pre_resume,
147 .util_deinit = hv_kvp_deinit,
148};
149
150static struct hv_util_service util_vss = {
151 .util_cb = hv_vss_onchannelcallback,
152 .util_init = hv_vss_init,
153 .util_pre_suspend = hv_vss_pre_suspend,
154 .util_pre_resume = hv_vss_pre_resume,
155 .util_deinit = hv_vss_deinit,
156};
157
158static struct hv_util_service util_fcopy = {
159 .util_cb = hv_fcopy_onchannelcallback,
160 .util_init = hv_fcopy_init,
161 .util_pre_suspend = hv_fcopy_pre_suspend,
162 .util_pre_resume = hv_fcopy_pre_resume,
163 .util_deinit = hv_fcopy_deinit,
164};
165
166static void perform_shutdown(struct work_struct *dummy)
167{
168 orderly_poweroff(true);
169}
170
171static void perform_restart(struct work_struct *dummy)
172{
173 orderly_reboot();
174}
175
176/*
177 * Perform the shutdown operation in a thread context.
178 */
179static DECLARE_WORK(shutdown_work, perform_shutdown);
180
181/*
182 * Perform the restart operation in a thread context.
183 */
184static DECLARE_WORK(restart_work, perform_restart);
185
186static void shutdown_onchannelcallback(void *context)
187{
188 struct vmbus_channel *channel = context;
189 struct work_struct *work = NULL;
190 u32 recvlen;
191 u64 requestid;
192 u8 *shut_txf_buf = util_shutdown.recv_buffer;
193
194 struct shutdown_msg_data *shutdown_msg;
195
196 struct icmsg_hdr *icmsghdrp;
197
198 vmbus_recvpacket(channel, shut_txf_buf,
199 HV_HYP_PAGE_SIZE, &recvlen, &requestid);
200
201 if (recvlen > 0) {
202 icmsghdrp = (struct icmsg_hdr *)&shut_txf_buf[
203 sizeof(struct vmbuspipe_hdr)];
204
205 if (icmsghdrp->icmsgtype == ICMSGTYPE_NEGOTIATE) {
206 if (vmbus_prep_negotiate_resp(icmsghdrp, shut_txf_buf,
207 fw_versions, FW_VER_COUNT,
208 sd_versions, SD_VER_COUNT,
209 NULL, &sd_srv_version)) {
210 pr_info("Shutdown IC version %d.%d\n",
211 sd_srv_version >> 16,
212 sd_srv_version & 0xFFFF);
213 }
214 } else {
215 shutdown_msg =
216 (struct shutdown_msg_data *)&shut_txf_buf[
217 sizeof(struct vmbuspipe_hdr) +
218 sizeof(struct icmsg_hdr)];
219
220 /*
221 * shutdown_msg->flags can be 0(shut down), 2(reboot),
222 * or 4(hibernate). It may bitwise-OR 1, which means
223 * performing the request by force. Linux always tries
224 * to perform the request by force.
225 */
226 switch (shutdown_msg->flags) {
227 case 0:
228 case 1:
229 icmsghdrp->status = HV_S_OK;
230 work = &shutdown_work;
231 pr_info("Shutdown request received -"
232 " graceful shutdown initiated\n");
233 break;
234 case 2:
235 case 3:
236 icmsghdrp->status = HV_S_OK;
237 work = &restart_work;
238 pr_info("Restart request received -"
239 " graceful restart initiated\n");
240 break;
241 case 4:
242 case 5:
243 pr_info("Hibernation request received\n");
244 icmsghdrp->status = hibernation_supported ?
245 HV_S_OK : HV_E_FAIL;
246 if (hibernation_supported)
247 work = &hibernate_context.work;
248 break;
249 default:
250 icmsghdrp->status = HV_E_FAIL;
251 pr_info("Shutdown request received -"
252 " Invalid request\n");
253 break;
254 }
255 }
256
257 icmsghdrp->icflags = ICMSGHDRFLAG_TRANSACTION
258 | ICMSGHDRFLAG_RESPONSE;
259
260 vmbus_sendpacket(channel, shut_txf_buf,
261 recvlen, requestid,
262 VM_PKT_DATA_INBAND, 0);
263 }
264
265 if (work)
266 schedule_work(work);
267}
268
269/*
270 * Set the host time in a process context.
271 */
272static struct work_struct adj_time_work;
273
274/*
275 * The last time sample, received from the host. PTP device responds to
276 * requests by using this data and the current partition-wide time reference
277 * count.
278 */
279static struct {
280 u64 host_time;
281 u64 ref_time;
282 spinlock_t lock;
283} host_ts;
284
285static struct timespec64 hv_get_adj_host_time(void)
286{
287 struct timespec64 ts;
288 u64 newtime, reftime;
289 unsigned long flags;
290
291 spin_lock_irqsave(&host_ts.lock, flags);
292 reftime = hv_read_reference_counter();
293 newtime = host_ts.host_time + (reftime - host_ts.ref_time);
294 ts = ns_to_timespec64((newtime - WLTIMEDELTA) * 100);
295 spin_unlock_irqrestore(&host_ts.lock, flags);
296
297 return ts;
298}
299
300static void hv_set_host_time(struct work_struct *work)
301{
302 struct timespec64 ts = hv_get_adj_host_time();
303
304 do_settimeofday64(&ts);
305}
306
307/*
308 * Synchronize time with host after reboot, restore, etc.
309 *
310 * ICTIMESYNCFLAG_SYNC flag bit indicates reboot, restore events of the VM.
311 * After reboot the flag ICTIMESYNCFLAG_SYNC is included in the first time
312 * message after the timesync channel is opened. Since the hv_utils module is
313 * loaded after hv_vmbus, the first message is usually missed. This bit is
314 * considered a hard request to discipline the clock.
315 *
316 * ICTIMESYNCFLAG_SAMPLE bit indicates a time sample from host. This is
317 * typically used as a hint to the guest. The guest is under no obligation
318 * to discipline the clock.
319 */
320static inline void adj_guesttime(u64 hosttime, u64 reftime, u8 adj_flags)
321{
322 unsigned long flags;
323 u64 cur_reftime;
324
325 /*
326 * Save the adjusted time sample from the host and the snapshot
327 * of the current system time.
328 */
329 spin_lock_irqsave(&host_ts.lock, flags);
330
331 cur_reftime = hv_read_reference_counter();
332 host_ts.host_time = hosttime;
333 host_ts.ref_time = cur_reftime;
334
335 /*
336 * TimeSync v4 messages contain reference time (guest's Hyper-V
337 * clocksource read when the time sample was generated), we can
338 * improve the precision by adding the delta between now and the
339 * time of generation. For older protocols we set
340 * reftime == cur_reftime on call.
341 */
342 host_ts.host_time += (cur_reftime - reftime);
343
344 spin_unlock_irqrestore(&host_ts.lock, flags);
345
346 /* Schedule work to do do_settimeofday64() */
347 if (adj_flags & ICTIMESYNCFLAG_SYNC)
348 schedule_work(&adj_time_work);
349}
350
351/*
352 * Time Sync Channel message handler.
353 */
354static void timesync_onchannelcallback(void *context)
355{
356 struct vmbus_channel *channel = context;
357 u32 recvlen;
358 u64 requestid;
359 struct icmsg_hdr *icmsghdrp;
360 struct ictimesync_data *timedatap;
361 struct ictimesync_ref_data *refdata;
362 u8 *time_txf_buf = util_timesynch.recv_buffer;
363
364 vmbus_recvpacket(channel, time_txf_buf,
365 HV_HYP_PAGE_SIZE, &recvlen, &requestid);
366
367 if (recvlen > 0) {
368 icmsghdrp = (struct icmsg_hdr *)&time_txf_buf[
369 sizeof(struct vmbuspipe_hdr)];
370
371 if (icmsghdrp->icmsgtype == ICMSGTYPE_NEGOTIATE) {
372 if (vmbus_prep_negotiate_resp(icmsghdrp, time_txf_buf,
373 fw_versions, FW_VER_COUNT,
374 ts_versions, TS_VER_COUNT,
375 NULL, &ts_srv_version)) {
376 pr_info("TimeSync IC version %d.%d\n",
377 ts_srv_version >> 16,
378 ts_srv_version & 0xFFFF);
379 }
380 } else {
381 if (ts_srv_version > TS_VERSION_3) {
382 refdata = (struct ictimesync_ref_data *)
383 &time_txf_buf[
384 sizeof(struct vmbuspipe_hdr) +
385 sizeof(struct icmsg_hdr)];
386
387 adj_guesttime(refdata->parenttime,
388 refdata->vmreferencetime,
389 refdata->flags);
390 } else {
391 timedatap = (struct ictimesync_data *)
392 &time_txf_buf[
393 sizeof(struct vmbuspipe_hdr) +
394 sizeof(struct icmsg_hdr)];
395 adj_guesttime(timedatap->parenttime,
396 hv_read_reference_counter(),
397 timedatap->flags);
398 }
399 }
400
401 icmsghdrp->icflags = ICMSGHDRFLAG_TRANSACTION
402 | ICMSGHDRFLAG_RESPONSE;
403
404 vmbus_sendpacket(channel, time_txf_buf,
405 recvlen, requestid,
406 VM_PKT_DATA_INBAND, 0);
407 }
408}
409
410/*
411 * Heartbeat functionality.
412 * Every two seconds, Hyper-V send us a heartbeat request message.
413 * we respond to this message, and Hyper-V knows we are alive.
414 */
415static void heartbeat_onchannelcallback(void *context)
416{
417 struct vmbus_channel *channel = context;
418 u32 recvlen;
419 u64 requestid;
420 struct icmsg_hdr *icmsghdrp;
421 struct heartbeat_msg_data *heartbeat_msg;
422 u8 *hbeat_txf_buf = util_heartbeat.recv_buffer;
423
424 while (1) {
425
426 vmbus_recvpacket(channel, hbeat_txf_buf,
427 HV_HYP_PAGE_SIZE, &recvlen, &requestid);
428
429 if (!recvlen)
430 break;
431
432 icmsghdrp = (struct icmsg_hdr *)&hbeat_txf_buf[
433 sizeof(struct vmbuspipe_hdr)];
434
435 if (icmsghdrp->icmsgtype == ICMSGTYPE_NEGOTIATE) {
436 if (vmbus_prep_negotiate_resp(icmsghdrp,
437 hbeat_txf_buf,
438 fw_versions, FW_VER_COUNT,
439 hb_versions, HB_VER_COUNT,
440 NULL, &hb_srv_version)) {
441
442 pr_info("Heartbeat IC version %d.%d\n",
443 hb_srv_version >> 16,
444 hb_srv_version & 0xFFFF);
445 }
446 } else {
447 heartbeat_msg =
448 (struct heartbeat_msg_data *)&hbeat_txf_buf[
449 sizeof(struct vmbuspipe_hdr) +
450 sizeof(struct icmsg_hdr)];
451
452 heartbeat_msg->seq_num += 1;
453 }
454
455 icmsghdrp->icflags = ICMSGHDRFLAG_TRANSACTION
456 | ICMSGHDRFLAG_RESPONSE;
457
458 vmbus_sendpacket(channel, hbeat_txf_buf,
459 recvlen, requestid,
460 VM_PKT_DATA_INBAND, 0);
461 }
462}
463
464static int util_probe(struct hv_device *dev,
465 const struct hv_vmbus_device_id *dev_id)
466{
467 struct hv_util_service *srv =
468 (struct hv_util_service *)dev_id->driver_data;
469 int ret;
470
471 srv->recv_buffer = kmalloc(HV_HYP_PAGE_SIZE * 4, GFP_KERNEL);
472 if (!srv->recv_buffer)
473 return -ENOMEM;
474 srv->channel = dev->channel;
475 if (srv->util_init) {
476 ret = srv->util_init(srv);
477 if (ret) {
478 ret = -ENODEV;
479 goto error1;
480 }
481 }
482
483 /*
484 * The set of services managed by the util driver are not performance
485 * critical and do not need batched reading. Furthermore, some services
486 * such as KVP can only handle one message from the host at a time.
487 * Turn off batched reading for all util drivers before we open the
488 * channel.
489 */
490 set_channel_read_mode(dev->channel, HV_CALL_DIRECT);
491
492 hv_set_drvdata(dev, srv);
493
494 ret = vmbus_open(dev->channel, 4 * HV_HYP_PAGE_SIZE,
495 4 * HV_HYP_PAGE_SIZE, NULL, 0, srv->util_cb,
496 dev->channel);
497 if (ret)
498 goto error;
499
500 return 0;
501
502error:
503 if (srv->util_deinit)
504 srv->util_deinit();
505error1:
506 kfree(srv->recv_buffer);
507 return ret;
508}
509
510static int util_remove(struct hv_device *dev)
511{
512 struct hv_util_service *srv = hv_get_drvdata(dev);
513
514 if (srv->util_deinit)
515 srv->util_deinit();
516 vmbus_close(dev->channel);
517 kfree(srv->recv_buffer);
518
519 return 0;
520}
521
522/*
523 * When we're in util_suspend(), all the userspace processes have been frozen
524 * (refer to hibernate() -> freeze_processes()). The userspace is thawed only
525 * after the whole resume procedure, including util_resume(), finishes.
526 */
527static int util_suspend(struct hv_device *dev)
528{
529 struct hv_util_service *srv = hv_get_drvdata(dev);
530 int ret = 0;
531
532 if (srv->util_pre_suspend) {
533 ret = srv->util_pre_suspend();
534 if (ret)
535 return ret;
536 }
537
538 vmbus_close(dev->channel);
539
540 return 0;
541}
542
543static int util_resume(struct hv_device *dev)
544{
545 struct hv_util_service *srv = hv_get_drvdata(dev);
546 int ret = 0;
547
548 if (srv->util_pre_resume) {
549 ret = srv->util_pre_resume();
550 if (ret)
551 return ret;
552 }
553
554 ret = vmbus_open(dev->channel, 4 * HV_HYP_PAGE_SIZE,
555 4 * HV_HYP_PAGE_SIZE, NULL, 0, srv->util_cb,
556 dev->channel);
557 return ret;
558}
559
560static const struct hv_vmbus_device_id id_table[] = {
561 /* Shutdown guid */
562 { HV_SHUTDOWN_GUID,
563 .driver_data = (unsigned long)&util_shutdown
564 },
565 /* Time synch guid */
566 { HV_TS_GUID,
567 .driver_data = (unsigned long)&util_timesynch
568 },
569 /* Heartbeat guid */
570 { HV_HEART_BEAT_GUID,
571 .driver_data = (unsigned long)&util_heartbeat
572 },
573 /* KVP guid */
574 { HV_KVP_GUID,
575 .driver_data = (unsigned long)&util_kvp
576 },
577 /* VSS GUID */
578 { HV_VSS_GUID,
579 .driver_data = (unsigned long)&util_vss
580 },
581 /* File copy GUID */
582 { HV_FCOPY_GUID,
583 .driver_data = (unsigned long)&util_fcopy
584 },
585 { },
586};
587
588MODULE_DEVICE_TABLE(vmbus, id_table);
589
590/* The one and only one */
591static struct hv_driver util_drv = {
592 .name = "hv_utils",
593 .id_table = id_table,
594 .probe = util_probe,
595 .remove = util_remove,
596 .suspend = util_suspend,
597 .resume = util_resume,
598 .driver = {
599 .probe_type = PROBE_PREFER_ASYNCHRONOUS,
600 },
601};
602
603static int hv_ptp_enable(struct ptp_clock_info *info,
604 struct ptp_clock_request *request, int on)
605{
606 return -EOPNOTSUPP;
607}
608
609static int hv_ptp_settime(struct ptp_clock_info *p, const struct timespec64 *ts)
610{
611 return -EOPNOTSUPP;
612}
613
614static int hv_ptp_adjfreq(struct ptp_clock_info *ptp, s32 delta)
615{
616 return -EOPNOTSUPP;
617}
618static int hv_ptp_adjtime(struct ptp_clock_info *ptp, s64 delta)
619{
620 return -EOPNOTSUPP;
621}
622
623static int hv_ptp_gettime(struct ptp_clock_info *info, struct timespec64 *ts)
624{
625 *ts = hv_get_adj_host_time();
626
627 return 0;
628}
629
630static struct ptp_clock_info ptp_hyperv_info = {
631 .name = "hyperv",
632 .enable = hv_ptp_enable,
633 .adjtime = hv_ptp_adjtime,
634 .adjfreq = hv_ptp_adjfreq,
635 .gettime64 = hv_ptp_gettime,
636 .settime64 = hv_ptp_settime,
637 .owner = THIS_MODULE,
638};
639
640static struct ptp_clock *hv_ptp_clock;
641
642static int hv_timesync_init(struct hv_util_service *srv)
643{
644 /* TimeSync requires Hyper-V clocksource. */
645 if (!hv_read_reference_counter)
646 return -ENODEV;
647
648 spin_lock_init(&host_ts.lock);
649
650 INIT_WORK(&adj_time_work, hv_set_host_time);
651
652 /*
653 * ptp_clock_register() returns NULL when CONFIG_PTP_1588_CLOCK is
654 * disabled but the driver is still useful without the PTP device
655 * as it still handles the ICTIMESYNCFLAG_SYNC case.
656 */
657 hv_ptp_clock = ptp_clock_register(&ptp_hyperv_info, NULL);
658 if (IS_ERR_OR_NULL(hv_ptp_clock)) {
659 pr_err("cannot register PTP clock: %ld\n",
660 PTR_ERR(hv_ptp_clock));
661 hv_ptp_clock = NULL;
662 }
663
664 return 0;
665}
666
667static void hv_timesync_cancel_work(void)
668{
669 cancel_work_sync(&adj_time_work);
670}
671
672static int hv_timesync_pre_suspend(void)
673{
674 hv_timesync_cancel_work();
675 return 0;
676}
677
678static void hv_timesync_deinit(void)
679{
680 if (hv_ptp_clock)
681 ptp_clock_unregister(hv_ptp_clock);
682
683 hv_timesync_cancel_work();
684}
685
686static int __init init_hyperv_utils(void)
687{
688 pr_info("Registering HyperV Utility Driver\n");
689
690 return vmbus_driver_register(&util_drv);
691}
692
693static void exit_hyperv_utils(void)
694{
695 pr_info("De-Registered HyperV Utility Driver\n");
696
697 vmbus_driver_unregister(&util_drv);
698}
699
700module_init(init_hyperv_utils);
701module_exit(exit_hyperv_utils);
702
703MODULE_DESCRIPTION("Hyper-V Utilities");
704MODULE_LICENSE("GPL");