at v6.17 383 lines 11 kB view raw
1/* SPDX-License-Identifier: GPL-2.0 */ 2 3/* 4 * Linux-specific definitions for managing interactions with Microsoft's 5 * Hyper-V hypervisor. The definitions in this file are architecture 6 * independent. See arch/<arch>/include/asm/mshyperv.h for definitions 7 * that are specific to architecture <arch>. 8 * 9 * Definitions that are derived from Hyper-V code or headers should not go in 10 * this file, but should instead go in the relevant files in include/hyperv. 11 * 12 * Copyright (C) 2019, Microsoft, Inc. 13 * 14 * Author : Michael Kelley <mikelley@microsoft.com> 15 */ 16 17#ifndef _ASM_GENERIC_MSHYPERV_H 18#define _ASM_GENERIC_MSHYPERV_H 19 20#include <linux/types.h> 21#include <linux/atomic.h> 22#include <linux/bitops.h> 23#include <acpi/acpi_numa.h> 24#include <linux/cpumask.h> 25#include <linux/nmi.h> 26#include <asm/ptrace.h> 27#include <hyperv/hvhdk.h> 28 29#define VTPM_BASE_ADDRESS 0xfed40000 30 31enum hv_partition_type { 32 HV_PARTITION_TYPE_GUEST, 33 HV_PARTITION_TYPE_ROOT, 34}; 35 36struct ms_hyperv_info { 37 u32 features; 38 u32 priv_high; 39 u32 ext_features; 40 u32 misc_features; 41 u32 hints; 42 u32 nested_features; 43 u32 max_vp_index; 44 u32 max_lp_index; 45 u8 vtl; 46 union { 47 u32 isolation_config_a; 48 struct { 49 u32 paravisor_present : 1; 50 u32 reserved_a1 : 31; 51 }; 52 }; 53 union { 54 u32 isolation_config_b; 55 struct { 56 u32 cvm_type : 4; 57 u32 reserved_b1 : 1; 58 u32 shared_gpa_boundary_active : 1; 59 u32 shared_gpa_boundary_bits : 6; 60 u32 reserved_b2 : 20; 61 }; 62 }; 63 u64 shared_gpa_boundary; 64}; 65extern struct ms_hyperv_info ms_hyperv; 66extern bool hv_nested; 67extern u64 hv_current_partition_id; 68extern enum hv_partition_type hv_curr_partition_type; 69 70extern void * __percpu *hyperv_pcpu_input_arg; 71extern void * __percpu *hyperv_pcpu_output_arg; 72 73u64 hv_do_hypercall(u64 control, void *inputaddr, void *outputaddr); 74u64 hv_do_fast_hypercall8(u16 control, u64 input8); 75u64 hv_do_fast_hypercall16(u16 control, u64 input1, u64 input2); 76 77bool hv_isolation_type_snp(void); 78bool hv_isolation_type_tdx(void); 79 80/* 81 * On architectures where Hyper-V doesn't support AEOI (e.g., ARM64), 82 * it doesn't provide a recommendation flag and AEOI must be disabled. 83 */ 84static inline bool hv_recommend_using_aeoi(void) 85{ 86#ifdef HV_DEPRECATING_AEOI_RECOMMENDED 87 return !(ms_hyperv.hints & HV_DEPRECATING_AEOI_RECOMMENDED); 88#else 89 return false; 90#endif 91} 92 93static inline struct hv_proximity_domain_info hv_numa_node_to_pxm_info(int node) 94{ 95 struct hv_proximity_domain_info pxm_info = {}; 96 97 if (node != NUMA_NO_NODE) { 98 pxm_info.domain_id = node_to_pxm(node); 99 pxm_info.flags.proximity_info_valid = 1; 100 pxm_info.flags.proximity_preferred = 1; 101 } 102 103 return pxm_info; 104} 105 106/* Helper functions that provide a consistent pattern for checking Hyper-V hypercall status. */ 107static inline int hv_result(u64 status) 108{ 109 return status & HV_HYPERCALL_RESULT_MASK; 110} 111 112static inline bool hv_result_success(u64 status) 113{ 114 return hv_result(status) == HV_STATUS_SUCCESS; 115} 116 117static inline unsigned int hv_repcomp(u64 status) 118{ 119 /* Bits [43:32] of status have 'Reps completed' data. */ 120 return (status & HV_HYPERCALL_REP_COMP_MASK) >> 121 HV_HYPERCALL_REP_COMP_OFFSET; 122} 123 124/* 125 * Rep hypercalls. Callers of this functions are supposed to ensure that 126 * rep_count and varhead_size comply with Hyper-V hypercall definition. 127 */ 128static inline u64 hv_do_rep_hypercall(u16 code, u16 rep_count, u16 varhead_size, 129 void *input, void *output) 130{ 131 u64 control = code; 132 u64 status; 133 u16 rep_comp; 134 135 control |= (u64)varhead_size << HV_HYPERCALL_VARHEAD_OFFSET; 136 control |= (u64)rep_count << HV_HYPERCALL_REP_COMP_OFFSET; 137 138 do { 139 status = hv_do_hypercall(control, input, output); 140 if (!hv_result_success(status)) 141 return status; 142 143 rep_comp = hv_repcomp(status); 144 145 control &= ~HV_HYPERCALL_REP_START_MASK; 146 control |= (u64)rep_comp << HV_HYPERCALL_REP_START_OFFSET; 147 148 touch_nmi_watchdog(); 149 } while (rep_comp < rep_count); 150 151 return status; 152} 153 154/* Generate the guest OS identifier as described in the Hyper-V TLFS */ 155static inline u64 hv_generate_guest_id(u64 kernel_version) 156{ 157 u64 guest_id; 158 159 guest_id = (((u64)HV_LINUX_VENDOR_ID) << 48); 160 guest_id |= (kernel_version << 16); 161 162 return guest_id; 163} 164 165/* Free the message slot and signal end-of-message if required */ 166static inline void vmbus_signal_eom(struct hv_message *msg, u32 old_msg_type) 167{ 168 /* 169 * On crash we're reading some other CPU's message page and we need 170 * to be careful: this other CPU may already had cleared the header 171 * and the host may already had delivered some other message there. 172 * In case we blindly write msg->header.message_type we're going 173 * to lose it. We can still lose a message of the same type but 174 * we count on the fact that there can only be one 175 * CHANNELMSG_UNLOAD_RESPONSE and we don't care about other messages 176 * on crash. 177 */ 178 if (cmpxchg(&msg->header.message_type, old_msg_type, 179 HVMSG_NONE) != old_msg_type) 180 return; 181 182 /* 183 * The cmxchg() above does an implicit memory barrier to 184 * ensure the write to MessageType (ie set to 185 * HVMSG_NONE) happens before we read the 186 * MessagePending and EOMing. Otherwise, the EOMing 187 * will not deliver any more messages since there is 188 * no empty slot 189 */ 190 if (msg->header.message_flags.msg_pending) { 191 /* 192 * This will cause message queue rescan to 193 * possibly deliver another msg from the 194 * hypervisor 195 */ 196 hv_set_msr(HV_MSR_EOM, 0); 197 } 198} 199 200int hv_get_hypervisor_version(union hv_hypervisor_version_info *info); 201 202void hv_setup_vmbus_handler(void (*handler)(void)); 203void hv_remove_vmbus_handler(void); 204void hv_setup_stimer0_handler(void (*handler)(void)); 205void hv_remove_stimer0_handler(void); 206 207void hv_setup_kexec_handler(void (*handler)(void)); 208void hv_remove_kexec_handler(void); 209void hv_setup_crash_handler(void (*handler)(struct pt_regs *regs)); 210void hv_remove_crash_handler(void); 211void hv_setup_mshv_handler(void (*handler)(void)); 212 213extern int vmbus_interrupt; 214extern int vmbus_irq; 215 216#if IS_ENABLED(CONFIG_HYPERV) 217/* 218 * Hypervisor's notion of virtual processor ID is different from 219 * Linux' notion of CPU ID. This information can only be retrieved 220 * in the context of the calling CPU. Setup a map for easy access 221 * to this information. 222 */ 223extern u32 *hv_vp_index; 224extern u32 hv_max_vp_index; 225 226extern u64 (*hv_read_reference_counter)(void); 227 228/* Sentinel value for an uninitialized entry in hv_vp_index array */ 229#define VP_INVAL U32_MAX 230 231int __init hv_common_init(void); 232void __init hv_get_partition_id(void); 233void __init hv_common_free(void); 234void __init ms_hyperv_late_init(void); 235int hv_common_cpu_init(unsigned int cpu); 236int hv_common_cpu_die(unsigned int cpu); 237void hv_identify_partition_type(void); 238 239/** 240 * hv_cpu_number_to_vp_number() - Map CPU to VP. 241 * @cpu_number: CPU number in Linux terms 242 * 243 * This function returns the mapping between the Linux processor 244 * number and the hypervisor's virtual processor number, useful 245 * in making hypercalls and such that talk about specific 246 * processors. 247 * 248 * Return: Virtual processor number in Hyper-V terms 249 */ 250static inline int hv_cpu_number_to_vp_number(int cpu_number) 251{ 252 return hv_vp_index[cpu_number]; 253} 254 255static inline int __cpumask_to_vpset(struct hv_vpset *vpset, 256 const struct cpumask *cpus, 257 bool (*func)(int cpu)) 258{ 259 int cpu, vcpu, vcpu_bank, vcpu_offset, nr_bank = 1; 260 int max_vcpu_bank = hv_max_vp_index / HV_VCPUS_PER_SPARSE_BANK; 261 262 /* vpset.valid_bank_mask can represent up to HV_MAX_SPARSE_VCPU_BANKS banks */ 263 if (max_vcpu_bank >= HV_MAX_SPARSE_VCPU_BANKS) 264 return 0; 265 266 /* 267 * Clear all banks up to the maximum possible bank as hv_tlb_flush_ex 268 * structs are not cleared between calls, we risk flushing unneeded 269 * vCPUs otherwise. 270 */ 271 for (vcpu_bank = 0; vcpu_bank <= max_vcpu_bank; vcpu_bank++) 272 vpset->bank_contents[vcpu_bank] = 0; 273 274 /* 275 * Some banks may end up being empty but this is acceptable. 276 */ 277 for_each_cpu(cpu, cpus) { 278 if (func && func(cpu)) 279 continue; 280 vcpu = hv_cpu_number_to_vp_number(cpu); 281 if (vcpu == VP_INVAL) 282 return -1; 283 vcpu_bank = vcpu / HV_VCPUS_PER_SPARSE_BANK; 284 vcpu_offset = vcpu % HV_VCPUS_PER_SPARSE_BANK; 285 __set_bit(vcpu_offset, (unsigned long *) 286 &vpset->bank_contents[vcpu_bank]); 287 if (vcpu_bank >= nr_bank) 288 nr_bank = vcpu_bank + 1; 289 } 290 vpset->valid_bank_mask = GENMASK_ULL(nr_bank - 1, 0); 291 return nr_bank; 292} 293 294/* 295 * Convert a Linux cpumask into a Hyper-V VPset. In the _skip variant, 296 * 'func' is called for each CPU present in cpumask. If 'func' returns 297 * true, that CPU is skipped -- i.e., that CPU from cpumask is *not* 298 * added to the Hyper-V VPset. If 'func' is NULL, no CPUs are 299 * skipped. 300 */ 301static inline int cpumask_to_vpset(struct hv_vpset *vpset, 302 const struct cpumask *cpus) 303{ 304 return __cpumask_to_vpset(vpset, cpus, NULL); 305} 306 307static inline int cpumask_to_vpset_skip(struct hv_vpset *vpset, 308 const struct cpumask *cpus, 309 bool (*func)(int cpu)) 310{ 311 return __cpumask_to_vpset(vpset, cpus, func); 312} 313 314#define _hv_status_fmt(fmt) "%s: Hyper-V status: %#x = %s: " fmt 315#define hv_status_printk(level, status, fmt, ...) \ 316do { \ 317 u64 __status = (status); \ 318 pr_##level(_hv_status_fmt(fmt), __func__, hv_result(__status), \ 319 hv_result_to_string(__status), ##__VA_ARGS__); \ 320} while (0) 321#define hv_status_err(status, fmt, ...) \ 322 hv_status_printk(err, status, fmt, ##__VA_ARGS__) 323#define hv_status_debug(status, fmt, ...) \ 324 hv_status_printk(debug, status, fmt, ##__VA_ARGS__) 325 326const char *hv_result_to_string(u64 hv_status); 327int hv_result_to_errno(u64 status); 328void hyperv_report_panic(struct pt_regs *regs, long err, bool in_die); 329bool hv_is_hyperv_initialized(void); 330bool hv_is_hibernation_supported(void); 331enum hv_isolation_type hv_get_isolation_type(void); 332bool hv_is_isolation_supported(void); 333bool hv_isolation_type_snp(void); 334u64 hv_ghcb_hypercall(u64 control, void *input, void *output, u32 input_size); 335u64 hv_tdx_hypercall(u64 control, u64 param1, u64 param2); 336void hyperv_cleanup(void); 337bool hv_query_ext_cap(u64 cap_query); 338void hv_setup_dma_ops(struct device *dev, bool coherent); 339#else /* CONFIG_HYPERV */ 340static inline void hv_identify_partition_type(void) {} 341static inline bool hv_is_hyperv_initialized(void) { return false; } 342static inline bool hv_is_hibernation_supported(void) { return false; } 343static inline void hyperv_cleanup(void) {} 344static inline void ms_hyperv_late_init(void) {} 345static inline bool hv_is_isolation_supported(void) { return false; } 346static inline enum hv_isolation_type hv_get_isolation_type(void) 347{ 348 return HV_ISOLATION_TYPE_NONE; 349} 350#endif /* CONFIG_HYPERV */ 351 352#if IS_ENABLED(CONFIG_MSHV_ROOT) 353static inline bool hv_root_partition(void) 354{ 355 return hv_curr_partition_type == HV_PARTITION_TYPE_ROOT; 356} 357int hv_call_deposit_pages(int node, u64 partition_id, u32 num_pages); 358int hv_call_add_logical_proc(int node, u32 lp_index, u32 acpi_id); 359int hv_call_create_vp(int node, u64 partition_id, u32 vp_index, u32 flags); 360 361#else /* CONFIG_MSHV_ROOT */ 362static inline bool hv_root_partition(void) { return false; } 363static inline int hv_call_deposit_pages(int node, u64 partition_id, u32 num_pages) 364{ 365 return -EOPNOTSUPP; 366} 367static inline int hv_call_add_logical_proc(int node, u32 lp_index, u32 acpi_id) 368{ 369 return -EOPNOTSUPP; 370} 371static inline int hv_call_create_vp(int node, u64 partition_id, u32 vp_index, u32 flags) 372{ 373 return -EOPNOTSUPP; 374} 375#endif /* CONFIG_MSHV_ROOT */ 376 377#if IS_ENABLED(CONFIG_HYPERV_VTL_MODE) 378u8 __init get_vtl(void); 379#else 380static inline u8 get_vtl(void) { return 0; } 381#endif 382 383#endif