1 /* 2 * Copyright (c) 2009, Microsoft Corporation. 3 * 4 * This program is free software; you can redistribute it and/or modify it 5 * under the terms and conditions of the GNU General Public License, 6 * version 2, as published by the Free Software Foundation. 7 * 8 * This program is distributed in the hope it will be useful, but WITHOUT 9 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 10 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 11 * more details. 12 * 13 * You should have received a copy of the GNU General Public License along with 14 * this program; if not, write to the Free Software Foundation, Inc., 59 Temple 15 * Place - Suite 330, Boston, MA 02111-1307 USA. 16 * 17 * Authors: 18 * Haiyang Zhang <haiyangz@microsoft.com> 19 * Hank Janssen <hjanssen@microsoft.com> 20 * 21 */ 22 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 23 24 #include <linux/kernel.h> 25 #include <linux/mm.h> 26 #include <linux/slab.h> 27 #include <linux/vmalloc.h> 28 #include <linux/hyperv.h> 29 #include <asm/hyperv.h> 30 #include "hyperv_vmbus.h" 31 32 /* The one and only */ 33 struct hv_context hv_context = { 34 .synic_initialized = false, 35 .hypercall_page = NULL, 36 .signal_event_param = NULL, 37 .signal_event_buffer = NULL, 38 }; 39 40 /* 41 * query_hypervisor_presence 42 * - Query the cpuid for presence of windows hypervisor 43 */ 44 static int query_hypervisor_presence(void) 45 { 46 unsigned int eax; 47 unsigned int ebx; 48 unsigned int ecx; 49 unsigned int edx; 50 unsigned int op; 51 52 eax = 0; 53 ebx = 0; 54 ecx = 0; 55 edx = 0; 56 op = HVCPUID_VERSION_FEATURES; 57 cpuid(op, &eax, &ebx, &ecx, &edx); 58 59 return ecx & HV_PRESENT_BIT; 60 } 61 62 /* 63 * query_hypervisor_info - Get version info of the windows hypervisor 64 */ 65 static int query_hypervisor_info(void) 66 { 67 unsigned int eax; 68 unsigned int ebx; 69 unsigned int ecx; 70 unsigned int edx; 71 unsigned int max_leaf; 72 unsigned int op; 73 74 /* 75 * Its assumed that this is called after confirming that Viridian 76 * is present. Query id and revision. 77 */ 78 eax = 0; 79 ebx = 0; 80 ecx = 0; 81 edx = 0; 82 op = HVCPUID_VENDOR_MAXFUNCTION; 83 cpuid(op, &eax, &ebx, &ecx, &edx); 84 85 max_leaf = eax; 86 87 if (max_leaf >= HVCPUID_VERSION) { 88 eax = 0; 89 ebx = 0; 90 ecx = 0; 91 edx = 0; 92 op = HVCPUID_VERSION; 93 cpuid(op, &eax, &ebx, &ecx, &edx); 94 pr_info("Hyper-V Host OS Build:%d-%d.%d-%d-%d.%d\n", 95 eax, 96 ebx >> 16, 97 ebx & 0xFFFF, 98 ecx, 99 edx >> 24, 100 edx & 0xFFFFFF); 101 } 102 return max_leaf; 103 } 104 105 /* 106 * do_hypercall- Invoke the specified hypercall 107 */ 108 static u64 do_hypercall(u64 control, void *input, void *output) 109 { 110 #ifdef CONFIG_X86_64 111 u64 hv_status = 0; 112 u64 input_address = (input) ? virt_to_phys(input) : 0; 113 u64 output_address = (output) ? virt_to_phys(output) : 0; 114 void *hypercall_page = hv_context.hypercall_page; 115 116 __asm__ __volatile__("mov %0, %%r8" : : "r" (output_address) : "r8"); 117 __asm__ __volatile__("call *%3" : "=a" (hv_status) : 118 "c" (control), "d" (input_address), 119 "m" (hypercall_page)); 120 121 return hv_status; 122 123 #else 124 125 u32 control_hi = control >> 32; 126 u32 control_lo = control & 0xFFFFFFFF; 127 u32 hv_status_hi = 1; 128 u32 hv_status_lo = 1; 129 u64 input_address = (input) ? virt_to_phys(input) : 0; 130 u32 input_address_hi = input_address >> 32; 131 u32 input_address_lo = input_address & 0xFFFFFFFF; 132 u64 output_address = (output) ? virt_to_phys(output) : 0; 133 u32 output_address_hi = output_address >> 32; 134 u32 output_address_lo = output_address & 0xFFFFFFFF; 135 void *hypercall_page = hv_context.hypercall_page; 136 137 __asm__ __volatile__ ("call *%8" : "=d"(hv_status_hi), 138 "=a"(hv_status_lo) : "d" (control_hi), 139 "a" (control_lo), "b" (input_address_hi), 140 "c" (input_address_lo), "D"(output_address_hi), 141 "S"(output_address_lo), "m" (hypercall_page)); 142 143 return hv_status_lo | ((u64)hv_status_hi << 32); 144 #endif /* !x86_64 */ 145 } 146 147 /* 148 * hv_init - Main initialization routine. 149 * 150 * This routine must be called before any other routines in here are called 151 */ 152 int hv_init(void) 153 { 154 int max_leaf; 155 union hv_x64_msr_hypercall_contents hypercall_msr; 156 void *virtaddr = NULL; 157 158 memset(hv_context.synic_event_page, 0, sizeof(void *) * NR_CPUS); 159 memset(hv_context.synic_message_page, 0, 160 sizeof(void *) * NR_CPUS); 161 162 if (!query_hypervisor_presence()) 163 goto cleanup; 164 165 max_leaf = query_hypervisor_info(); 166 167 /* Write our OS info */ 168 wrmsrl(HV_X64_MSR_GUEST_OS_ID, HV_LINUX_GUEST_ID); 169 hv_context.guestid = HV_LINUX_GUEST_ID; 170 171 /* See if the hypercall page is already set */ 172 rdmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64); 173 174 virtaddr = __vmalloc(PAGE_SIZE, GFP_KERNEL, PAGE_KERNEL_EXEC); 175 176 if (!virtaddr) 177 goto cleanup; 178 179 hypercall_msr.enable = 1; 180 181 hypercall_msr.guest_physical_address = vmalloc_to_pfn(virtaddr); 182 wrmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64); 183 184 /* Confirm that hypercall page did get setup. */ 185 hypercall_msr.as_uint64 = 0; 186 rdmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64); 187 188 if (!hypercall_msr.enable) 189 goto cleanup; 190 191 hv_context.hypercall_page = virtaddr; 192 193 /* Setup the global signal event param for the signal event hypercall */ 194 hv_context.signal_event_buffer = 195 kmalloc(sizeof(struct hv_input_signal_event_buffer), 196 GFP_KERNEL); 197 if (!hv_context.signal_event_buffer) 198 goto cleanup; 199 200 hv_context.signal_event_param = 201 (struct hv_input_signal_event *) 202 (ALIGN((unsigned long) 203 hv_context.signal_event_buffer, 204 HV_HYPERCALL_PARAM_ALIGN)); 205 hv_context.signal_event_param->connectionid.asu32 = 0; 206 hv_context.signal_event_param->connectionid.u.id = 207 VMBUS_EVENT_CONNECTION_ID; 208 hv_context.signal_event_param->flag_number = 0; 209 hv_context.signal_event_param->rsvdz = 0; 210 211 return 0; 212 213 cleanup: 214 if (virtaddr) { 215 if (hypercall_msr.enable) { 216 hypercall_msr.as_uint64 = 0; 217 wrmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64); 218 } 219 220 vfree(virtaddr); 221 } 222 223 return -ENOTSUPP; 224 } 225 226 /* 227 * hv_cleanup - Cleanup routine. 228 * 229 * This routine is called normally during driver unloading or exiting. 230 */ 231 void hv_cleanup(void) 232 { 233 union hv_x64_msr_hypercall_contents hypercall_msr; 234 235 /* Reset our OS id */ 236 wrmsrl(HV_X64_MSR_GUEST_OS_ID, 0); 237 238 kfree(hv_context.signal_event_buffer); 239 hv_context.signal_event_buffer = NULL; 240 hv_context.signal_event_param = NULL; 241 242 if (hv_context.hypercall_page) { 243 hypercall_msr.as_uint64 = 0; 244 wrmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64); 245 vfree(hv_context.hypercall_page); 246 hv_context.hypercall_page = NULL; 247 } 248 } 249 250 /* 251 * hv_post_message - Post a message using the hypervisor message IPC. 252 * 253 * This involves a hypercall. 254 */ 255 u16 hv_post_message(union hv_connection_id connection_id, 256 enum hv_message_type message_type, 257 void *payload, size_t payload_size) 258 { 259 struct aligned_input { 260 u64 alignment8; 261 struct hv_input_post_message msg; 262 }; 263 264 struct hv_input_post_message *aligned_msg; 265 u16 status; 266 unsigned long addr; 267 268 if (payload_size > HV_MESSAGE_PAYLOAD_BYTE_COUNT) 269 return -EMSGSIZE; 270 271 addr = (unsigned long)kmalloc(sizeof(struct aligned_input), GFP_ATOMIC); 272 if (!addr) 273 return -ENOMEM; 274 275 aligned_msg = (struct hv_input_post_message *) 276 (ALIGN(addr, HV_HYPERCALL_PARAM_ALIGN)); 277 278 aligned_msg->connectionid = connection_id; 279 aligned_msg->message_type = message_type; 280 aligned_msg->payload_size = payload_size; 281 memcpy((void *)aligned_msg->payload, payload, payload_size); 282 283 status = do_hypercall(HVCALL_POST_MESSAGE, aligned_msg, NULL) 284 & 0xFFFF; 285 286 kfree((void *)addr); 287 288 return status; 289 } 290 291 292 /* 293 * hv_signal_event - 294 * Signal an event on the specified connection using the hypervisor event IPC. 295 * 296 * This involves a hypercall. 297 */ 298 u16 hv_signal_event(void) 299 { 300 u16 status; 301 302 status = do_hypercall(HVCALL_SIGNAL_EVENT, 303 hv_context.signal_event_param, 304 NULL) & 0xFFFF; 305 return status; 306 } 307 308 /* 309 * hv_synic_init - Initialize the Synthethic Interrupt Controller. 310 * 311 * If it is already initialized by another entity (ie x2v shim), we need to 312 * retrieve the initialized message and event pages. Otherwise, we create and 313 * initialize the message and event pages. 314 */ 315 void hv_synic_init(void *irqarg) 316 { 317 u64 version; 318 union hv_synic_simp simp; 319 union hv_synic_siefp siefp; 320 union hv_synic_sint shared_sint; 321 union hv_synic_scontrol sctrl; 322 323 u32 irq_vector = *((u32 *)(irqarg)); 324 int cpu = smp_processor_id(); 325 326 if (!hv_context.hypercall_page) 327 return; 328 329 /* Check the version */ 330 rdmsrl(HV_X64_MSR_SVERSION, version); 331 332 hv_context.synic_message_page[cpu] = 333 (void *)get_zeroed_page(GFP_ATOMIC); 334 335 if (hv_context.synic_message_page[cpu] == NULL) { 336 pr_err("Unable to allocate SYNIC message page\n"); 337 goto cleanup; 338 } 339 340 hv_context.synic_event_page[cpu] = 341 (void *)get_zeroed_page(GFP_ATOMIC); 342 343 if (hv_context.synic_event_page[cpu] == NULL) { 344 pr_err("Unable to allocate SYNIC event page\n"); 345 goto cleanup; 346 } 347 348 /* Setup the Synic's message page */ 349 rdmsrl(HV_X64_MSR_SIMP, simp.as_uint64); 350 simp.simp_enabled = 1; 351 simp.base_simp_gpa = virt_to_phys(hv_context.synic_message_page[cpu]) 352 >> PAGE_SHIFT; 353 354 wrmsrl(HV_X64_MSR_SIMP, simp.as_uint64); 355 356 /* Setup the Synic's event page */ 357 rdmsrl(HV_X64_MSR_SIEFP, siefp.as_uint64); 358 siefp.siefp_enabled = 1; 359 siefp.base_siefp_gpa = virt_to_phys(hv_context.synic_event_page[cpu]) 360 >> PAGE_SHIFT; 361 362 wrmsrl(HV_X64_MSR_SIEFP, siefp.as_uint64); 363 364 /* Setup the shared SINT. */ 365 rdmsrl(HV_X64_MSR_SINT0 + VMBUS_MESSAGE_SINT, shared_sint.as_uint64); 366 367 shared_sint.as_uint64 = 0; 368 shared_sint.vector = irq_vector; /* HV_SHARED_SINT_IDT_VECTOR + 0x20; */ 369 shared_sint.masked = false; 370 shared_sint.auto_eoi = false; 371 372 wrmsrl(HV_X64_MSR_SINT0 + VMBUS_MESSAGE_SINT, shared_sint.as_uint64); 373 374 /* Enable the global synic bit */ 375 rdmsrl(HV_X64_MSR_SCONTROL, sctrl.as_uint64); 376 sctrl.enable = 1; 377 378 wrmsrl(HV_X64_MSR_SCONTROL, sctrl.as_uint64); 379 380 hv_context.synic_initialized = true; 381 return; 382 383 cleanup: 384 if (hv_context.synic_event_page[cpu]) 385 free_page((unsigned long)hv_context.synic_event_page[cpu]); 386 387 if (hv_context.synic_message_page[cpu]) 388 free_page((unsigned long)hv_context.synic_message_page[cpu]); 389 return; 390 } 391 392 /* 393 * hv_synic_cleanup - Cleanup routine for hv_synic_init(). 394 */ 395 void hv_synic_cleanup(void *arg) 396 { 397 union hv_synic_sint shared_sint; 398 union hv_synic_simp simp; 399 union hv_synic_siefp siefp; 400 int cpu = smp_processor_id(); 401 402 if (!hv_context.synic_initialized) 403 return; 404 405 rdmsrl(HV_X64_MSR_SINT0 + VMBUS_MESSAGE_SINT, shared_sint.as_uint64); 406 407 shared_sint.masked = 1; 408 409 /* Need to correctly cleanup in the case of SMP!!! */ 410 /* Disable the interrupt */ 411 wrmsrl(HV_X64_MSR_SINT0 + VMBUS_MESSAGE_SINT, shared_sint.as_uint64); 412 413 rdmsrl(HV_X64_MSR_SIMP, simp.as_uint64); 414 simp.simp_enabled = 0; 415 simp.base_simp_gpa = 0; 416 417 wrmsrl(HV_X64_MSR_SIMP, simp.as_uint64); 418 419 rdmsrl(HV_X64_MSR_SIEFP, siefp.as_uint64); 420 siefp.siefp_enabled = 0; 421 siefp.base_siefp_gpa = 0; 422 423 wrmsrl(HV_X64_MSR_SIEFP, siefp.as_uint64); 424 425 free_page((unsigned long)hv_context.synic_message_page[cpu]); 426 free_page((unsigned long)hv_context.synic_event_page[cpu]); 427 } 428