Linux Kernel  3.7.1
 All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Groups Pages
hv.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2009, Microsoft Corporation.
3  *
4  * This program is free software; you can redistribute it and/or modify it
5  * under the terms and conditions of the GNU General Public License,
6  * version 2, as published by the Free Software Foundation.
7  *
8  * This program is distributed in the hope it will be useful, but WITHOUT
9  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10  * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
11  * more details.
12  *
13  * You should have received a copy of the GNU General Public License along with
14  * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
15  * Place - Suite 330, Boston, MA 02111-1307 USA.
16  *
17  * Authors:
18  * Haiyang Zhang <[email protected]>
19  * Hank Janssen <[email protected]>
20  *
21  */
22 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
23 
24 #include <linux/kernel.h>
25 #include <linux/mm.h>
26 #include <linux/slab.h>
27 #include <linux/vmalloc.h>
28 #include <linux/hyperv.h>
29 #include <linux/version.h>
30 #include <asm/hyperv.h>
31 #include "hyperv_vmbus.h"
32 
33 /* The one and only */
35  .synic_initialized = false,
36  .hypercall_page = NULL,
37  .signal_event_param = NULL,
38  .signal_event_buffer = NULL,
39 };
40 
41 /*
42  * query_hypervisor_info - Get version info of the windows hypervisor
43  */
44 static int query_hypervisor_info(void)
45 {
46  unsigned int eax;
47  unsigned int ebx;
48  unsigned int ecx;
49  unsigned int edx;
50  unsigned int max_leaf;
51  unsigned int op;
52 
53  /*
54  * Its assumed that this is called after confirming that Viridian
55  * is present. Query id and revision.
56  */
57  eax = 0;
58  ebx = 0;
59  ecx = 0;
60  edx = 0;
62  cpuid(op, &eax, &ebx, &ecx, &edx);
63 
64  max_leaf = eax;
65 
66  if (max_leaf >= HVCPUID_VERSION) {
67  eax = 0;
68  ebx = 0;
69  ecx = 0;
70  edx = 0;
71  op = HVCPUID_VERSION;
72  cpuid(op, &eax, &ebx, &ecx, &edx);
73  pr_info("Hyper-V Host OS Build:%d-%d.%d-%d-%d.%d\n",
74  eax,
75  ebx >> 16,
76  ebx & 0xFFFF,
77  ecx,
78  edx >> 24,
79  edx & 0xFFFFFF);
80  }
81  return max_leaf;
82 }
83 
84 /*
85  * do_hypercall- Invoke the specified hypercall
86  */
87 static u64 do_hypercall(u64 control, void *input, void *output)
88 {
89 #ifdef CONFIG_X86_64
90  u64 hv_status = 0;
91  u64 input_address = (input) ? virt_to_phys(input) : 0;
92  u64 output_address = (output) ? virt_to_phys(output) : 0;
93  void *hypercall_page = hv_context.hypercall_page;
94 
95  __asm__ __volatile__("mov %0, %%r8" : : "r" (output_address) : "r8");
96  __asm__ __volatile__("call *%3" : "=a" (hv_status) :
97  "c" (control), "d" (input_address),
98  "m" (hypercall_page));
99 
100  return hv_status;
101 
102 #else
103 
104  u32 control_hi = control >> 32;
105  u32 control_lo = control & 0xFFFFFFFF;
106  u32 hv_status_hi = 1;
107  u32 hv_status_lo = 1;
108  u64 input_address = (input) ? virt_to_phys(input) : 0;
109  u32 input_address_hi = input_address >> 32;
110  u32 input_address_lo = input_address & 0xFFFFFFFF;
111  u64 output_address = (output) ? virt_to_phys(output) : 0;
112  u32 output_address_hi = output_address >> 32;
113  u32 output_address_lo = output_address & 0xFFFFFFFF;
114  void *hypercall_page = hv_context.hypercall_page;
115 
116  __asm__ __volatile__ ("call *%8" : "=d"(hv_status_hi),
117  "=a"(hv_status_lo) : "d" (control_hi),
118  "a" (control_lo), "b" (input_address_hi),
119  "c" (input_address_lo), "D"(output_address_hi),
120  "S"(output_address_lo), "m" (hypercall_page));
121 
122  return hv_status_lo | ((u64)hv_status_hi << 32);
123 #endif /* !x86_64 */
124 }
125 
126 /*
127  * hv_init - Main initialization routine.
128  *
129  * This routine must be called before any other routines in here are called
130  */
131 int hv_init(void)
132 {
133  int max_leaf;
134  union hv_x64_msr_hypercall_contents hypercall_msr;
135  void *virtaddr = NULL;
136 
137  memset(hv_context.synic_event_page, 0, sizeof(void *) * NR_CPUS);
138  memset(hv_context.synic_message_page, 0,
139  sizeof(void *) * NR_CPUS);
140 
141  max_leaf = query_hypervisor_info();
142 
143  /*
144  * Write our OS ID.
145  */
146  hv_context.guestid = generate_guest_id(0, LINUX_VERSION_CODE, 0);
147  wrmsrl(HV_X64_MSR_GUEST_OS_ID, hv_context.guestid);
148 
149  /* See if the hypercall page is already set */
150  rdmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64);
151 
153 
154  if (!virtaddr)
155  goto cleanup;
156 
157  hypercall_msr.enable = 1;
158 
159  hypercall_msr.guest_physical_address = vmalloc_to_pfn(virtaddr);
160  wrmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64);
161 
162  /* Confirm that hypercall page did get setup. */
163  hypercall_msr.as_uint64 = 0;
164  rdmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64);
165 
166  if (!hypercall_msr.enable)
167  goto cleanup;
168 
169  hv_context.hypercall_page = virtaddr;
170 
171  /* Setup the global signal event param for the signal event hypercall */
172  hv_context.signal_event_buffer =
173  kmalloc(sizeof(struct hv_input_signal_event_buffer),
174  GFP_KERNEL);
175  if (!hv_context.signal_event_buffer)
176  goto cleanup;
177 
178  hv_context.signal_event_param =
179  (struct hv_input_signal_event *)
180  (ALIGN((unsigned long)
181  hv_context.signal_event_buffer,
183  hv_context.signal_event_param->connectionid.asu32 = 0;
184  hv_context.signal_event_param->connectionid.u.id =
186  hv_context.signal_event_param->flag_number = 0;
187  hv_context.signal_event_param->rsvdz = 0;
188 
189  return 0;
190 
191 cleanup:
192  if (virtaddr) {
193  if (hypercall_msr.enable) {
194  hypercall_msr.as_uint64 = 0;
195  wrmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64);
196  }
197 
198  vfree(virtaddr);
199  }
200 
201  return -ENOTSUPP;
202 }
203 
204 /*
205  * hv_cleanup - Cleanup routine.
206  *
207  * This routine is called normally during driver unloading or exiting.
208  */
209 void hv_cleanup(void)
210 {
211  union hv_x64_msr_hypercall_contents hypercall_msr;
212 
213  /* Reset our OS id */
214  wrmsrl(HV_X64_MSR_GUEST_OS_ID, 0);
215 
216  kfree(hv_context.signal_event_buffer);
217  hv_context.signal_event_buffer = NULL;
218  hv_context.signal_event_param = NULL;
219 
220  if (hv_context.hypercall_page) {
221  hypercall_msr.as_uint64 = 0;
222  wrmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64);
223  vfree(hv_context.hypercall_page);
224  hv_context.hypercall_page = NULL;
225  }
226 }
227 
228 /*
229  * hv_post_message - Post a message using the hypervisor message IPC.
230  *
231  * This involves a hypercall.
232  */
233 int hv_post_message(union hv_connection_id connection_id,
234  enum hv_message_type message_type,
235  void *payload, size_t payload_size)
236 {
237  struct aligned_input {
238  u64 alignment8;
239  struct hv_input_post_message msg;
240  };
241 
242  struct hv_input_post_message *aligned_msg;
243  u16 status;
244  unsigned long addr;
245 
246  if (payload_size > HV_MESSAGE_PAYLOAD_BYTE_COUNT)
247  return -EMSGSIZE;
248 
249  addr = (unsigned long)kmalloc(sizeof(struct aligned_input), GFP_ATOMIC);
250  if (!addr)
251  return -ENOMEM;
252 
253  aligned_msg = (struct hv_input_post_message *)
255 
256  aligned_msg->connectionid = connection_id;
257  aligned_msg->message_type = message_type;
258  aligned_msg->payload_size = payload_size;
259  memcpy((void *)aligned_msg->payload, payload, payload_size);
260 
261  status = do_hypercall(HVCALL_POST_MESSAGE, aligned_msg, NULL)
262  & 0xFFFF;
263 
264  kfree((void *)addr);
265 
266  return status;
267 }
268 
269 
270 /*
271  * hv_signal_event -
272  * Signal an event on the specified connection using the hypervisor event IPC.
273  *
274  * This involves a hypercall.
275  */
277 {
278  u16 status;
279 
280  status = do_hypercall(HVCALL_SIGNAL_EVENT,
281  hv_context.signal_event_param,
282  NULL) & 0xFFFF;
283  return status;
284 }
285 
286 /*
287  * hv_synic_init - Initialize the Synthethic Interrupt Controller.
288  *
289  * If it is already initialized by another entity (ie x2v shim), we need to
290  * retrieve the initialized message and event pages. Otherwise, we create and
291  * initialize the message and event pages.
292  */
293 void hv_synic_init(void *irqarg)
294 {
295  u64 version;
296  union hv_synic_simp simp;
297  union hv_synic_siefp siefp;
298  union hv_synic_sint shared_sint;
299  union hv_synic_scontrol sctrl;
300 
301  u32 irq_vector = *((u32 *)(irqarg));
302  int cpu = smp_processor_id();
303 
304  if (!hv_context.hypercall_page)
305  return;
306 
307  /* Check the version */
308  rdmsrl(HV_X64_MSR_SVERSION, version);
309 
310  hv_context.synic_message_page[cpu] =
311  (void *)get_zeroed_page(GFP_ATOMIC);
312 
313  if (hv_context.synic_message_page[cpu] == NULL) {
314  pr_err("Unable to allocate SYNIC message page\n");
315  goto cleanup;
316  }
317 
318  hv_context.synic_event_page[cpu] =
319  (void *)get_zeroed_page(GFP_ATOMIC);
320 
321  if (hv_context.synic_event_page[cpu] == NULL) {
322  pr_err("Unable to allocate SYNIC event page\n");
323  goto cleanup;
324  }
325 
326  /* Setup the Synic's message page */
327  rdmsrl(HV_X64_MSR_SIMP, simp.as_uint64);
328  simp.simp_enabled = 1;
329  simp.base_simp_gpa = virt_to_phys(hv_context.synic_message_page[cpu])
330  >> PAGE_SHIFT;
331 
332  wrmsrl(HV_X64_MSR_SIMP, simp.as_uint64);
333 
334  /* Setup the Synic's event page */
335  rdmsrl(HV_X64_MSR_SIEFP, siefp.as_uint64);
336  siefp.siefp_enabled = 1;
337  siefp.base_siefp_gpa = virt_to_phys(hv_context.synic_event_page[cpu])
338  >> PAGE_SHIFT;
339 
340  wrmsrl(HV_X64_MSR_SIEFP, siefp.as_uint64);
341 
342  /* Setup the shared SINT. */
343  rdmsrl(HV_X64_MSR_SINT0 + VMBUS_MESSAGE_SINT, shared_sint.as_uint64);
344 
345  shared_sint.as_uint64 = 0;
346  shared_sint.vector = irq_vector; /* HV_SHARED_SINT_IDT_VECTOR + 0x20; */
347  shared_sint.masked = false;
348  shared_sint.auto_eoi = false;
349 
350  wrmsrl(HV_X64_MSR_SINT0 + VMBUS_MESSAGE_SINT, shared_sint.as_uint64);
351 
352  /* Enable the global synic bit */
353  rdmsrl(HV_X64_MSR_SCONTROL, sctrl.as_uint64);
354  sctrl.enable = 1;
355 
356  wrmsrl(HV_X64_MSR_SCONTROL, sctrl.as_uint64);
357 
358  hv_context.synic_initialized = true;
359  return;
360 
361 cleanup:
362  if (hv_context.synic_event_page[cpu])
363  free_page((unsigned long)hv_context.synic_event_page[cpu]);
364 
365  if (hv_context.synic_message_page[cpu])
366  free_page((unsigned long)hv_context.synic_message_page[cpu]);
367  return;
368 }
369 
370 /*
371  * hv_synic_cleanup - Cleanup routine for hv_synic_init().
372  */
374 {
375  union hv_synic_sint shared_sint;
376  union hv_synic_simp simp;
377  union hv_synic_siefp siefp;
378  int cpu = smp_processor_id();
379 
380  if (!hv_context.synic_initialized)
381  return;
382 
383  rdmsrl(HV_X64_MSR_SINT0 + VMBUS_MESSAGE_SINT, shared_sint.as_uint64);
384 
385  shared_sint.masked = 1;
386 
387  /* Need to correctly cleanup in the case of SMP!!! */
388  /* Disable the interrupt */
389  wrmsrl(HV_X64_MSR_SINT0 + VMBUS_MESSAGE_SINT, shared_sint.as_uint64);
390 
391  rdmsrl(HV_X64_MSR_SIMP, simp.as_uint64);
392  simp.simp_enabled = 0;
393  simp.base_simp_gpa = 0;
394 
395  wrmsrl(HV_X64_MSR_SIMP, simp.as_uint64);
396 
397  rdmsrl(HV_X64_MSR_SIEFP, siefp.as_uint64);
398  siefp.siefp_enabled = 0;
399  siefp.base_siefp_gpa = 0;
400 
401  wrmsrl(HV_X64_MSR_SIEFP, siefp.as_uint64);
402 
403  free_page((unsigned long)hv_context.synic_message_page[cpu]);
404  free_page((unsigned long)hv_context.synic_event_page[cpu]);
405 }