1 #include "kvm/kvm-cpu.h"
3 #include "kvm/symbol.h"
7 #include <asm/msr-index.h>
/*
 * is_in_protected_mode - test bit 0 (PE) of the cached CR0 value
 *
 * Only vcpu->sregs is consulted; no ioctl is issued here, so the answer is
 * as fresh as the last time that structure was filled in.
 */
17 static inline bool is_in_protected_mode(struct kvm_cpu *vcpu)
19 return vcpu->sregs.cr0 & 0x01;
/*
 * ip_to_flat - turn an instruction pointer into a flat address
 *
 * On the path visible here the CS selector is shifted left by four bits and
 * added to ip, which is real-mode segment:offset addressing.
 * NOTE(review): the statement guarded by the protected-mode check is not
 * visible in this listing; presumably ip is returned unchanged -- confirm.
 */
22 static inline u64 ip_to_flat(struct kvm_cpu *vcpu, u64 ip)
27 * NOTE! We should take code segment base address into account here.
28 * Luckily it's usually zero because Linux uses flat memory model.
30 if (is_in_protected_mode(vcpu))
33 cs = vcpu->sregs.cs.selector;
35 return ip + (cs << 4);
/*
 * selector_to_base - compute the segment base that belongs to a selector
 *
 * Returns selector * 16; the selector is cast to u32 before multiplying.
 */
38 static inline u32 selector_to_base(u16 selector)
41 * KVM on Intel requires 'base' to be 'selector * 16' in real mode.
43 return (u32)selector * 16;
/*
 * kvm_cpu__new - allocate a zero-filled struct kvm_cpu
 *
 * The structure comes from calloc(), so every field starts out as zero.
 * NOTE(review): the rest of the body (allocation check, use of the kvm
 * argument, return statement) is not visible in this listing.
 */
46 static struct kvm_cpu *kvm_cpu__new(struct kvm *kvm)
50 vcpu = calloc(1, sizeof *vcpu);
59 void kvm_cpu__delete(struct kvm_cpu *vcpu)
/*
 * kvm_cpu__init - create vcpu number cpu_id for the given VM
 *
 * Allocates the bookkeeping structure with kvm_cpu__new(), creates the
 * in-kernel vcpu with KVM_CREATE_VCPU and maps its kvm_run area. Failing
 * ioctls are reported through die_perror(), a failed mmap through die().
 * NOTE(review): the check on the kvm_cpu__new() result, the condition in
 * front of the KVM_GET_VCPU_MMAP_SIZE error and the return statement are
 * not visible in this listing.
 */
67 struct kvm_cpu *kvm_cpu__init(struct kvm *kvm, unsigned long cpu_id)
72 vcpu = kvm_cpu__new(kvm);
76 vcpu->cpu_id = cpu_id;
/* The vcpu is created on the VM descriptor; the result is stored as the vcpu fd. */
78 vcpu->vcpu_fd = ioctl(vcpu->kvm->vm_fd, KVM_CREATE_VCPU, cpu_id);
79 if (vcpu->vcpu_fd < 0)
80 die_perror("KVM_CREATE_VCPU ioctl");
/* The size of the kvm_run mapping is queried on the system descriptor. */
82 mmap_size = ioctl(vcpu->kvm->sys_fd, KVM_GET_VCPU_MMAP_SIZE, 0);
84 die_perror("KVM_GET_VCPU_MMAP_SIZE ioctl");
/* Shared mapping of the run structure, backed by the vcpu fd. */
86 vcpu->kvm_run = mmap(NULL, mmap_size, PROT_RW, MAP_SHARED, vcpu->vcpu_fd, 0);
87 if (vcpu->kvm_run == MAP_FAILED)
88 die("unable to mmap vcpu fd");
/*
 * kvm_cpu__enable_singlestep - turn on guest debugging in single-step mode
 *
 * Issues KVM_SET_GUEST_DEBUG with the control word
 * KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP. A failing ioctl is only
 * reported through pr_warning(); no status reaches the caller.
 */
93 void kvm_cpu__enable_singlestep(struct kvm_cpu *vcpu)
95 struct kvm_guest_debug debug = {
96 .control = KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP,
99 if (ioctl(vcpu->vcpu_fd, KVM_SET_GUEST_DEBUG, &debug) < 0)
100 pr_warning("KVM_SET_GUEST_DEBUG failed");
/*
 * kvm_msrs__new - allocate a zeroed struct kvm_msrs with room for nmsrs entries
 *
 * A single calloc() covers the structure itself plus
 * nmsrs * sizeof(struct kvm_msr_entry) bytes for the entries.
 * NOTE(review): the local is named vcpu although it points to a
 * struct kvm_msrs. The condition guarding die("out of memory") and the
 * return statement are not visible in this listing.
 */
103 static struct kvm_msrs *kvm_msrs__new(size_t nmsrs)
105 struct kvm_msrs *vcpu = calloc(1, sizeof(*vcpu) + (sizeof(struct kvm_msr_entry) * nmsrs));
108 die("out of memory");
/*
 * KVM_MSR_ENTRY - compound literal for one struct kvm_msr_entry
 *
 * Expands to a struct kvm_msr_entry whose index and data members take the
 * two arguments; members that are not named are zero-initialized.
 * The parameter names must differ from the member names, otherwise the
 * designators themselves would be substituted during expansion.
 */
#define KVM_MSR_ENTRY(msr_index, msr_data)				\
	(struct kvm_msr_entry) {					\
		.index	= (msr_index),					\
		.data	= (msr_data),					\
	}
/*
 * kvm_cpu__setup_msrs - program the initial model-specific registers
 *
 * Allocates a kvm_msrs buffer with room for 100 entries, fills the first
 * nine (the three SYSENTER MSRs, STAR, CSTAR, KERNEL_GS_BASE, SYSCALL_MASK,
 * LSTAR and the TSC) with zero, records the count in nmsrs and hands the
 * list to KVM_SET_MSRS. A failing ioctl ends in die_perror().
 * NOTE(review): every call stores a fresh allocation in vcpu->msrs without
 * releasing an earlier one; confirm this runs only once per vcpu.
 */
116 static void kvm_cpu__setup_msrs(struct kvm_cpu *vcpu)
118 unsigned long ndx = 0;
120 vcpu->msrs = kvm_msrs__new(100);
122 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_SYSENTER_CS, 0x0);
123 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_SYSENTER_ESP, 0x0);
124 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_SYSENTER_EIP, 0x0);
126 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_STAR, 0x0);
127 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_CSTAR, 0x0);
128 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_KERNEL_GS_BASE, 0x0);
129 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_SYSCALL_MASK, 0x0);
130 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_LSTAR, 0x0);
132 vcpu->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_TSC, 0x0);
/* ndx now equals the number of entries filled in above. */
134 vcpu->msrs->nmsrs = ndx;
136 if (ioctl(vcpu->vcpu_fd, KVM_SET_MSRS, vcpu->msrs) < 0)
137 die_perror("KVM_SET_MSRS failed");
/*
 * kvm_cpu__setup_fpu - replace the cached FPU state and push it to KVM
 *
 * vcpu->fpu is overwritten with a compound literal and then passed to
 * KVM_SET_FPU; a failing ioctl ends in die_perror().
 * NOTE(review): the members named in the initializer are not visible in
 * this listing.
 */
140 static void kvm_cpu__setup_fpu(struct kvm_cpu *vcpu)
142 vcpu->fpu = (struct kvm_fpu) {
147 if (ioctl(vcpu->vcpu_fd, KVM_SET_FPU, &vcpu->fpu) < 0)
148 die_perror("KVM_SET_FPU failed");
/*
 * kvm_cpu__setup_regs - load the boot-time general purpose registers
 *
 * rflags is set to 0x2, rip comes from kvm->boot_ip and both rsp and rbp
 * from kvm->boot_sp; every other register is zero because the compound
 * literal leaves it unnamed. A boot ip above USHRT_MAX is rejected with
 * die() before the registers are handed to KVM_SET_REGS.
 */
151 static void kvm_cpu__setup_regs(struct kvm_cpu *vcpu)
153 vcpu->regs = (struct kvm_regs) {
154 /* We start the guest in 16-bit real mode */
155 .rflags = 0x0000000000000002ULL,
157 .rip = vcpu->kvm->boot_ip,
158 .rsp = vcpu->kvm->boot_sp,
159 .rbp = vcpu->kvm->boot_sp,
162 if (vcpu->regs.rip > USHRT_MAX)
163 die("ip 0x%llx is too high for real mode", (u64) vcpu->regs.rip);
165 if (ioctl(vcpu->vcpu_fd, KVM_SET_REGS, &vcpu->regs) < 0)
166 die_perror("KVM_SET_REGS failed");
/*
 * kvm_cpu__setup_sregs - point all six segment registers at the boot selector
 *
 * Reads the current special registers, sets selector and base of cs, ss,
 * ds, es, fs and gs from kvm->boot_selector (base via selector_to_base()),
 * and writes the set back with KVM_SET_SREGS. Fields that are not assigned
 * here keep the values returned by KVM_GET_SREGS.
 */
169 static void kvm_cpu__setup_sregs(struct kvm_cpu *vcpu)
172 if (ioctl(vcpu->vcpu_fd, KVM_GET_SREGS, &vcpu->sregs) < 0)
173 die_perror("KVM_GET_SREGS failed");
175 vcpu->sregs.cs.selector = vcpu->kvm->boot_selector;
176 vcpu->sregs.cs.base = selector_to_base(vcpu->kvm->boot_selector);
177 vcpu->sregs.ss.selector = vcpu->kvm->boot_selector;
178 vcpu->sregs.ss.base = selector_to_base(vcpu->kvm->boot_selector);
179 vcpu->sregs.ds.selector = vcpu->kvm->boot_selector;
180 vcpu->sregs.ds.base = selector_to_base(vcpu->kvm->boot_selector);
181 vcpu->sregs.es.selector = vcpu->kvm->boot_selector;
182 vcpu->sregs.es.base = selector_to_base(vcpu->kvm->boot_selector);
183 vcpu->sregs.fs.selector = vcpu->kvm->boot_selector;
184 vcpu->sregs.fs.base = selector_to_base(vcpu->kvm->boot_selector);
185 vcpu->sregs.gs.selector = vcpu->kvm->boot_selector;
186 vcpu->sregs.gs.base = selector_to_base(vcpu->kvm->boot_selector);
188 if (ioctl(vcpu->vcpu_fd, KVM_SET_SREGS, &vcpu->sregs) < 0)
189 die_perror("KVM_SET_SREGS failed");
/*
 * Runs the four setup helpers in a fixed order: special registers, general
 * purpose registers, FPU state, then MSRs.
 */
193 * kvm_cpu__reset_vcpu - reset virtual CPU to a known state
195 void kvm_cpu__reset_vcpu(struct kvm_cpu *vcpu)
197 kvm_cpu__setup_sregs(vcpu);
198 kvm_cpu__setup_regs(vcpu);
199 kvm_cpu__setup_fpu(vcpu);
200 kvm_cpu__setup_msrs(vcpu);
/*
 * print_dtable - print one descriptor table register
 *
 * Prints the name, the base as 16 hex digits and the limit (converted to
 * u16) as a zero-padded hex field, followed by a newline.
 */
203 static void print_dtable(const char *name, struct kvm_dtable *dtable)
205 printf(" %s %016llx %08hx\n",
206 name, (u64) dtable->base, (u16) dtable->limit);
/*
 * print_segment - print one segment register as a single row
 *
 * Columns, in order: selector, base, limit, type, then the present, dpl,
 * db, s, l, g and avl fields, all in hex.
 */
209 static void print_segment(const char *name, struct kvm_segment *seg)
211 printf(" %s %04hx %016llx %08x %02hhx %x %x %x %x %x %x %x\n",
212 name, (u16) seg->selector, (u64) seg->base, (u32) seg->limit,
213 (u8) seg->type, seg->present, seg->dpl, seg->db, seg->s, seg->l, seg->g, seg->avl);
216 void kvm_cpu__show_registers(struct kvm_cpu *vcpu)
218 unsigned long cr0, cr2, cr3;
219 unsigned long cr4, cr8;
220 unsigned long rax, rbx, rcx;
221 unsigned long rdx, rsi, rdi;
222 unsigned long rbp, r8, r9;
223 unsigned long r10, r11, r12;
224 unsigned long r13, r14, r15;
225 unsigned long rip, rsp;
226 struct kvm_sregs sregs;
227 unsigned long rflags;
228 struct kvm_regs regs;
231 if (ioctl(vcpu->vcpu_fd, KVM_GET_REGS, ®s) < 0)
232 die("KVM_GET_REGS failed");
234 rflags = regs.rflags;
236 rip = regs.rip; rsp = regs.rsp;
237 rax = regs.rax; rbx = regs.rbx; rcx = regs.rcx;
238 rdx = regs.rdx; rsi = regs.rsi; rdi = regs.rdi;
239 rbp = regs.rbp; r8 = regs.r8; r9 = regs.r9;
240 r10 = regs.r10; r11 = regs.r11; r12 = regs.r12;
241 r13 = regs.r13; r14 = regs.r14; r15 = regs.r15;
243 printf("\n Registers:\n");
244 printf( " ----------\n");
245 printf(" rip: %016lx rsp: %016lx flags: %016lx\n", rip, rsp, rflags);
246 printf(" rax: %016lx rbx: %016lx rcx: %016lx\n", rax, rbx, rcx);
247 printf(" rdx: %016lx rsi: %016lx rdi: %016lx\n", rdx, rsi, rdi);
248 printf(" rbp: %016lx r8: %016lx r9: %016lx\n", rbp, r8, r9);
249 printf(" r10: %016lx r11: %016lx r12: %016lx\n", r10, r11, r12);
250 printf(" r13: %016lx r14: %016lx r15: %016lx\n", r13, r14, r15);
252 if (ioctl(vcpu->vcpu_fd, KVM_GET_SREGS, &sregs) < 0)
253 die("KVM_GET_REGS failed");
255 cr0 = sregs.cr0; cr2 = sregs.cr2; cr3 = sregs.cr3;
256 cr4 = sregs.cr4; cr8 = sregs.cr8;
258 printf(" cr0: %016lx cr2: %016lx cr3: %016lx\n", cr0, cr2, cr3);
259 printf(" cr4: %016lx cr8: %016lx\n", cr4, cr8);
260 printf("\n Segment registers:\n");
261 printf( " ------------------\n");
262 printf(" register selector base limit type p dpl db s l g avl\n");
263 print_segment("cs ", &sregs.cs);
264 print_segment("ss ", &sregs.ss);
265 print_segment("ds ", &sregs.ds);
266 print_segment("es ", &sregs.es);
267 print_segment("fs ", &sregs.fs);
268 print_segment("gs ", &sregs.gs);
269 print_segment("tr ", &sregs.tr);
270 print_segment("ldt", &sregs.ldt);
271 print_dtable("gdt", &sregs.gdt);
272 print_dtable("idt", &sregs.idt);
274 printf("\n APIC:\n");
276 printf(" efer: %016llx apic base: %016llx nmi: %s\n",
277 (u64) sregs.efer, (u64) sregs.apic_base,
278 (vcpu->kvm->nmi_disabled ? "disabled" : "enabled"));
280 printf("\n Interrupt bitmap:\n");
281 printf( " -----------------\n");
282 for (i = 0; i < (KVM_NR_INTERRUPTS + 63) / 64; i++)
283 printf(" %016llx", (u64) sregs.interrupt_bitmap[i]);
/* Size of the buffer that receives the symbol name looked up for rip. */
287 #define MAX_SYM_LEN 128
/*
 * kvm_cpu__show_code - print the code bytes around rip and the top of the stack
 *
 * Refreshes vcpu->regs and vcpu->sregs from KVM, then walks 64 bytes of
 * guest memory starting 43 bytes (64 * 43 / 64) before the flat address of
 * rip. The byte located exactly at rip is printed inside angle brackets.
 * Afterwards 32 bytes starting at rsp are dumped through kvm__dump_mem().
 * NOTE(review): the local declarations, what happens for a byte outside
 * guest RAM, and the printing of ordinary bytes are not visible in this
 * listing.
 */
289 void kvm_cpu__show_code(struct kvm_cpu *vcpu)
291 unsigned int code_bytes = 64;
292 unsigned int code_prologue = code_bytes * 43 / 64;
293 unsigned int code_len = code_bytes;
294 char sym[MAX_SYM_LEN];
299 if (ioctl(vcpu->vcpu_fd, KVM_GET_REGS, &vcpu->regs) < 0)
300 die("KVM_GET_REGS failed");
302 if (ioctl(vcpu->vcpu_fd, KVM_GET_SREGS, &vcpu->sregs) < 0)
303 die("KVM_GET_SREGS failed");
/* Host pointer to the first byte of the window, code_prologue bytes before rip. */
305 ip = guest_flat_to_host(vcpu->kvm, ip_to_flat(vcpu, vcpu->regs.rip) - code_prologue);
307 printf("\n Code:\n");
310 symbol__lookup(vcpu->kvm, vcpu->regs.rip, sym, MAX_SYM_LEN);
312 printf(" rip: [<%016lx>] %s\n\n", (unsigned long) vcpu->regs.rip, sym);
314 for (i = 0; i < code_len; i++, ip++) {
315 if (!host_ptr_in_ram(vcpu->kvm, ip))
/* Mark the byte the instruction pointer currently refers to. */
320 if (ip == guest_flat_to_host(vcpu->kvm, ip_to_flat(vcpu, vcpu->regs.rip)))
321 printf(" <%02x>", c);
328 printf("\n Stack:\n");
329 printf( " ------\n");
330 kvm__dump_mem(vcpu->kvm, vcpu->regs.rsp, 32);
/*
 * kvm_cpu__show_page_tables - print one entry from each paging level
 *
 * Starting from CR3, each table address is translated to a host pointer
 * and checked against guest RAM; the entry found at that pointer, with its
 * low 12 bits masked off, is used as the address of the next level.
 * Depending on bit 7 of the pte2 entry, three or four entries are printed.
 * NOTE(review): the protected-mode test reads vcpu->sregs before it is
 * refreshed by the KVM_GET_SREGS call just below, so it sees the previously
 * cached CR0. The statements executed when a check fails are not visible
 * in this listing.
 */
333 void kvm_cpu__show_page_tables(struct kvm_cpu *vcpu)
340 if (!is_in_protected_mode(vcpu))
343 if (ioctl(vcpu->vcpu_fd, KVM_GET_SREGS, &vcpu->sregs) < 0)
344 die("KVM_GET_SREGS failed");
346 pte4 = guest_flat_to_host(vcpu->kvm, vcpu->sregs.cr3);
347 if (!host_ptr_in_ram(vcpu->kvm, pte4))
350 pte3 = guest_flat_to_host(vcpu->kvm, (*pte4 & ~0xfff));
351 if (!host_ptr_in_ram(vcpu->kvm, pte3))
354 pte2 = guest_flat_to_host(vcpu->kvm, (*pte3 & ~0xfff));
355 if (!host_ptr_in_ram(vcpu->kvm, pte2))
358 pte1 = guest_flat_to_host(vcpu->kvm, (*pte2 & ~0xfff));
359 if (!host_ptr_in_ram(vcpu->kvm, pte1))
362 printf("Page Tables:\n");
/* Bit 7 set in the pte2 entry: presumably a large page, so pte1 is left out -- confirm. */
363 if (*pte2 & (1 << 7))
364 printf(" pte4: %016llx pte3: %016llx"
366 *pte4, *pte3, *pte2);
368 printf(" pte4: %016llx pte3: %016llx pte2: %016"
369 "llx pte1: %016llx\n",
370 *pte4, *pte3, *pte2, *pte1);
/*
 * kvm_cpu__run - enter the guest through the KVM_RUN ioctl
 *
 * A non-zero result is fatal (die_perror()) unless errno is EINTR or
 * EAGAIN; for those two values no error is raised here.
 */
373 void kvm_cpu__run(struct kvm_cpu *vcpu)
377 err = ioctl(vcpu->vcpu_fd, KVM_RUN, 0);
378 if (err && (errno != EINTR && errno != EAGAIN))
379 die_perror("KVM_RUN failed");
382 int kvm_cpu__start(struct kvm_cpu *cpu)
386 sigemptyset(&sigset);
387 sigaddset(&sigset, SIGALRM);
389 pthread_sigmask(SIG_BLOCK, &sigset, NULL);
391 kvm_cpu__setup_cpuid(cpu);
392 kvm_cpu__reset_vcpu(cpu);
397 switch (cpu->kvm_run->exit_reason) {
398 case KVM_EXIT_UNKNOWN:
401 kvm_cpu__show_registers(cpu);
402 kvm_cpu__show_code(cpu);
407 ret = kvm__emulate_io(cpu->kvm,
408 cpu->kvm_run->io.port,
410 cpu->kvm_run->io.data_offset,
411 cpu->kvm_run->io.direction,
412 cpu->kvm_run->io.size,
413 cpu->kvm_run->io.count);
419 case KVM_EXIT_MMIO: {
422 ret = kvm__emulate_mmio(cpu->kvm,
423 cpu->kvm_run->mmio.phys_addr,
424 cpu->kvm_run->mmio.data,
425 cpu->kvm_run->mmio.len,
426 cpu->kvm_run->mmio.is_write);
434 case KVM_EXIT_SHUTDOWN: