lg.h 8.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260
  1. #ifndef _LGUEST_H
  2. #define _LGUEST_H
  3. #ifndef __ASSEMBLY__
  4. #include <linux/types.h>
  5. #include <linux/init.h>
  6. #include <linux/stringify.h>
  7. #include <linux/lguest.h>
  8. #include <linux/lguest_launcher.h>
  9. #include <linux/wait.h>
  10. #include <linux/hrtimer.h>
  11. #include <linux/err.h>
  12. #include <linux/slab.h>
  13. #include <asm/lguest.h>
  /*
   * Bookkeeping for one page directory. struct lguest holds a small array of
   * these (pgdirs[]), and lg_cpu.cpu_pgd records which one a cpu is using.
   */
  14. struct pgdir {
  /*
   * NOTE(review): presumably the Guest's own address for this page directory
   * (guest_set_pgd()/guest_set_pte() take a "gpgdir" argument of the same
   * type) - confirm in page_tables.c.
   */
  15. unsigned long gpgdir;
  /* NOTE(review): looks like "is the Switcher mapped in this pgdir?" - confirm. */
  16. bool switcher_mapped;
  /* NOTE(review): presumably the last Host cpu this pgdir was used on - confirm. */
  17. int last_host_cpu;
  /* Pointer to the pgd_t entries of the page directory itself. */
  18. pgd_t *pgdir;
  19. };
  20. /* We have two pages shared with guests, per cpu. */
  21. struct lguest_pages {
  22. /* This is the stack page mapped rw in guest */
  /*
   * spare is sized so that spare + regs together occupy exactly PAGE_SIZE
   * bytes: regs therefore sits at the very end of the first page.
   */
  23. char spare[PAGE_SIZE - sizeof(struct lguest_regs)];
  24. struct lguest_regs regs;
  25. /* This is the host state & guest descriptor page, ro in guest */
  26. struct lguest_ro_state state;
  /* The structure as a whole is aligned to a page boundary. */
  27. } __attribute__((aligned(PAGE_SIZE)));
  /*
   * Bit flags stored in lg_cpu.changed.
   *
   * CHANGED_ALL is built from the named flags instead of a bare literal so it
   * cannot drift from them. CHANGED_GDT_TLS is deliberately left out of it: it
   * is a subset of CHANGED_GDT, so CHANGED_ALL keeps its value of 3.
   */
  #define CHANGED_IDT         1
  #define CHANGED_GDT         2
  #define CHANGED_GDT_TLS     4 /* Actually a subset of CHANGED_GDT */
  #define CHANGED_ALL         (CHANGED_IDT | CHANGED_GDT)
  /*
   * Per-virtual-cpu state of a Guest. struct lguest embeds an array of these
   * (cpus[NR_CPUS]); each one points back at its owner through ->lg.
   */
  32. struct lg_cpu {
  /* NOTE(review): presumably this cpu's index within lg->cpus[] - confirm. */
  33. unsigned int id;
  /* The Guest this cpu belongs to (kill_guest() reaches lg->dead through it). */
  34. struct lguest *lg;
  35. struct task_struct *tsk;
  36. struct mm_struct *mm; /* == tsk->mm, but that becomes NULL on exit */
  /*
   * NOTE(review): cr2, ts, esp1 and ss1 look like saved Guest x86 state (fault
   * address, TS flag, and the stack pointer/segment passed to
   * guest_set_stack()) - confirm in the arch code.
   */
  37. u32 cr2;
  38. int ts;
  39. u32 esp1;
  40. u16 ss1;
  41. /* Bitmap of what has changed: see CHANGED_* above. */
  42. int changed;
  43. /* Pending operation. */
  44. struct lguest_pending pending;
  45. unsigned long *reg_read; /* register from LHREQ_GETREG */
  46. /* At end of a page shared mapped over lguest_pages in guest. */
  47. unsigned long regs_page;
  48. struct lguest_regs *regs;
  /* NOTE(review): presumably the lguest_pages this cpu last ran with - confirm. */
  49. struct lguest_pages *last_pages;
  50. /* Initialization mode: linear map everything. */
  51. bool linear_pages;
  52. int cpu_pgd; /* Which pgd this cpu is currently using */
  53. /* If a hypercall was asked for, this points to the arguments. */
  54. struct hcall_args *hcall;
  55. u32 next_hcall;
  56. /* Virtual clock device */
  57. struct hrtimer hrt;
  58. /* Did the Guest tell us to halt? */
  59. int halted;
  60. /* Pending virtual interrupts */
  61. DECLARE_BITMAP(irqs_pending, LGUEST_IRQS);
  /* Architecture-specific per-cpu state; the type is not defined in this header. */
  62. struct lg_cpu_arch arch;
  63. };
  64. /* The private info the thread maintains about the guest. */
  65. struct lguest {
  /* User-space (__user) pointer to the Guest's struct lguest_data. */
  66. struct lguest_data __user *lguest_data;
  /*
   * Per-cpu state, statically sized for NR_CPUS entries.
   * NOTE(review): nr_cpus is presumably the number of entries in use - confirm.
   */
  67. struct lg_cpu cpus[NR_CPUS];
  68. unsigned int nr_cpus;
  69. /* Valid guest memory pages must be < this. */
  70. u32 pfn_limit;
  71. /* Device memory is >= pfn_limit and < device_limit. */
  72. u32 device_limit;
  73. /*
  74. * This provides the offset to the base of guest-physical memory in the
  75. * Launcher.
  76. */
  77. void __user *mem_base;
  78. unsigned long kernel_address;
  /* Room for four tracked page directories; see struct pgdir. */
  79. struct pgdir pgdirs[4];
  80. unsigned long noirq_iret;
  /* NOTE(review): presumably the "pages" value handed to guest_set_stack() - confirm. */
  81. unsigned int stack_pages;
  82. u32 tsc_khz;
  83. /* Dead? */
  /*
   * NULL while the Guest is alive. kill_guest() stores either a kasprintf()'d
   * reason string or ERR_PTR(-ENOMEM) here, and never overwrites a value that
   * is already set.
   */
  84. const char *dead;
  85. };
  /*
   * NOTE(review): defined elsewhere; which lguest state this mutex protects is
   * not visible from this header.
   */
  86. extern struct mutex lguest_lock;
  87. /* core.c: */
  /*
   * Yes/no check of the range (addr, len) against the given Guest; the exact
   * rule lives in core.c.
   */
  88. bool lguest_address_ok(const struct lguest *lg,
  89. unsigned long addr, unsigned long len);
  /*
   * Raw copy helpers behind the lgread()/lgwrite() macros. As those macros use
   * them, the arguments are:
   *   __lgread(cpu, destination buffer, address, byte count)
   *   __lgwrite(cpu, address, source buffer, byte count)
   */
  90. void __lgread(struct lg_cpu *, void *, unsigned long, unsigned);
  91. void __lgwrite(struct lg_cpu *, unsigned long, const void *, unsigned);
  /* NOTE(review): presumably the pages backing the Switcher - confirm in core.c. */
  92. extern struct page **lg_switcher_pages;
  93. /*H:035
  94. * Using memory-copy operations like that is usually inconvenient, so we
  95. * have the following helper macros which read and write a specific type (often
  96. * an unsigned long).
  97. *
  98. * This reads into a variable of the given type then returns that.
  99. */
  /*
   * lgread(cpu, addr, type): declare a temporary of @type, let __lgread() fill
   * it from @addr, and yield the temporary as the value of the whole
   * (GNU statement) expression.
   */
  #define lgread(cpu, addr, type)                                     \
  ({                                                                  \
      type __lgread_val;                                              \
      __lgread((cpu), &__lgread_val, (addr), sizeof(__lgread_val));   \
      __lgread_val;                                                   \
  })
  /*
   * lgwrite(cpu, addr, type, val): typecheck() that @val has type @type, then
   * pass the address and size of @val to __lgwrite() for @addr. @val has to be
   * an lvalue because its address is taken.
   */
  #define lgwrite(cpu, addr, type, val)                               \
  do {                                                                \
      typecheck(type, val);                                           \
      __lgwrite((cpu), (addr), &(val), sizeof(val));                  \
  } while (0)
  108. /* (end of memory access helper routines) :*/
  /*
   * Entry point for running the Guest on @cpu (per its name; the definition is
   * not in this header). @user is a user-space pointer (__user).
   * NOTE(review): the meaning of the int result and of what is stored through
   * @user must be taken from the definition - confirm there.
   */
  109. int run_guest(struct lg_cpu *cpu, unsigned long __user *user);
  /*
   * Split a page-directory (pgd) or page-middle-directory (pmd) entry in two:
   *
   *   *_flags(x): the bits of the entry that lie outside PAGE_MASK
   *               (the "first 12 bits").
   *   *_pfn(x):   the entry shifted right by PAGE_SHIFT
   *               (the "last 20 bits").
   *
   * This is only the first step in the migration to the kernel types; pte_pfn
   * is already defined in the kernel.
   */
  #define pgd_flags(x)    (pgd_val(x) & ~PAGE_MASK)
  #define pgd_pfn(x)      (pgd_val(x) >> PAGE_SHIFT)
  #define pmd_flags(x)    (pmd_val(x) & ~PAGE_MASK)
  #define pmd_pfn(x)      (pmd_val(x) >> PAGE_SHIFT)
  119. /* interrupts_and_traps.c: */
  /*
   * Declarations only; the definitions are in interrupts_and_traps.c.
   * NOTE(review): interrupt_pending() returns an unsigned int and takes a
   * bool out-parameter @more; try_deliver_interrupt() takes an irq number and
   * a bool @more, so the two look designed to be used as a pair - confirm.
   */
  120. unsigned int interrupt_pending(struct lg_cpu *cpu, bool *more);
  121. void try_deliver_interrupt(struct lg_cpu *cpu, unsigned int irq, bool more);
  122. void set_interrupt(struct lg_cpu *cpu, unsigned int irq);
  123. bool deliver_trap(struct lg_cpu *cpu, unsigned int num);
  /* @low and @hi are the two 32-bit halves of IDT entry @i. */
  124. void load_guest_idt_entry(struct lg_cpu *cpu, unsigned int i,
  125. u32 low, u32 hi);
  /*
   * NOTE(review): presumably records seg/esp/pages in lg_cpu.ss1, lg_cpu.esp1
   * and lguest.stack_pages - confirm.
   */
  126. void guest_set_stack(struct lg_cpu *cpu, u32 seg, u32 esp, unsigned int pages);
  127. void pin_stack_pages(struct lg_cpu *cpu);
  /* @def is read-only (const) in both of the following. */
  128. void setup_default_idt_entries(struct lguest_ro_state *state,
  129. const unsigned long *def);
  130. void copy_traps(const struct lg_cpu *cpu, struct desc_struct *idt,
  131. const unsigned long *def);
  132. void guest_set_clockevent(struct lg_cpu *cpu, unsigned long delta);
  133. bool send_notify_to_eventfd(struct lg_cpu *cpu);
  134. void init_clockdev(struct lg_cpu *cpu);
  135. bool check_syscall_vector(struct lguest *lg);
  136. bool could_be_syscall(unsigned int num);
  /* Module-wide setup/teardown pair; init_interrupts() reports a result as int. */
  137. int init_interrupts(void);
  138. void free_interrupts(void);
  139. /* segments.c: */
  /* Declarations only; the definitions are in segments.c. */
  140. void setup_default_gdt_entries(struct lguest_ro_state *state);
  141. void setup_guest_gdt(struct lg_cpu *cpu);
  /* @low and @hi are the two 32-bit halves of GDT entry @i. */
  142. void load_guest_gdt_entry(struct lg_cpu *cpu, unsigned int i,
  143. u32 low, u32 hi);
  /* NOTE(review): @tls_array is presumably a Guest address - confirm in segments.c. */
  144. void guest_load_tls(struct lg_cpu *cpu, unsigned long tls_array);
  /*
   * Both copy helpers take the cpu as const and write into @gdt.
   * NOTE(review): copy_gdt_tls() presumably copies only the TLS entries
   * (cf. CHANGED_GDT_TLS) - confirm.
   */
  145. void copy_gdt(const struct lg_cpu *cpu, struct desc_struct *gdt);
  146. void copy_gdt_tls(const struct lg_cpu *cpu, struct desc_struct *gdt);
  147. /* page_tables.c: */
  /* Declarations only; the definitions are in page_tables.c. */
  /* Per-Guest setup/teardown pair; init reports a result as int. */
  148. int init_guest_pagetable(struct lguest *lg);
  149. void free_guest_pagetable(struct lguest *lg);
  150. void guest_new_pagetable(struct lg_cpu *cpu, unsigned long pgtable);
  151. void guest_set_pgd(struct lguest *lg, unsigned long gpgdir, u32 i);
  /* guest_set_pmd() is only declared when the kernel is built with CONFIG_X86_PAE. */
  152. #ifdef CONFIG_X86_PAE
  153. void guest_set_pmd(struct lguest *lg, unsigned long gpgdir, u32 i);
  154. #endif
  155. void guest_pagetable_clear_all(struct lg_cpu *cpu);
  156. void guest_pagetable_flush_user(struct lg_cpu *cpu);
  157. void guest_set_pte(struct lg_cpu *cpu, unsigned long gpgdir,
  158. unsigned long vaddr, pte_t val);
  159. void map_switcher_in_guest(struct lg_cpu *cpu, struct lguest_pages *pages);
  /*
   * NOTE(review): @cr2 and @errcode look like the faulting address and the
   * page-fault error code, and @iomem an out-parameter - confirm the contract
   * of the bool result in page_tables.c.
   */
  160. bool demand_page(struct lg_cpu *cpu, unsigned long cr2, int errcode,
  161. unsigned long *iomem);
  162. void pin_page(struct lg_cpu *cpu, unsigned long vaddr);
  /*
   * Two address-translation entry points for @vaddr: __guest_pa() reports a
   * bool and stores through @paddr, guest_pa() returns an unsigned long.
   * NOTE(review): failure behaviour of guest_pa() is not visible here.
   */
  163. bool __guest_pa(struct lg_cpu *cpu, unsigned long vaddr, unsigned long *paddr);
  164. unsigned long guest_pa(struct lg_cpu *cpu, unsigned long vaddr);
  165. void page_table_guest_data_init(struct lg_cpu *cpu);
  166. /* <arch>/core.c: */
  /* Architecture hooks; declarations only. Host-wide init/fini pair first. */
  167. void lguest_arch_host_init(void);
  168. void lguest_arch_host_fini(void);
  169. void lguest_arch_run_guest(struct lg_cpu *cpu);
  170. void lguest_arch_handle_trap(struct lg_cpu *cpu);
  /* Both hypercall hooks report a result as int. */
  171. int lguest_arch_init_hypercalls(struct lg_cpu *cpu);
  172. int lguest_arch_do_hcall(struct lg_cpu *cpu, struct hcall_args *args);
  173. void lguest_arch_setup_regs(struct lg_cpu *cpu, unsigned long start);
  /*
   * Returns a pointer to an unsigned long for the register at byte offset
   * @reg_off. NOTE(review): the meaning of @any and whether NULL can be
   * returned must be checked in the arch code.
   */
  174. unsigned long *lguest_arch_regptr(struct lg_cpu *cpu, size_t reg_off, bool any);
  175. /* <arch>/switcher.S: */
  /* Symbols provided by the assembly file, declared here as char arrays. */
  176. extern char start_switcher_text[], end_switcher_text[], switch_to_guest[];
  177. /* lguest_user.c: */
  /* Device registration/removal pair; init reports a result as int. */
  178. int lguest_device_init(void);
  179. void lguest_device_remove(void);
  180. /* hypercalls.c: */
  /*
   * NOTE(review): do_hypercalls() presumably services the request recorded in
   * cpu->hcall - confirm in hypercalls.c.
   */
  181. void do_hypercalls(struct lg_cpu *cpu);
  182. void write_timestamp(struct lg_cpu *cpu);
  183. /*L:035
  184. * Let's step aside for the moment, to study one important routine that's used
  185. * widely in the Host code.
  186. *
  187. * There are many cases where the Guest can do something invalid, like pass crap
  188. * to a hypercall. Since only the Guest kernel can make hypercalls, it's quite
  189. * acceptable to simply terminate the Guest and give the Launcher a nicely
  190. * formatted reason. It's also simpler for the Guest itself, which doesn't
  191. * need to check most hypercalls for "success"; if you're still running, it
  192. * succeeded.
  193. *
  194. * Once this is called, the Guest will never run again, so most Host code can
  195. * call this then continue as if nothing had happened. This means many
  196. * functions don't have to explicitly return an error code, which keeps the
  197. * code simple.
  198. *
  199. * It also means that this can be called more than once: only the first one is
  200. * remembered. The only trick is that we still need to kill the Guest even if
  201. * we can't allocate memory to store the reason. Linux has a neat way of
  202. * packing error codes into invalid pointers, so we use that here.
  203. *
  204. * Like any macro which uses an "if", it is safely wrapped in a run-once "do {
  205. * } while(0)".
  206. */
  /*
   * kill_guest(cpu, fmt, ...): mark the Guest that owns @cpu as dead.
   *
   * Only the first call records a reason: if lg->dead is already set, nothing
   * happens. The reason is formatted with kasprintf(GFP_ATOMIC, ...); if that
   * allocation fails, ERR_PTR(-ENOMEM) is stored instead, so lg->dead is
   * non-NULL either way.
   *
   * @cpu is evaluated exactly once (the owning struct lguest is cached in a
   * local), so an argument expression with side effects is safe.
   */
  #define kill_guest(cpu, fmt...)                                     \
  do {                                                                \
      struct lguest *__kg_lg = (cpu)->lg;                             \
                                                                      \
      if (!__kg_lg->dead) {                                           \
          __kg_lg->dead = kasprintf(GFP_ATOMIC, fmt);                 \
          if (!__kg_lg->dead)                                         \
              __kg_lg->dead = ERR_PTR(-ENOMEM);                       \
      }                                                               \
  } while (0)
  215. /* (End of aside) :*/
  216. #endif /* __ASSEMBLY__ */
  217. #endif /* _LGUEST_H */