#ifndef _ASM_X86_PARAVIRT_H
#define _ASM_X86_PARAVIRT_H
/* Various instructions on x86 need to be replaced for
 * para-virtualization: those hooks are defined here. */

#ifdef CONFIG_PARAVIRT
#include <asm/pgtable_types.h>
#include <asm/asm.h>

#include <asm/paravirt_types.h>

#ifndef __ASSEMBLY__
#include <linux/bug.h>
#include <linux/types.h>
#include <linux/cpumask.h>
static inline int paravirt_enabled(void)
{
	return pv_info.paravirt_enabled;
}
static inline void load_sp0(struct tss_struct *tss,
			    struct thread_struct *thread)
{
	PVOP_VCALL2(pv_cpu_ops.load_sp0, tss, thread);
}
/* The paravirtualized CPUID instruction. */
static inline void __cpuid(unsigned int *eax, unsigned int *ebx,
			   unsigned int *ecx, unsigned int *edx)
{
	PVOP_VCALL4(pv_cpu_ops.cpuid, eax, ebx, ecx, edx);
}
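
/*
 * Example (illustrative sketch, not part of this header): callers normally go
 * through the cpuid() helpers in <asm/processor.h>, which seed the input
 * registers and then invoke __cpuid(), roughly like this for leaf 1:
 *
 *	unsigned int eax = 1, ebx = 0, ecx = 0, edx = 0;
 *	__cpuid(&eax, &ebx, &ecx, &edx);
 */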
/*
 * These special macros can be used to get or set a debugging register
 */
static inline unsigned long paravirt_get_debugreg(int reg)
{
	return PVOP_CALL1(unsigned long, pv_cpu_ops.get_debugreg, reg);
}
#define get_debugreg(var, reg) var = paravirt_get_debugreg(reg)
static inline void set_debugreg(unsigned long val, int reg)
{
	PVOP_VCALL2(pv_cpu_ops.set_debugreg, reg, val);
}
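
/*
 * Example (sketch, not part of this header): reading and rewriting %db7
 * through the wrappers above; under paravirt these dispatch to
 * pv_cpu_ops.get_debugreg/set_debugreg instead of raw DR accesses:
 *
 *	unsigned long dr7;
 *	get_debugreg(dr7, 7);
 *	set_debugreg(dr7 & ~0xffUL, 7);
 */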
static inline void clts(void)
{
	PVOP_VCALL0(pv_cpu_ops.clts);
}
static inline unsigned long read_cr0(void)
{
	return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr0);
}

static inline void write_cr0(unsigned long x)
{
	PVOP_VCALL1(pv_cpu_ops.write_cr0, x);
}

static inline unsigned long read_cr2(void)
{
	return PVOP_CALL0(unsigned long, pv_mmu_ops.read_cr2);
}

static inline void write_cr2(unsigned long x)
{
	PVOP_VCALL1(pv_mmu_ops.write_cr2, x);
}

static inline unsigned long read_cr3(void)
{
	return PVOP_CALL0(unsigned long, pv_mmu_ops.read_cr3);
}

static inline void write_cr3(unsigned long x)
{
	PVOP_VCALL1(pv_mmu_ops.write_cr3, x);
}

static inline unsigned long read_cr4(void)
{
	return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr4);
}
static inline unsigned long read_cr4_safe(void)
{
	return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr4_safe);
}

static inline void write_cr4(unsigned long x)
{
	PVOP_VCALL1(pv_cpu_ops.write_cr4, x);
}
#ifdef CONFIG_X86_64
static inline unsigned long read_cr8(void)
{
	return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr8);
}

static inline void write_cr8(unsigned long x)
{
	PVOP_VCALL1(pv_cpu_ops.write_cr8, x);
}
#endif
static inline void arch_safe_halt(void)
{
	PVOP_VCALL0(pv_irq_ops.safe_halt);
}

static inline void halt(void)
{
	PVOP_VCALL0(pv_irq_ops.halt);
}

static inline void wbinvd(void)
{
	PVOP_VCALL0(pv_cpu_ops.wbinvd);
}

#define get_kernel_rpl()  (pv_info.kernel_rpl)
static inline u64 paravirt_read_msr(unsigned msr, int *err)
{
	return PVOP_CALL2(u64, pv_cpu_ops.read_msr, msr, err);
}

static inline int paravirt_write_msr(unsigned msr, unsigned low, unsigned high)
{
	return PVOP_CALL3(int, pv_cpu_ops.write_msr, msr, low, high);
}
/* These should all do BUG_ON(_err), but our headers are too tangled. */
#define rdmsr(msr, val1, val2)			\
do {						\
	int _err;				\
	u64 _l = paravirt_read_msr(msr, &_err);	\
	val1 = (u32)_l;				\
	val2 = _l >> 32;			\
} while (0)

#define wrmsr(msr, val1, val2)			\
do {						\
	paravirt_write_msr(msr, val1, val2);	\
} while (0)

#define rdmsrl(msr, val)			\
do {						\
	int _err;				\
	val = paravirt_read_msr(msr, &_err);	\
} while (0)

#define wrmsrl(msr, val)	wrmsr(msr, (u32)((u64)(val)), ((u64)(val))>>32)
#define wrmsr_safe(msr, a, b)	paravirt_write_msr(msr, a, b)

/* rdmsr with exception handling */
#define rdmsr_safe(msr, a, b)			\
({						\
	int _err;				\
	u64 _l = paravirt_read_msr(msr, &_err);	\
	(*a) = (u32)_l;				\
	(*b) = _l >> 32;			\
	_err;					\
})
static inline int rdmsrl_safe(unsigned msr, unsigned long long *p)
{
	int err;

	*p = paravirt_read_msr(msr, &err);
	return err;
}
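
/*
 * Example (sketch): the _safe variants report the exception status instead
 * of faulting, so a caller can probe an MSR that may not be implemented.
 * "msr_nr" below is a hypothetical MSR index, not defined in this header:
 *
 *	u64 val;
 *	if (!rdmsrl_safe(msr_nr, &val))
 *		wrmsrl(msr_nr, val | 1);
 */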
static inline u64 paravirt_read_tsc(void)
{
	return PVOP_CALL0(u64, pv_cpu_ops.read_tsc);
}

#define rdtscl(low)				\
do {						\
	u64 _l = paravirt_read_tsc();		\
	low = (int)_l;				\
} while (0)

#define rdtscll(val) (val = paravirt_read_tsc())
static inline unsigned long long paravirt_sched_clock(void)
{
	return PVOP_CALL0(unsigned long long, pv_time_ops.sched_clock);
}

extern struct static_key paravirt_steal_enabled;
extern struct static_key paravirt_steal_rq_enabled;

static inline u64 paravirt_steal_clock(int cpu)
{
	return PVOP_CALL1(u64, pv_time_ops.steal_clock, cpu);
}
static inline unsigned long long paravirt_read_pmc(int counter)
{
	return PVOP_CALL1(u64, pv_cpu_ops.read_pmc, counter);
}

#define rdpmc(counter, low, high)		\
do {						\
	u64 _l = paravirt_read_pmc(counter);	\
	low = (u32)_l;				\
	high = _l >> 32;			\
} while (0)

#define rdpmcl(counter, val) ((val) = paravirt_read_pmc(counter))
static inline unsigned long long paravirt_rdtscp(unsigned int *aux)
{
	return PVOP_CALL1(u64, pv_cpu_ops.read_tscp, aux);
}

#define rdtscp(low, high, aux)				\
do {							\
	unsigned int __aux;				\
	unsigned long __val = paravirt_rdtscp(&__aux);	\
	(low) = (u32)__val;				\
	(high) = (u32)(__val >> 32);			\
	(aux) = __aux;					\
} while (0)

#define rdtscpll(val, aux)				\
do {							\
	unsigned int __aux;				\
	val = paravirt_rdtscp(&__aux);			\
	(aux) = __aux;					\
} while (0)
static inline void paravirt_alloc_ldt(struct desc_struct *ldt, unsigned entries)
{
	PVOP_VCALL2(pv_cpu_ops.alloc_ldt, ldt, entries);
}

static inline void paravirt_free_ldt(struct desc_struct *ldt, unsigned entries)
{
	PVOP_VCALL2(pv_cpu_ops.free_ldt, ldt, entries);
}

static inline void load_TR_desc(void)
{
	PVOP_VCALL0(pv_cpu_ops.load_tr_desc);
}
static inline void load_gdt(const struct desc_ptr *dtr)
{
	PVOP_VCALL1(pv_cpu_ops.load_gdt, dtr);
}
static inline void load_idt(const struct desc_ptr *dtr)
{
	PVOP_VCALL1(pv_cpu_ops.load_idt, dtr);
}
static inline void set_ldt(const void *addr, unsigned entries)
{
	PVOP_VCALL2(pv_cpu_ops.set_ldt, addr, entries);
}
static inline void store_idt(struct desc_ptr *dtr)
{
	PVOP_VCALL1(pv_cpu_ops.store_idt, dtr);
}
static inline unsigned long paravirt_store_tr(void)
{
	return PVOP_CALL0(unsigned long, pv_cpu_ops.store_tr);
}
#define store_tr(tr)	((tr) = paravirt_store_tr())
static inline void load_TLS(struct thread_struct *t, unsigned cpu)
{
	PVOP_VCALL2(pv_cpu_ops.load_tls, t, cpu);
}

#ifdef CONFIG_X86_64
static inline void load_gs_index(unsigned int gs)
{
	PVOP_VCALL1(pv_cpu_ops.load_gs_index, gs);
}
#endif
static inline void write_ldt_entry(struct desc_struct *dt, int entry,
				   const void *desc)
{
	PVOP_VCALL3(pv_cpu_ops.write_ldt_entry, dt, entry, desc);
}
static inline void write_gdt_entry(struct desc_struct *dt, int entry,
				   void *desc, int type)
{
	PVOP_VCALL4(pv_cpu_ops.write_gdt_entry, dt, entry, desc, type);
}

static inline void write_idt_entry(gate_desc *dt, int entry, const gate_desc *g)
{
	PVOP_VCALL3(pv_cpu_ops.write_idt_entry, dt, entry, g);
}

static inline void set_iopl_mask(unsigned mask)
{
	PVOP_VCALL1(pv_cpu_ops.set_iopl_mask, mask);
}
/* The paravirtualized I/O functions */
static inline void slow_down_io(void)
{
	pv_cpu_ops.io_delay();
#ifdef REALLY_SLOW_IO
	pv_cpu_ops.io_delay();
	pv_cpu_ops.io_delay();
	pv_cpu_ops.io_delay();
#endif
}
#ifdef CONFIG_SMP
static inline void startup_ipi_hook(int phys_apicid, unsigned long start_eip,
				    unsigned long start_esp)
{
	PVOP_VCALL3(pv_apic_ops.startup_ipi_hook,
		    phys_apicid, start_eip, start_esp);
}
#endif
static inline void paravirt_activate_mm(struct mm_struct *prev,
					struct mm_struct *next)
{
	PVOP_VCALL2(pv_mmu_ops.activate_mm, prev, next);
}

static inline void arch_dup_mmap(struct mm_struct *oldmm,
				 struct mm_struct *mm)
{
	PVOP_VCALL2(pv_mmu_ops.dup_mmap, oldmm, mm);
}

static inline void arch_exit_mmap(struct mm_struct *mm)
{
	PVOP_VCALL1(pv_mmu_ops.exit_mmap, mm);
}

static inline void __flush_tlb(void)
{
	PVOP_VCALL0(pv_mmu_ops.flush_tlb_user);
}
static inline void __flush_tlb_global(void)
{
	PVOP_VCALL0(pv_mmu_ops.flush_tlb_kernel);
}
static inline void __flush_tlb_single(unsigned long addr)
{
	PVOP_VCALL1(pv_mmu_ops.flush_tlb_single, addr);
}
static inline void flush_tlb_others(const struct cpumask *cpumask,
				    struct mm_struct *mm,
				    unsigned long start,
				    unsigned long end)
{
	PVOP_VCALL4(pv_mmu_ops.flush_tlb_others, cpumask, mm, start, end);
}
static inline int paravirt_pgd_alloc(struct mm_struct *mm)
{
	return PVOP_CALL1(int, pv_mmu_ops.pgd_alloc, mm);
}

static inline void paravirt_pgd_free(struct mm_struct *mm, pgd_t *pgd)
{
	PVOP_VCALL2(pv_mmu_ops.pgd_free, mm, pgd);
}

static inline void paravirt_alloc_pte(struct mm_struct *mm, unsigned long pfn)
{
	PVOP_VCALL2(pv_mmu_ops.alloc_pte, mm, pfn);
}
static inline void paravirt_release_pte(unsigned long pfn)
{
	PVOP_VCALL1(pv_mmu_ops.release_pte, pfn);
}

static inline void paravirt_alloc_pmd(struct mm_struct *mm, unsigned long pfn)
{
	PVOP_VCALL2(pv_mmu_ops.alloc_pmd, mm, pfn);
}

static inline void paravirt_release_pmd(unsigned long pfn)
{
	PVOP_VCALL1(pv_mmu_ops.release_pmd, pfn);
}

static inline void paravirt_alloc_pud(struct mm_struct *mm, unsigned long pfn)
{
	PVOP_VCALL2(pv_mmu_ops.alloc_pud, mm, pfn);
}
static inline void paravirt_release_pud(unsigned long pfn)
{
	PVOP_VCALL1(pv_mmu_ops.release_pud, pfn);
}
static inline void pte_update(struct mm_struct *mm, unsigned long addr,
			      pte_t *ptep)
{
	PVOP_VCALL3(pv_mmu_ops.pte_update, mm, addr, ptep);
}

static inline void pmd_update(struct mm_struct *mm, unsigned long addr,
			      pmd_t *pmdp)
{
	PVOP_VCALL3(pv_mmu_ops.pmd_update, mm, addr, pmdp);
}

static inline void pte_update_defer(struct mm_struct *mm, unsigned long addr,
				    pte_t *ptep)
{
	PVOP_VCALL3(pv_mmu_ops.pte_update_defer, mm, addr, ptep);
}

static inline void pmd_update_defer(struct mm_struct *mm, unsigned long addr,
				    pmd_t *pmdp)
{
	PVOP_VCALL3(pv_mmu_ops.pmd_update_defer, mm, addr, pmdp);
}
static inline pte_t __pte(pteval_t val)
{
	pteval_t ret;

	if (sizeof(pteval_t) > sizeof(long))
		ret = PVOP_CALLEE2(pteval_t,
				   pv_mmu_ops.make_pte,
				   val, (u64)val >> 32);
	else
		ret = PVOP_CALLEE1(pteval_t,
				   pv_mmu_ops.make_pte,
				   val);

	return (pte_t) { .pte = ret };
}
static inline pteval_t pte_val(pte_t pte)
{
	pteval_t ret;

	if (sizeof(pteval_t) > sizeof(long))
		ret = PVOP_CALLEE2(pteval_t, pv_mmu_ops.pte_val,
				   pte.pte, (u64)pte.pte >> 32);
	else
		ret = PVOP_CALLEE1(pteval_t, pv_mmu_ops.pte_val,
				   pte.pte);

	return ret;
}
static inline pgd_t __pgd(pgdval_t val)
{
	pgdval_t ret;

	if (sizeof(pgdval_t) > sizeof(long))
		ret = PVOP_CALLEE2(pgdval_t, pv_mmu_ops.make_pgd,
				   val, (u64)val >> 32);
	else
		ret = PVOP_CALLEE1(pgdval_t, pv_mmu_ops.make_pgd,
				   val);

	return (pgd_t) { ret };
}
static inline pgdval_t pgd_val(pgd_t pgd)
{
	pgdval_t ret;

	if (sizeof(pgdval_t) > sizeof(long))
		ret = PVOP_CALLEE2(pgdval_t, pv_mmu_ops.pgd_val,
				   pgd.pgd, (u64)pgd.pgd >> 32);
	else
		ret = PVOP_CALLEE1(pgdval_t, pv_mmu_ops.pgd_val,
				   pgd.pgd);

	return ret;
}
#define  __HAVE_ARCH_PTEP_MODIFY_PROT_TRANSACTION
static inline pte_t ptep_modify_prot_start(struct mm_struct *mm, unsigned long addr,
					   pte_t *ptep)
{
	pteval_t ret;

	ret = PVOP_CALL3(pteval_t, pv_mmu_ops.ptep_modify_prot_start,
			 mm, addr, ptep);

	return (pte_t) { .pte = ret };
}
static inline void ptep_modify_prot_commit(struct mm_struct *mm, unsigned long addr,
					   pte_t *ptep, pte_t pte)
{
	if (sizeof(pteval_t) > sizeof(long))
		/* 5 arg words */
		pv_mmu_ops.ptep_modify_prot_commit(mm, addr, ptep, pte);
	else
		PVOP_VCALL4(pv_mmu_ops.ptep_modify_prot_commit,
			    mm, addr, ptep, pte.pte);
}
static inline void set_pte(pte_t *ptep, pte_t pte)
{
	if (sizeof(pteval_t) > sizeof(long))
		PVOP_VCALL3(pv_mmu_ops.set_pte, ptep,
			    pte.pte, (u64)pte.pte >> 32);
	else
		PVOP_VCALL2(pv_mmu_ops.set_pte, ptep,
			    pte.pte);
}
static inline void set_pte_at(struct mm_struct *mm, unsigned long addr,
			      pte_t *ptep, pte_t pte)
{
	if (sizeof(pteval_t) > sizeof(long))
		/* 5 arg words */
		pv_mmu_ops.set_pte_at(mm, addr, ptep, pte);
	else
		PVOP_VCALL4(pv_mmu_ops.set_pte_at, mm, addr, ptep, pte.pte);
}
#ifdef CONFIG_TRANSPARENT_HUGEPAGE
static inline void set_pmd_at(struct mm_struct *mm, unsigned long addr,
			      pmd_t *pmdp, pmd_t pmd)
{
	if (sizeof(pmdval_t) > sizeof(long))
		/* 5 arg words */
		pv_mmu_ops.set_pmd_at(mm, addr, pmdp, pmd);
	else
		PVOP_VCALL4(pv_mmu_ops.set_pmd_at, mm, addr, pmdp,
			    native_pmd_val(pmd));
}
#endif
static inline void set_pmd(pmd_t *pmdp, pmd_t pmd)
{
	pmdval_t val = native_pmd_val(pmd);

	if (sizeof(pmdval_t) > sizeof(long))
		PVOP_VCALL3(pv_mmu_ops.set_pmd, pmdp, val, (u64)val >> 32);
	else
		PVOP_VCALL2(pv_mmu_ops.set_pmd, pmdp, val);
}
#if PAGETABLE_LEVELS >= 3
static inline pmd_t __pmd(pmdval_t val)
{
	pmdval_t ret;

	if (sizeof(pmdval_t) > sizeof(long))
		ret = PVOP_CALLEE2(pmdval_t, pv_mmu_ops.make_pmd,
				   val, (u64)val >> 32);
	else
		ret = PVOP_CALLEE1(pmdval_t, pv_mmu_ops.make_pmd,
				   val);

	return (pmd_t) { ret };
}
static inline pmdval_t pmd_val(pmd_t pmd)
{
	pmdval_t ret;

	if (sizeof(pmdval_t) > sizeof(long))
		ret = PVOP_CALLEE2(pmdval_t, pv_mmu_ops.pmd_val,
				   pmd.pmd, (u64)pmd.pmd >> 32);
	else
		ret = PVOP_CALLEE1(pmdval_t, pv_mmu_ops.pmd_val,
				   pmd.pmd);

	return ret;
}
static inline void set_pud(pud_t *pudp, pud_t pud)
{
	pudval_t val = native_pud_val(pud);

	if (sizeof(pudval_t) > sizeof(long))
		PVOP_VCALL3(pv_mmu_ops.set_pud, pudp,
			    val, (u64)val >> 32);
	else
		PVOP_VCALL2(pv_mmu_ops.set_pud, pudp,
			    val);
}
#if PAGETABLE_LEVELS == 4
static inline pud_t __pud(pudval_t val)
{
	pudval_t ret;

	if (sizeof(pudval_t) > sizeof(long))
		ret = PVOP_CALLEE2(pudval_t, pv_mmu_ops.make_pud,
				   val, (u64)val >> 32);
	else
		ret = PVOP_CALLEE1(pudval_t, pv_mmu_ops.make_pud,
				   val);

	return (pud_t) { ret };
}
static inline pudval_t pud_val(pud_t pud)
{
	pudval_t ret;

	if (sizeof(pudval_t) > sizeof(long))
		ret = PVOP_CALLEE2(pudval_t, pv_mmu_ops.pud_val,
				   pud.pud, (u64)pud.pud >> 32);
	else
		ret = PVOP_CALLEE1(pudval_t, pv_mmu_ops.pud_val,
				   pud.pud);

	return ret;
}
static inline void set_pgd(pgd_t *pgdp, pgd_t pgd)
{
	pgdval_t val = native_pgd_val(pgd);

	if (sizeof(pgdval_t) > sizeof(long))
		PVOP_VCALL3(pv_mmu_ops.set_pgd, pgdp,
			    val, (u64)val >> 32);
	else
		PVOP_VCALL2(pv_mmu_ops.set_pgd, pgdp,
			    val);
}
static inline void pgd_clear(pgd_t *pgdp)
{
	set_pgd(pgdp, __pgd(0));
}

static inline void pud_clear(pud_t *pudp)
{
	set_pud(pudp, __pud(0));
}

#endif	/* PAGETABLE_LEVELS == 4 */

#endif	/* PAGETABLE_LEVELS >= 3 */
#ifdef CONFIG_X86_PAE
/* Special-case pte-setting operations for PAE, which can't update a
   64-bit pte atomically */
static inline void set_pte_atomic(pte_t *ptep, pte_t pte)
{
	PVOP_VCALL3(pv_mmu_ops.set_pte_atomic, ptep,
		    pte.pte, pte.pte >> 32);
}

static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
			     pte_t *ptep)
{
	PVOP_VCALL3(pv_mmu_ops.pte_clear, mm, addr, ptep);
}

static inline void pmd_clear(pmd_t *pmdp)
{
	PVOP_VCALL1(pv_mmu_ops.pmd_clear, pmdp);
}
#else  /* !CONFIG_X86_PAE */
static inline void set_pte_atomic(pte_t *ptep, pte_t pte)
{
	set_pte(ptep, pte);
}

static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
			     pte_t *ptep)
{
	set_pte_at(mm, addr, ptep, __pte(0));
}

static inline void pmd_clear(pmd_t *pmdp)
{
	set_pmd(pmdp, __pmd(0));
}
#endif	/* CONFIG_X86_PAE */
#define  __HAVE_ARCH_START_CONTEXT_SWITCH
static inline void arch_start_context_switch(struct task_struct *prev)
{
	PVOP_VCALL1(pv_cpu_ops.start_context_switch, prev);
}

static inline void arch_end_context_switch(struct task_struct *next)
{
	PVOP_VCALL1(pv_cpu_ops.end_context_switch, next);
}
#define  __HAVE_ARCH_ENTER_LAZY_MMU_MODE
static inline void arch_enter_lazy_mmu_mode(void)
{
	PVOP_VCALL0(pv_mmu_ops.lazy_mode.enter);
}

static inline void arch_leave_lazy_mmu_mode(void)
{
	PVOP_VCALL0(pv_mmu_ops.lazy_mode.leave);
}

static inline void arch_flush_lazy_mmu_mode(void)
{
	PVOP_VCALL0(pv_mmu_ops.lazy_mode.flush);
}
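
/*
 * Example (sketch): batching a run of page-table updates so a hypervisor
 * backend can coalesce them; on native hardware the lazy-mode hooks are
 * no-ops. nr, addr, ptep and pte below are assumed to be set up by the
 * caller:
 *
 *	arch_enter_lazy_mmu_mode();
 *	for (i = 0; i < nr; i++)
 *		set_pte_at(mm, addr + i * PAGE_SIZE, ptep + i, pte);
 *	arch_leave_lazy_mmu_mode();
 */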
static inline void __set_fixmap(unsigned /* enum fixed_addresses */ idx,
				phys_addr_t phys, pgprot_t flags)
{
	pv_mmu_ops.set_fixmap(idx, phys, flags);
}
#if defined(CONFIG_SMP) && defined(CONFIG_PARAVIRT_SPINLOCKS)

static inline int arch_spin_is_locked(struct arch_spinlock *lock)
{
	return PVOP_CALL1(int, pv_lock_ops.spin_is_locked, lock);
}

static inline int arch_spin_is_contended(struct arch_spinlock *lock)
{
	return PVOP_CALL1(int, pv_lock_ops.spin_is_contended, lock);
}
#define arch_spin_is_contended	arch_spin_is_contended

static __always_inline void arch_spin_lock(struct arch_spinlock *lock)
{
	PVOP_VCALL1(pv_lock_ops.spin_lock, lock);
}

static __always_inline void arch_spin_lock_flags(struct arch_spinlock *lock,
						  unsigned long flags)
{
	PVOP_VCALL2(pv_lock_ops.spin_lock_flags, lock, flags);
}

static __always_inline int arch_spin_trylock(struct arch_spinlock *lock)
{
	return PVOP_CALL1(int, pv_lock_ops.spin_trylock, lock);
}

static __always_inline void arch_spin_unlock(struct arch_spinlock *lock)
{
	PVOP_VCALL1(pv_lock_ops.spin_unlock, lock);
}

#endif
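
/*
 * Example (sketch): with CONFIG_PARAVIRT_SPINLOCKS a hypervisor backend can
 * point pv_lock_ops at its own implementations so contended CPUs yield to
 * the host rather than spin; the function names below are illustrative
 * only, not defined in this header:
 *
 *	pv_lock_ops.spin_lock = my_pv_spin_lock;
 *	pv_lock_ops.spin_unlock = my_pv_spin_unlock;
 */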
#ifdef CONFIG_X86_32
#define PV_SAVE_REGS "pushl %ecx; pushl %edx;"
#define PV_RESTORE_REGS "popl %edx; popl %ecx;"

/* save and restore all caller-save registers, except return value */
#define PV_SAVE_ALL_CALLER_REGS		"pushl %ecx;"
#define PV_RESTORE_ALL_CALLER_REGS	"popl  %ecx;"

#define PV_FLAGS_ARG "0"
#define PV_EXTRA_CLOBBERS
#define PV_VEXTRA_CLOBBERS
#else
/* save and restore all caller-save registers, except return value */
#define PV_SAVE_ALL_CALLER_REGS						\
	"push %rcx;"							\
	"push %rdx;"							\
	"push %rsi;"							\
	"push %rdi;"							\
	"push %r8;"							\
	"push %r9;"							\
	"push %r10;"							\
	"push %r11;"
#define PV_RESTORE_ALL_CALLER_REGS					\
	"pop %r11;"							\
	"pop %r10;"							\
	"pop %r9;"							\
	"pop %r8;"							\
	"pop %rdi;"							\
	"pop %rsi;"							\
	"pop %rdx;"							\
	"pop %rcx;"

/* Saving every register would be too much; clobber all caller-saved
 * registers except the argument register. */
#define PV_SAVE_REGS "pushq %%rdi;"
#define PV_RESTORE_REGS "popq %%rdi;"
#define PV_EXTRA_CLOBBERS EXTRA_CLOBBERS, "rcx" , "rdx", "rsi"
#define PV_VEXTRA_CLOBBERS EXTRA_CLOBBERS, "rdi", "rcx" , "rdx", "rsi"
#define PV_FLAGS_ARG "D"
#endif
/*
 * Generate a thunk around a function which saves all caller-save
 * registers except for the return value. This allows C functions to
 * be called from assembler code where fewer than normal registers are
 * available.  It may also help code generation around calls from C
 * code if the common case doesn't use many registers.
 *
 * When a callee is wrapped in a thunk, the caller can assume that all
 * arg regs and all scratch registers are preserved across the
 * call. The return value in rax/eax will not be saved, even for void
 * functions.
 */
#define PV_CALLEE_SAVE_REGS_THUNK(func)					\
	extern typeof(func) __raw_callee_save_##func;			\
	static void *__##func##__ __used = func;			\
									\
	asm(".pushsection .text;"					\
	    "__raw_callee_save_" #func ": "				\
	    PV_SAVE_ALL_CALLER_REGS					\
	    "call " #func ";"						\
	    PV_RESTORE_ALL_CALLER_REGS					\
	    "ret;"							\
	    ".popsection")

/* Get a reference to a callee-save function */
#define PV_CALLEE_SAVE(func)						\
	((struct paravirt_callee_save) { __raw_callee_save_##func })

/* Promise that "func" already uses the right calling convention */
#define __PV_IS_CALLEE_SAVE(func)			\
	((struct paravirt_callee_save) { func })
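
/*
 * Example (sketch): a backend wraps its irq-flag helper so the PVOP_CALLEE*
 * call sites only have to preserve the return register; the names below are
 * illustrative, not defined in this header:
 *
 *	static unsigned long my_save_fl(void);
 *	PV_CALLEE_SAVE_REGS_THUNK(my_save_fl);
 *	...
 *	pv_irq_ops.save_fl = PV_CALLEE_SAVE(my_save_fl);
 */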
static inline notrace unsigned long arch_local_save_flags(void)
{
	return PVOP_CALLEE0(unsigned long, pv_irq_ops.save_fl);
}

static inline notrace void arch_local_irq_restore(unsigned long f)
{
	PVOP_VCALLEE1(pv_irq_ops.restore_fl, f);
}

static inline notrace void arch_local_irq_disable(void)
{
	PVOP_VCALLEE0(pv_irq_ops.irq_disable);
}

static inline notrace void arch_local_irq_enable(void)
{
	PVOP_VCALLEE0(pv_irq_ops.irq_enable);
}

static inline notrace unsigned long arch_local_irq_save(void)
{
	unsigned long f;

	f = arch_local_save_flags();
	arch_local_irq_disable();
	return f;
}
/* Make sure as little as possible of this mess escapes. */

extern void default_banner(void);
#else	/* __ASSEMBLY__ */

#define _PVSITE(ptype, clobbers, ops, word, algn)	\
771:;				\
	ops;			\
772:;				\
	.pushsection .parainstructions,"a";	\
	 .align	algn;		\
	 word 771b;		\
	 .byte ptype;		\
	 .byte 772b-771b;	\
	 .short clobbers;	\
	.popsection
#define COND_PUSH(set, mask, reg)			\
	.if ((~(set)) & mask); push %reg; .endif
#define COND_POP(set, mask, reg)			\
	.if ((~(set)) & mask); pop %reg; .endif
#ifdef CONFIG_X86_64
#define PV_SAVE_REGS(set)			\
	COND_PUSH(set, CLBR_RAX, rax);		\
	COND_PUSH(set, CLBR_RCX, rcx);		\
	COND_PUSH(set, CLBR_RDX, rdx);		\
	COND_PUSH(set, CLBR_RSI, rsi);		\
	COND_PUSH(set, CLBR_RDI, rdi);		\
	COND_PUSH(set, CLBR_R8, r8);		\
	COND_PUSH(set, CLBR_R9, r9);		\
	COND_PUSH(set, CLBR_R10, r10);		\
	COND_PUSH(set, CLBR_R11, r11)
#define PV_RESTORE_REGS(set)			\
	COND_POP(set, CLBR_R11, r11);		\
	COND_POP(set, CLBR_R10, r10);		\
	COND_POP(set, CLBR_R9, r9);		\
	COND_POP(set, CLBR_R8, r8);		\
	COND_POP(set, CLBR_RDI, rdi);		\
	COND_POP(set, CLBR_RSI, rsi);		\
	COND_POP(set, CLBR_RDX, rdx);		\
	COND_POP(set, CLBR_RCX, rcx);		\
	COND_POP(set, CLBR_RAX, rax)

#define PARA_PATCH(struct, off)        ((PARAVIRT_PATCH_##struct + (off)) / 8)
#define PARA_SITE(ptype, clobbers, ops) _PVSITE(ptype, clobbers, ops, .quad, 8)
#define PARA_INDIRECT(addr)	*addr(%rip)
#else
#define PV_SAVE_REGS(set)			\
	COND_PUSH(set, CLBR_EAX, eax);		\
	COND_PUSH(set, CLBR_EDI, edi);		\
	COND_PUSH(set, CLBR_ECX, ecx);		\
	COND_PUSH(set, CLBR_EDX, edx)
#define PV_RESTORE_REGS(set)			\
	COND_POP(set, CLBR_EDX, edx);		\
	COND_POP(set, CLBR_ECX, ecx);		\
	COND_POP(set, CLBR_EDI, edi);		\
	COND_POP(set, CLBR_EAX, eax)

#define PARA_PATCH(struct, off)        ((PARAVIRT_PATCH_##struct + (off)) / 4)
#define PARA_SITE(ptype, clobbers, ops) _PVSITE(ptype, clobbers, ops, .long, 4)
#define PARA_INDIRECT(addr)	*%cs:addr
#endif
#define INTERRUPT_RETURN						\
	PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_iret), CLBR_NONE,	\
		  jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_iret))

#define DISABLE_INTERRUPTS(clobbers)					\
	PARA_SITE(PARA_PATCH(pv_irq_ops, PV_IRQ_irq_disable), clobbers, \
		  PV_SAVE_REGS(clobbers | CLBR_CALLEE_SAVE);		\
		  call PARA_INDIRECT(pv_irq_ops+PV_IRQ_irq_disable);	\
		  PV_RESTORE_REGS(clobbers | CLBR_CALLEE_SAVE);)

#define ENABLE_INTERRUPTS(clobbers)					\
	PARA_SITE(PARA_PATCH(pv_irq_ops, PV_IRQ_irq_enable), clobbers,	\
		  PV_SAVE_REGS(clobbers | CLBR_CALLEE_SAVE);		\
		  call PARA_INDIRECT(pv_irq_ops+PV_IRQ_irq_enable);	\
		  PV_RESTORE_REGS(clobbers | CLBR_CALLEE_SAVE);)
#define USERGS_SYSRET32							\
	PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_usergs_sysret32),	\
		  CLBR_NONE,						\
		  jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_usergs_sysret32))

#ifdef CONFIG_X86_32
#define GET_CR0_INTO_EAX				\
	push %ecx; push %edx;				\
	call PARA_INDIRECT(pv_cpu_ops+PV_CPU_read_cr0);	\
	pop %edx; pop %ecx

#define ENABLE_INTERRUPTS_SYSEXIT					\
	PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_irq_enable_sysexit),	\
		  CLBR_NONE,						\
		  jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_irq_enable_sysexit))
#else	/* !CONFIG_X86_32 */

/*
 * If swapgs is used while the userspace stack is still current,
 * there's no way to call a pvop.  The PV replacement *must* be
 * inlined, or the swapgs instruction must be trapped and emulated.
 */
#define SWAPGS_UNSAFE_STACK						\
	PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_swapgs), CLBR_NONE,	\
		  swapgs)

/*
 * Note: swapgs is very special, and in practise is either going to be
 * implemented with a single "swapgs" instruction or something very
 * special.  Either way, we don't need to save any registers for
 * it.
 */
#define SWAPGS								\
	PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_swapgs), CLBR_NONE,	\
		  call PARA_INDIRECT(pv_cpu_ops+PV_CPU_swapgs)		\
		 )

#define GET_CR2_INTO_RAX				\
	call PARA_INDIRECT(pv_mmu_ops+PV_MMU_read_cr2)

#define PARAVIRT_ADJUST_EXCEPTION_FRAME					\
	PARA_SITE(PARA_PATCH(pv_irq_ops, PV_IRQ_adjust_exception_frame), \
		  CLBR_NONE,						\
		  call PARA_INDIRECT(pv_irq_ops+PV_IRQ_adjust_exception_frame))

#define USERGS_SYSRET64							\
	PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_usergs_sysret64),	\
		  CLBR_NONE,						\
		  jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_usergs_sysret64))

#define ENABLE_INTERRUPTS_SYSEXIT32					\
	PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_irq_enable_sysexit),	\
		  CLBR_NONE,						\
		  jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_irq_enable_sysexit))
#endif	/* CONFIG_X86_32 */
#endif /* __ASSEMBLY__ */
#else  /* CONFIG_PARAVIRT */
# define default_banner x86_init_noop
#endif /* !CONFIG_PARAVIRT */
#endif /* _ASM_X86_PARAVIRT_H */