1 #ifndef _ASM_X86_DESC_H
2 #define _ASM_X86_DESC_H
4 #include <asm/desc_defs.h>
7 #include <asm/fixmap.h>
10 #include <linux/percpu.h>
12 static inline void fill_ldt(struct desc_struct
*desc
, const struct user_desc
*info
)
14 desc
->limit0
= info
->limit
& 0x0ffff;
16 desc
->base0
= (info
->base_addr
& 0x0000ffff);
17 desc
->base1
= (info
->base_addr
& 0x00ff0000) >> 16;
19 desc
->type
= (info
->read_exec_only
^ 1) << 1;
20 desc
->type
|= info
->contents
<< 2;
24 desc
->p
= info
->seg_not_present
^ 1;
25 desc
->limit
= (info
->limit
& 0xf0000) >> 16;
26 desc
->avl
= info
->useable
;
27 desc
->d
= info
->seg_32bit
;
28 desc
->g
= info
->limit_in_pages
;
30 desc
->base2
= (info
->base_addr
& 0xff000000) >> 24;
32 * Don't allow setting of the lm bit. It would confuse
33 * user_64bit_mode and would get overridden by sysret anyway.
38 extern struct desc_ptr idt_descr
;
39 extern gate_desc idt_table
[];
40 extern const struct desc_ptr debug_idt_descr
;
41 extern gate_desc debug_idt_table
[];
44 struct desc_struct gdt
[GDT_ENTRIES
];
45 } __attribute__((aligned(PAGE_SIZE
)));
47 DECLARE_PER_CPU_PAGE_ALIGNED(struct gdt_page
, gdt_page
);
49 /* Provide the original GDT */
50 static inline struct desc_struct
*get_cpu_gdt_rw(unsigned int cpu
)
52 return per_cpu(gdt_page
, cpu
).gdt
;
55 /* Provide the current original GDT */
56 static inline struct desc_struct
*get_current_gdt_rw(void)
58 return this_cpu_ptr(&gdt_page
)->gdt
;
61 /* Get the fixmap index for a specific processor */
62 static inline unsigned int get_cpu_gdt_ro_index(int cpu
)
64 return FIX_GDT_REMAP_BEGIN
+ cpu
;
67 /* Provide the fixmap address of the remapped GDT */
68 static inline struct desc_struct
*get_cpu_gdt_ro(int cpu
)
70 unsigned int idx
= get_cpu_gdt_ro_index(cpu
);
71 return (struct desc_struct
*)__fix_to_virt(idx
);
74 /* Provide the current read-only GDT */
75 static inline struct desc_struct
*get_current_gdt_ro(void)
77 return get_cpu_gdt_ro(smp_processor_id());
80 /* Provide the physical address of the GDT page. */
81 static inline phys_addr_t
get_cpu_gdt_paddr(unsigned int cpu
)
83 return per_cpu_ptr_to_phys(get_cpu_gdt_rw(cpu
));
88 static inline void pack_gate(gate_desc
*gate
, unsigned type
, unsigned long func
,
89 unsigned dpl
, unsigned ist
, unsigned seg
)
91 gate
->offset_low
= PTR_LOW(func
);
92 gate
->segment
= __KERNEL_CS
;
99 gate
->offset_middle
= PTR_MIDDLE(func
);
100 gate
->offset_high
= PTR_HIGH(func
);
104 static inline void pack_gate(gate_desc
*gate
, unsigned char type
,
105 unsigned long base
, unsigned dpl
, unsigned flags
,
108 gate
->a
= (seg
<< 16) | (base
& 0xffff);
109 gate
->b
= (base
& 0xffff0000) | (((0x80 | type
| (dpl
<< 5)) & 0xff) << 8);
114 static inline int desc_empty(const void *ptr
)
116 const u32
*desc
= ptr
;
118 return !(desc
[0] | desc
[1]);
121 #ifdef CONFIG_PARAVIRT
122 #include <asm/paravirt.h>
124 #define load_TR_desc() native_load_tr_desc()
125 #define load_gdt(dtr) native_load_gdt(dtr)
126 #define load_idt(dtr) native_load_idt(dtr)
127 #define load_tr(tr) asm volatile("ltr %0"::"m" (tr))
128 #define load_ldt(ldt) asm volatile("lldt %0"::"m" (ldt))
130 #define store_gdt(dtr) native_store_gdt(dtr)
131 #define store_idt(dtr) native_store_idt(dtr)
132 #define store_tr(tr) (tr = native_store_tr())
134 #define load_TLS(t, cpu) native_load_tls(t, cpu)
135 #define set_ldt native_set_ldt
137 #define write_ldt_entry(dt, entry, desc) native_write_ldt_entry(dt, entry, desc)
138 #define write_gdt_entry(dt, entry, desc, type) native_write_gdt_entry(dt, entry, desc, type)
139 #define write_idt_entry(dt, entry, g) native_write_idt_entry(dt, entry, g)
141 static inline void paravirt_alloc_ldt(struct desc_struct
*ldt
, unsigned entries
)
145 static inline void paravirt_free_ldt(struct desc_struct
*ldt
, unsigned entries
)
148 #endif /* CONFIG_PARAVIRT */
150 #define store_ldt(ldt) asm("sldt %0" : "=m"(ldt))
152 static inline void native_write_idt_entry(gate_desc
*idt
, int entry
, const gate_desc
*gate
)
154 memcpy(&idt
[entry
], gate
, sizeof(*gate
));
157 static inline void native_write_ldt_entry(struct desc_struct
*ldt
, int entry
, const void *desc
)
159 memcpy(&ldt
[entry
], desc
, 8);
163 native_write_gdt_entry(struct desc_struct
*gdt
, int entry
, const void *desc
, int type
)
168 case DESC_TSS
: size
= sizeof(tss_desc
); break;
169 case DESC_LDT
: size
= sizeof(ldt_desc
); break;
170 default: size
= sizeof(*gdt
); break;
173 memcpy(&gdt
[entry
], desc
, size
);
176 static inline void pack_descriptor(struct desc_struct
*desc
, unsigned long base
,
177 unsigned long limit
, unsigned char type
,
180 desc
->a
= ((base
& 0xffff) << 16) | (limit
& 0xffff);
181 desc
->b
= (base
& 0xff000000) | ((base
& 0xff0000) >> 16) |
182 (limit
& 0x000f0000) | ((type
& 0xff) << 8) |
183 ((flags
& 0xf) << 20);
188 static inline void set_tssldt_descriptor(void *d
, unsigned long addr
, unsigned type
, unsigned size
)
191 struct ldttss_desc64
*desc
= d
;
193 memset(desc
, 0, sizeof(*desc
));
195 desc
->limit0
= size
& 0xFFFF;
196 desc
->base0
= PTR_LOW(addr
);
197 desc
->base1
= PTR_MIDDLE(addr
) & 0xFF;
200 desc
->limit1
= (size
>> 16) & 0xF;
201 desc
->base2
= (PTR_MIDDLE(addr
) >> 8) & 0xFF;
202 desc
->base3
= PTR_HIGH(addr
);
204 pack_descriptor((struct desc_struct
*)d
, addr
, size
, 0x80 | type
, 0);
208 static inline void __set_tss_desc(unsigned cpu
, unsigned int entry
, void *addr
)
210 struct desc_struct
*d
= get_cpu_gdt_rw(cpu
);
213 set_tssldt_descriptor(&tss
, (unsigned long)addr
, DESC_TSS
,
215 write_gdt_entry(d
, entry
, &tss
, DESC_TSS
);
218 #define set_tss_desc(cpu, addr) __set_tss_desc(cpu, GDT_ENTRY_TSS, addr)
220 static inline void native_set_ldt(const void *addr
, unsigned int entries
)
222 if (likely(entries
== 0))
223 asm volatile("lldt %w0"::"q" (0));
225 unsigned cpu
= smp_processor_id();
228 set_tssldt_descriptor(&ldt
, (unsigned long)addr
, DESC_LDT
,
229 entries
* LDT_ENTRY_SIZE
- 1);
230 write_gdt_entry(get_cpu_gdt_rw(cpu
), GDT_ENTRY_LDT
,
232 asm volatile("lldt %w0"::"q" (GDT_ENTRY_LDT
*8));
236 static inline void native_load_gdt(const struct desc_ptr
*dtr
)
238 asm volatile("lgdt %0"::"m" (*dtr
));
241 static inline void native_load_idt(const struct desc_ptr
*dtr
)
243 asm volatile("lidt %0"::"m" (*dtr
));
246 static inline void native_store_gdt(struct desc_ptr
*dtr
)
248 asm volatile("sgdt %0":"=m" (*dtr
));
251 static inline void native_store_idt(struct desc_ptr
*dtr
)
253 asm volatile("sidt %0":"=m" (*dtr
));
257 * The LTR instruction marks the TSS GDT entry as busy. On 64-bit, the GDT is
258 * a read-only remapping. To prevent a page fault, the GDT is switched to the
259 * original writeable version when needed.
262 static inline void native_load_tr_desc(void)
265 int cpu
= raw_smp_processor_id();
267 struct desc_struct
*fixmap_gdt
;
269 native_store_gdt(&gdt
);
270 fixmap_gdt
= get_cpu_gdt_ro(cpu
);
273 * If the current GDT is the read-only fixmap, swap to the original
274 * writeable version. Swap back at the end.
276 if (gdt
.address
== (unsigned long)fixmap_gdt
) {
277 load_direct_gdt(cpu
);
280 asm volatile("ltr %w0"::"q" (GDT_ENTRY_TSS
*8));
282 load_fixmap_gdt(cpu
);
285 static inline void native_load_tr_desc(void)
287 asm volatile("ltr %w0"::"q" (GDT_ENTRY_TSS
*8));
291 static inline unsigned long native_store_tr(void)
295 asm volatile("str %0":"=r" (tr
));
300 static inline void native_load_tls(struct thread_struct
*t
, unsigned int cpu
)
302 struct desc_struct
*gdt
= get_cpu_gdt_rw(cpu
);
305 for (i
= 0; i
< GDT_ENTRY_TLS_ENTRIES
; i
++)
306 gdt
[GDT_ENTRY_TLS_MIN
+ i
] = t
->tls_array
[i
];
309 DECLARE_PER_CPU(bool, __tss_limit_invalid
);
311 static inline void force_reload_TR(void)
313 struct desc_struct
*d
= get_current_gdt_rw();
316 memcpy(&tss
, &d
[GDT_ENTRY_TSS
], sizeof(tss_desc
));
319 * LTR requires an available TSS, and the TSS is currently
320 * busy. Make it be available so that LTR will work.
323 write_gdt_entry(d
, GDT_ENTRY_TSS
, &tss
, DESC_TSS
);
326 this_cpu_write(__tss_limit_invalid
, false);
330 * Call this if you need the TSS limit to be correct, which should be the case
331 * if and only if you have TIF_IO_BITMAP set or you're switching to a task
332 * with TIF_IO_BITMAP set.
334 static inline void refresh_tss_limit(void)
336 DEBUG_LOCKS_WARN_ON(preemptible());
338 if (unlikely(this_cpu_read(__tss_limit_invalid
)))
343 * If you do something evil that corrupts the cached TSS limit (I'm looking
344 * at you, VMX exits), call this function.
346 * The optimization here is that the TSS limit only matters for Linux if the
347 * IO bitmap is in use. If the TSS limit gets forced to its minimum value,
348 * everything works except that IO bitmap will be ignored and all CPL 3 IO
349 * instructions will #GP, which is exactly what we want for normal tasks.
351 static inline void invalidate_tss_limit(void)
353 DEBUG_LOCKS_WARN_ON(preemptible());
355 if (unlikely(test_thread_flag(TIF_IO_BITMAP
)))
358 this_cpu_write(__tss_limit_invalid
, true);
361 /* This intentionally ignores lm, since 32-bit apps don't have that field. */
362 #define LDT_empty(info) \
363 ((info)->base_addr == 0 && \
364 (info)->limit == 0 && \
365 (info)->contents == 0 && \
366 (info)->read_exec_only == 1 && \
367 (info)->seg_32bit == 0 && \
368 (info)->limit_in_pages == 0 && \
369 (info)->seg_not_present == 1 && \
370 (info)->useable == 0)
372 /* Lots of programs expect an all-zero user_desc to mean "no segment at all". */
373 static inline bool LDT_zero(const struct user_desc
*info
)
375 return (info
->base_addr
== 0 &&
377 info
->contents
== 0 &&
378 info
->read_exec_only
== 0 &&
379 info
->seg_32bit
== 0 &&
380 info
->limit_in_pages
== 0 &&
381 info
->seg_not_present
== 0 &&
385 static inline void clear_LDT(void)
390 static inline unsigned long get_desc_base(const struct desc_struct
*desc
)
392 return (unsigned)(desc
->base0
| ((desc
->base1
) << 16) | ((desc
->base2
) << 24));
395 static inline void set_desc_base(struct desc_struct
*desc
, unsigned long base
)
397 desc
->base0
= base
& 0xffff;
398 desc
->base1
= (base
>> 16) & 0xff;
399 desc
->base2
= (base
>> 24) & 0xff;
402 static inline unsigned long get_desc_limit(const struct desc_struct
*desc
)
404 return desc
->limit0
| (desc
->limit
<< 16);
407 static inline void set_desc_limit(struct desc_struct
*desc
, unsigned long limit
)
409 desc
->limit0
= limit
& 0xffff;
410 desc
->limit
= (limit
>> 16) & 0xf;
414 static inline void set_nmi_gate(int gate
, void *addr
)
418 pack_gate(&s
, GATE_INTERRUPT
, (unsigned long)addr
, 0, 0, __KERNEL_CS
);
419 write_idt_entry(debug_idt_table
, gate
, &s
);
423 #ifdef CONFIG_TRACING
424 extern struct desc_ptr trace_idt_descr
;
425 extern gate_desc trace_idt_table
[];
426 static inline void write_trace_idt_entry(int entry
, const gate_desc
*gate
)
428 write_idt_entry(trace_idt_table
, entry
, gate
);
431 static inline void _trace_set_gate(int gate
, unsigned type
, void *addr
,
432 unsigned dpl
, unsigned ist
, unsigned seg
)
436 pack_gate(&s
, type
, (unsigned long)addr
, dpl
, ist
, seg
);
438 * does not need to be atomic because it is only done once at
441 write_trace_idt_entry(gate
, &s
);
444 static inline void write_trace_idt_entry(int entry
, const gate_desc
*gate
)
448 #define _trace_set_gate(gate, type, addr, dpl, ist, seg)
451 static inline void _set_gate(int gate
, unsigned type
, void *addr
,
452 unsigned dpl
, unsigned ist
, unsigned seg
)
456 pack_gate(&s
, type
, (unsigned long)addr
, dpl
, ist
, seg
);
458 * does not need to be atomic because it is only done once at
461 write_idt_entry(idt_table
, gate
, &s
);
462 write_trace_idt_entry(gate
, &s
);
466 * This needs to use 'idt_table' rather than 'idt', and
467 * thus use the _nonmapped_ version of the IDT, as the
468 * Pentium F0 0F bugfix can have resulted in the mapped
469 * IDT being write-protected.
471 #define set_intr_gate_notrace(n, addr) \
473 BUG_ON((unsigned)n > 0xFF); \
474 _set_gate(n, GATE_INTERRUPT, (void *)addr, 0, 0, \
478 #define set_intr_gate(n, addr) \
480 set_intr_gate_notrace(n, addr); \
481 _trace_set_gate(n, GATE_INTERRUPT, (void *)trace_##addr,\
482 0, 0, __KERNEL_CS); \
485 extern int first_system_vector
;
486 /* used_vectors is BITMAP for irq is not managed by percpu vector_irq */
487 extern unsigned long used_vectors
[];
489 static inline void alloc_system_vector(int vector
)
491 if (!test_bit(vector
, used_vectors
)) {
492 set_bit(vector
, used_vectors
);
493 if (first_system_vector
> vector
)
494 first_system_vector
= vector
;
500 #define alloc_intr_gate(n, addr) \
502 alloc_system_vector(n); \
503 set_intr_gate(n, addr); \
507 * This routine sets up an interrupt gate at directory privilege level 3.
509 static inline void set_system_intr_gate(unsigned int n
, void *addr
)
511 BUG_ON((unsigned)n
> 0xFF);
512 _set_gate(n
, GATE_INTERRUPT
, addr
, 0x3, 0, __KERNEL_CS
);
515 static inline void set_system_trap_gate(unsigned int n
, void *addr
)
517 BUG_ON((unsigned)n
> 0xFF);
518 _set_gate(n
, GATE_TRAP
, addr
, 0x3, 0, __KERNEL_CS
);
521 static inline void set_trap_gate(unsigned int n
, void *addr
)
523 BUG_ON((unsigned)n
> 0xFF);
524 _set_gate(n
, GATE_TRAP
, addr
, 0, 0, __KERNEL_CS
);
527 static inline void set_task_gate(unsigned int n
, unsigned int gdt_entry
)
529 BUG_ON((unsigned)n
> 0xFF);
530 _set_gate(n
, GATE_TASK
, (void *)0, 0, 0, (gdt_entry
<<3));
533 static inline void set_intr_gate_ist(int n
, void *addr
, unsigned ist
)
535 BUG_ON((unsigned)n
> 0xFF);
536 _set_gate(n
, GATE_INTERRUPT
, addr
, 0, ist
, __KERNEL_CS
);
539 static inline void set_system_intr_gate_ist(int n
, void *addr
, unsigned ist
)
541 BUG_ON((unsigned)n
> 0xFF);
542 _set_gate(n
, GATE_INTERRUPT
, addr
, 0x3, ist
, __KERNEL_CS
);
546 DECLARE_PER_CPU(u32
, debug_idt_ctr
);
547 static inline bool is_debug_idt_enabled(void)
549 if (this_cpu_read(debug_idt_ctr
))
555 static inline void load_debug_idt(void)
557 load_idt((const struct desc_ptr
*)&debug_idt_descr
);
560 static inline bool is_debug_idt_enabled(void)
565 static inline void load_debug_idt(void)
570 #ifdef CONFIG_TRACING
571 extern atomic_t trace_idt_ctr
;
572 static inline bool is_trace_idt_enabled(void)
574 if (atomic_read(&trace_idt_ctr
))
580 static inline void load_trace_idt(void)
582 load_idt((const struct desc_ptr
*)&trace_idt_descr
);
585 static inline bool is_trace_idt_enabled(void)
590 static inline void load_trace_idt(void)
596 * The load_current_idt() must be called with interrupts disabled
597 * to avoid races. That way the IDT will always be set back to the expected
598 * descriptor. It's also called when a CPU is being initialized, and
599 * that doesn't need to disable interrupts, as nothing should be
600 * bothering the CPU then.
602 static inline void load_current_idt(void)
604 if (is_debug_idt_enabled())
606 else if (is_trace_idt_enabled())
609 load_idt((const struct desc_ptr
*)&idt_descr
);
611 #endif /* _ASM_X86_DESC_H */