/* SPDX-License-Identifier: GPL-2.0 */
#ifndef _ASM_X86_DESC_H
#define _ASM_X86_DESC_H

#include <asm/desc_defs.h>
#include <asm/ldt.h>
#include <asm/mmu.h>
#include <asm/fixmap.h>
#include <asm/irq_vectors.h>
#include <asm/cpu_entry_area.h>

#include <linux/debug_locks.h>
#include <linux/smp.h>
#include <linux/percpu.h>

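/*
 * Convert a user-supplied struct user_desc (the modify_ldt()/set_thread_area()
 * ABI) into a hardware segment descriptor. DPL is forced to 3 and the accessed
 * bit is set so the descriptor can live in a read-only mapping.
 */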
static inline void fill_ldt(struct desc_struct *desc, const struct user_desc *info)
{
	desc->limit0 = info->limit & 0x0ffff;

	desc->base0 = (info->base_addr & 0x0000ffff);
	desc->base1 = (info->base_addr & 0x00ff0000) >> 16;

	desc->type = (info->read_exec_only ^ 1) << 1;
	desc->type |= info->contents << 2;
	/* Set the ACCESS bit so it can be mapped RO */
	desc->type |= 1;

	desc->s = 1;
	desc->dpl = 0x3;
	desc->p = info->seg_not_present ^ 1;
	desc->limit1 = (info->limit & 0xf0000) >> 16;
	desc->avl = info->useable;
	desc->d = info->seg_32bit;
	desc->g = info->limit_in_pages;

	desc->base2 = (info->base_addr & 0xff000000) >> 24;
	/*
	 * Don't allow setting of the lm bit. It would confuse
	 * user_64bit_mode and would get overridden by sysret anyway.
	 */
	desc->l = 0;
}

struct gdt_page {
	struct desc_struct gdt[GDT_ENTRIES];
} __attribute__((aligned(PAGE_SIZE)));

DECLARE_PER_CPU_PAGE_ALIGNED(struct gdt_page, gdt_page);
DECLARE_INIT_PER_CPU(gdt_page);

/* Provide the original GDT */
static inline struct desc_struct *get_cpu_gdt_rw(unsigned int cpu)
{
	return per_cpu(gdt_page, cpu).gdt;
}

/* Provide the current original GDT */
static inline struct desc_struct *get_current_gdt_rw(void)
{
	return this_cpu_ptr(&gdt_page)->gdt;
}

/* Provide the fixmap address of the remapped GDT */
static inline struct desc_struct *get_cpu_gdt_ro(int cpu)
{
	return (struct desc_struct *)&get_cpu_entry_area(cpu)->gdt;
}

/* Provide the current read-only GDT */
static inline struct desc_struct *get_current_gdt_ro(void)
{
	return get_cpu_gdt_ro(smp_processor_id());
}

/* Provide the physical address of the GDT page. */
static inline phys_addr_t get_cpu_gdt_paddr(unsigned int cpu)
{
	return per_cpu_ptr_to_phys(get_cpu_gdt_rw(cpu));
}

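/*
 * Pack an interrupt/trap gate descriptor. On 64-bit the code segment is
 * always __KERNEL_CS and an IST index may be set; on 32-bit the caller's
 * segment selector is used and there is no IST.
 */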
static inline void pack_gate(gate_desc *gate, unsigned type, unsigned long func,
			     unsigned dpl, unsigned ist, unsigned seg)
{
	gate->offset_low = (u16) func;
	gate->bits.p = 1;
	gate->bits.dpl = dpl;
	gate->bits.zero = 0;
	gate->bits.type = type;
	gate->offset_middle = (u16) (func >> 16);
#ifdef CONFIG_X86_64
	gate->segment = __KERNEL_CS;
	gate->bits.ist = ist;
	gate->reserved = 0;
	gate->offset_high = (u32) (func >> 32);
#else
	gate->segment = seg;
	gate->bits.ist = 0;
#endif
}

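/* A descriptor is "empty" when its first eight bytes are all zero. */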
static inline int desc_empty(const void *ptr)
{
	const u32 *desc = ptr;

	return !(desc[0] | desc[1]);
}

#ifdef CONFIG_PARAVIRT_XXL
#include <asm/paravirt.h>
#else
#define load_TR_desc() native_load_tr_desc()
#define load_gdt(dtr) native_load_gdt(dtr)
#define load_idt(dtr) native_load_idt(dtr)
#define load_tr(tr) asm volatile("ltr %0"::"m" (tr))
#define load_ldt(ldt) asm volatile("lldt %0"::"m" (ldt))

#define store_gdt(dtr) native_store_gdt(dtr)
#define store_tr(tr) (tr = native_store_tr())

#define load_TLS(t, cpu) native_load_tls(t, cpu)
#define set_ldt native_set_ldt

#define write_ldt_entry(dt, entry, desc) native_write_ldt_entry(dt, entry, desc)
#define write_gdt_entry(dt, entry, desc, type) native_write_gdt_entry(dt, entry, desc, type)
#define write_idt_entry(dt, entry, g) native_write_idt_entry(dt, entry, g)

static inline void paravirt_alloc_ldt(struct desc_struct *ldt, unsigned entries)
{
}

static inline void paravirt_free_ldt(struct desc_struct *ldt, unsigned entries)
{
}
#endif /* CONFIG_PARAVIRT_XXL */

#define store_ldt(ldt) asm("sldt %0" : "=m"(ldt))

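/*
 * Native descriptor-table writers: a plain memcpy of the new entry. Under
 * CONFIG_PARAVIRT_XXL the write_*_entry() wrappers above may be hooked
 * instead.
 */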
static inline void native_write_idt_entry(gate_desc *idt, int entry, const gate_desc *gate)
{
	memcpy(&idt[entry], gate, sizeof(*gate));
}

static inline void native_write_ldt_entry(struct desc_struct *ldt, int entry, const void *desc)
{
	memcpy(&ldt[entry], desc, 8);
}

static inline void
native_write_gdt_entry(struct desc_struct *gdt, int entry, const void *desc, int type)
{
	unsigned int size;

	switch (type) {
	case DESC_TSS: size = sizeof(tss_desc); break;
	case DESC_LDT: size = sizeof(ldt_desc); break;
	default: size = sizeof(*gdt); break;
	}

	memcpy(&gdt[entry], desc, size);
}

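/*
 * Build a TSS/LDT system descriptor for @addr with the given @type and
 * limit (@size). The high 32 bits of the base (base3) only exist on 64-bit,
 * where system descriptors are 16 bytes wide.
 */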
static inline void set_tssldt_descriptor(void *d, unsigned long addr,
					 unsigned type, unsigned size)
{
	struct ldttss_desc *desc = d;

	memset(desc, 0, sizeof(*desc));

	desc->limit0 = (u16) size;
	desc->base0 = (u16) addr;
	desc->base1 = (addr >> 16) & 0xFF;
	desc->type = type;
	desc->p = 1;
	desc->limit1 = (size >> 16) & 0xF;
	desc->base2 = (addr >> 24) & 0xFF;
#ifdef CONFIG_X86_64
	desc->base3 = (u32) (addr >> 32);
#endif
}

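/* Install the hardware TSS at @addr into @cpu's GDT slot @entry. */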
static inline void __set_tss_desc(unsigned cpu, unsigned int entry, struct x86_hw_tss *addr)
{
	struct desc_struct *d = get_cpu_gdt_rw(cpu);
	tss_desc tss;

	set_tssldt_descriptor(&tss, (unsigned long)addr, DESC_TSS,
			      __KERNEL_TSS_LIMIT);
	write_gdt_entry(d, entry, &tss, DESC_TSS);
}

#define set_tss_desc(cpu, addr) __set_tss_desc(cpu, GDT_ENTRY_TSS, addr)

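/*
 * Load LDTR. Zero entries loads the null selector; otherwise an LDT
 * descriptor covering @entries entries is written into this CPU's GDT
 * and its selector is loaded.
 */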
static inline void native_set_ldt(const void *addr, unsigned int entries)
{
	if (likely(entries == 0))
		asm volatile("lldt %w0"::"q" (0));
	else {
		unsigned cpu = smp_processor_id();
		ldt_desc ldt;

		set_tssldt_descriptor(&ldt, (unsigned long)addr, DESC_LDT,
				      entries * LDT_ENTRY_SIZE - 1);
		write_gdt_entry(get_cpu_gdt_rw(cpu), GDT_ENTRY_LDT,
				&ldt, DESC_LDT);
		asm volatile("lldt %w0"::"q" (GDT_ENTRY_LDT*8));
	}
}

static inline void native_load_gdt(const struct desc_ptr *dtr)
{
	asm volatile("lgdt %0"::"m" (*dtr));
}

static __always_inline void native_load_idt(const struct desc_ptr *dtr)
{
	asm volatile("lidt %0"::"m" (*dtr));
}

static inline void native_store_gdt(struct desc_ptr *dtr)
{
	asm volatile("sgdt %0":"=m" (*dtr));
}

static inline void store_idt(struct desc_ptr *dtr)
{
	asm volatile("sidt %0":"=m" (*dtr));
}

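/*
 * Load a base-0, limit-0 descriptor table pointer so the previous
 * GDT/IDT can no longer be referenced.
 */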
static inline void native_gdt_invalidate(void)
{
	const struct desc_ptr invalid_gdt = {
		.address = 0,
		.size = 0
	};

	native_load_gdt(&invalid_gdt);
}

static inline void native_idt_invalidate(void)
{
	const struct desc_ptr invalid_idt = {
		.address = 0,
		.size = 0
	};

	native_load_idt(&invalid_idt);
}

/*
 * The LTR instruction marks the TSS GDT entry as busy. On 64-bit, the GDT is
 * a read-only remapping. To prevent a page fault, the GDT is switched to the
 * original writeable version when needed.
 */
#ifdef CONFIG_X86_64
static inline void native_load_tr_desc(void)
{
	struct desc_ptr gdt;
	int cpu = raw_smp_processor_id();
	bool restore = 0;
	struct desc_struct *fixmap_gdt;

	native_store_gdt(&gdt);
	fixmap_gdt = get_cpu_gdt_ro(cpu);

	/*
	 * If the current GDT is the read-only fixmap, swap to the original
	 * writeable version. Swap back at the end.
	 */
	if (gdt.address == (unsigned long)fixmap_gdt) {
		load_direct_gdt(cpu);
		restore = 1;
	}
	asm volatile("ltr %w0"::"q" (GDT_ENTRY_TSS*8));
	if (restore)
		load_fixmap_gdt(cpu);
}
#else
static inline void native_load_tr_desc(void)
{
	asm volatile("ltr %w0"::"q" (GDT_ENTRY_TSS*8));
}
#endif

static inline unsigned long native_store_tr(void)
{
	unsigned long tr;

	asm volatile("str %0":"=r" (tr));

	return tr;
}

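/* Copy the thread's TLS descriptors into this CPU's GDT. */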
static inline void native_load_tls(struct thread_struct *t, unsigned int cpu)
{
	struct desc_struct *gdt = get_cpu_gdt_rw(cpu);
	unsigned int i;

	for (i = 0; i < GDT_ENTRY_TLS_ENTRIES; i++)
		gdt[GDT_ENTRY_TLS_MIN + i] = t->tls_array[i];
}

DECLARE_PER_CPU(bool, __tss_limit_invalid);

static inline void force_reload_TR(void)
{
	struct desc_struct *d = get_current_gdt_rw();
	tss_desc tss;

	memcpy(&tss, &d[GDT_ENTRY_TSS], sizeof(tss_desc));

	/*
	 * LTR requires an available TSS, and the TSS is currently
	 * busy. Make it be available so that LTR will work.
	 */
	tss.type = DESC_TSS;
	write_gdt_entry(d, GDT_ENTRY_TSS, &tss, DESC_TSS);

	load_TR_desc();
	this_cpu_write(__tss_limit_invalid, false);
}

/*
 * Call this if you need the TSS limit to be correct, which should be the case
 * if and only if you have TIF_IO_BITMAP set or you're switching to a task
 * with TIF_IO_BITMAP set.
 */
static inline void refresh_tss_limit(void)
{
	DEBUG_LOCKS_WARN_ON(preemptible());

	if (unlikely(this_cpu_read(__tss_limit_invalid)))
		force_reload_TR();
}

/*
 * If you do something evil that corrupts the cached TSS limit (I'm looking
 * at you, VMX exits), call this function.
 *
 * The optimization here is that the TSS limit only matters for Linux if the
 * IO bitmap is in use. If the TSS limit gets forced to its minimum value,
 * everything works except that IO bitmap will be ignored and all CPL 3 IO
 * instructions will #GP, which is exactly what we want for normal tasks.
 */
static inline void invalidate_tss_limit(void)
{
	DEBUG_LOCKS_WARN_ON(preemptible());

	if (unlikely(test_thread_flag(TIF_IO_BITMAP)))
		force_reload_TR();
	else
		this_cpu_write(__tss_limit_invalid, true);
}

/* This intentionally ignores lm, since 32-bit apps don't have that field. */
#define LDT_empty(info) \
	((info)->base_addr == 0 && \
	 (info)->limit == 0 && \
	 (info)->contents == 0 && \
	 (info)->read_exec_only == 1 && \
	 (info)->seg_32bit == 0 && \
	 (info)->limit_in_pages == 0 && \
	 (info)->seg_not_present == 1 && \
	 (info)->useable == 0)

/* Lots of programs expect an all-zero user_desc to mean "no segment at all". */
static inline bool LDT_zero(const struct user_desc *info)
{
	return (info->base_addr == 0 &&
		info->limit == 0 &&
		info->contents == 0 &&
		info->read_exec_only == 0 &&
		info->seg_32bit == 0 &&
		info->limit_in_pages == 0 &&
		info->seg_not_present == 0 &&
		info->useable == 0);
}

static inline void clear_LDT(void)
{
	set_ldt(NULL, 0);
}

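/* Accessors for the split base and limit fields of a segment descriptor. */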
static inline unsigned long get_desc_base(const struct desc_struct *desc)
{
	return (unsigned)(desc->base0 | ((desc->base1) << 16) | ((desc->base2) << 24));
}

static inline void set_desc_base(struct desc_struct *desc, unsigned long base)
{
	desc->base0 = base & 0xffff;
	desc->base1 = (base >> 16) & 0xff;
	desc->base2 = (base >> 24) & 0xff;
}

static inline unsigned long get_desc_limit(const struct desc_struct *desc)
{
	return desc->limit0 | (desc->limit1 << 16);
}

static inline void set_desc_limit(struct desc_struct *desc, unsigned long limit)
{
	desc->limit0 = limit & 0xffff;
	desc->limit1 = (limit >> 16) & 0xf;
}

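/*
 * Initialize an idt_data entry for vector @n: a present interrupt gate in
 * the kernel code segment, with the handler at @addr.
 */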
static inline void init_idt_data(struct idt_data *data, unsigned int n,
				 const void *addr)
{
	BUG_ON(n > 0xFF);

	memset(data, 0, sizeof(*data));
	data->vector = n;
	data->addr = addr;
	data->segment = __KERNEL_CS;
	data->bits.type = GATE_INTERRUPT;
	data->bits.p = 1;
}

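/* Translate an idt_data entry into the hardware gate_desc layout. */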
static inline void idt_init_desc(gate_desc *gate, const struct idt_data *d)
{
	unsigned long addr = (unsigned long) d->addr;

	gate->offset_low = (u16) addr;
	gate->segment = (u16) d->segment;
	gate->bits = d->bits;
	gate->offset_middle = (u16) (addr >> 16);
#ifdef CONFIG_X86_64
	gate->offset_high = (u32) (addr >> 32);
	gate->reserved = 0;
#endif
}

extern unsigned long system_vectors[];

extern void load_current_idt(void);
extern void idt_setup_early_handler(void);
extern void idt_setup_early_traps(void);
extern void idt_setup_traps(void);
extern void idt_setup_apic_and_irq_gates(void);
extern bool idt_is_f00f_address(unsigned long address);

#ifdef CONFIG_X86_64
extern void idt_setup_early_pf(void);
#else
static inline void idt_setup_early_pf(void) { }
#endif

extern void idt_invalidate(void);

#endif /* _ASM_X86_DESC_H */