/* SPDX-License-Identifier: GPL-2.0 */
#ifndef _ASM_X86_DESC_H
#define _ASM_X86_DESC_H

#include <asm/desc_defs.h>
#include <asm/ldt.h>
#include <asm/mmu.h>
#include <asm/fixmap.h>
#include <asm/irq_vectors.h>
#include <asm/cpu_entry_area.h>

#include <linux/smp.h>
#include <linux/percpu.h>

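/*
 * Pack a user-supplied segment description (a struct user_desc, as passed
 * to modify_ldt() or set_thread_area()) into a hardware segment
 * descriptor.  The DPL is forced to 3, and the accessed bit is pre-set so
 * the descriptor can live in a read-only mapping without faulting when it
 * is first used.
 */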
static inline void fill_ldt(struct desc_struct *desc, const struct user_desc *info)
{
	desc->limit0 = info->limit & 0x0ffff;

	desc->base0 = (info->base_addr & 0x0000ffff);
	desc->base1 = (info->base_addr & 0x00ff0000) >> 16;

	desc->type = (info->read_exec_only ^ 1) << 1;
	desc->type |= info->contents << 2;
	/* Set the ACCESS bit so it can be mapped RO */
	desc->type |= 1;

	desc->s = 1;
	desc->dpl = 0x3;
	desc->p = info->seg_not_present ^ 1;
	desc->limit1 = (info->limit & 0xf0000) >> 16;
	desc->avl = info->useable;
	desc->d = info->seg_32bit;
	desc->g = info->limit_in_pages;

	desc->base2 = (info->base_addr & 0xff000000) >> 24;
	/*
	 * Don't allow setting of the lm bit. It would confuse
	 * user_64bit_mode and would get overridden by sysret anyway.
	 */
	desc->l = 0;
}
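/*
 * Illustrative example (not taken from the kernel sources): a zero-based
 * user_desc with limit = 0xfffff, seg_32bit = 1 and limit_in_pages = 1
 * packs into a flat 4 GiB, DPL-3 segment with the accessed bit set.
 */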

struct gdt_page {
	struct desc_struct gdt[GDT_ENTRIES];
} __attribute__((aligned(PAGE_SIZE)));

DECLARE_PER_CPU_PAGE_ALIGNED(struct gdt_page, gdt_page);

/* Provide the original GDT */
static inline struct desc_struct *get_cpu_gdt_rw(unsigned int cpu)
{
	return per_cpu(gdt_page, cpu).gdt;
}

/* Provide the current original GDT */
static inline struct desc_struct *get_current_gdt_rw(void)
{
	return this_cpu_ptr(&gdt_page)->gdt;
}

/* Provide the fixmap address of the remapped GDT */
static inline struct desc_struct *get_cpu_gdt_ro(int cpu)
{
	return (struct desc_struct *)&get_cpu_entry_area(cpu)->gdt;
}

/* Provide the current read-only GDT */
static inline struct desc_struct *get_current_gdt_ro(void)
{
	return get_cpu_gdt_ro(smp_processor_id());
}

/* Provide the physical address of the GDT page. */
static inline phys_addr_t get_cpu_gdt_paddr(unsigned int cpu)
{
	return per_cpu_ptr_to_phys(get_cpu_gdt_rw(cpu));
}

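/*
 * Pack an IDT gate descriptor.  On 64-bit the handler offset spans three
 * fields (offset_low/middle/high), the segment is always __KERNEL_CS, and
 * the caller may request an IST stack; on 32-bit the caller supplies the
 * segment and there is no IST.
 */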
static inline void pack_gate(gate_desc *gate, unsigned type, unsigned long func,
			     unsigned dpl, unsigned ist, unsigned seg)
{
	gate->offset_low = (u16) func;
	gate->bits.p = 1;
	gate->bits.dpl = dpl;
	gate->bits.zero = 0;
	gate->bits.type = type;
	gate->offset_middle = (u16) (func >> 16);
#ifdef CONFIG_X86_64
	gate->segment = __KERNEL_CS;
	gate->bits.ist = ist;
	gate->reserved = 0;
	gate->offset_high = (u32) (func >> 32);
#else
	gate->segment = seg;
	gate->bits.ist = 0;
#endif
}

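/* A descriptor slot is considered empty when all eight bytes are zero. */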
static inline int desc_empty(const void *ptr)
{
	const u32 *desc = ptr;

	return !(desc[0] | desc[1]);
}

#ifdef CONFIG_PARAVIRT_XXL
#include <asm/paravirt.h>
#else
#define load_TR_desc() native_load_tr_desc()
#define load_gdt(dtr) native_load_gdt(dtr)
#define load_idt(dtr) native_load_idt(dtr)
#define load_tr(tr) asm volatile("ltr %0"::"m" (tr))
#define load_ldt(ldt) asm volatile("lldt %0"::"m" (ldt))

#define store_gdt(dtr) native_store_gdt(dtr)
#define store_tr(tr) (tr = native_store_tr())

#define load_TLS(t, cpu) native_load_tls(t, cpu)
#define set_ldt native_set_ldt

#define write_ldt_entry(dt, entry, desc) native_write_ldt_entry(dt, entry, desc)
#define write_gdt_entry(dt, entry, desc, type) native_write_gdt_entry(dt, entry, desc, type)
#define write_idt_entry(dt, entry, g) native_write_idt_entry(dt, entry, g)

static inline void paravirt_alloc_ldt(struct desc_struct *ldt, unsigned entries)
{
}

static inline void paravirt_free_ldt(struct desc_struct *ldt, unsigned entries)
{
}
#endif /* CONFIG_PARAVIRT_XXL */

#define store_ldt(ldt) asm("sldt %0" : "=m"(ldt))

static inline void native_write_idt_entry(gate_desc *idt, int entry, const gate_desc *gate)
{
	memcpy(&idt[entry], gate, sizeof(*gate));
}

static inline void native_write_ldt_entry(struct desc_struct *ldt, int entry, const void *desc)
{
	memcpy(&ldt[entry], desc, 8);
}

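/*
 * On 64-bit, system descriptors (TSS and LDT) occupy 16 bytes instead of
 * the usual 8, so the copy length below depends on the entry type.
 */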
static inline void
native_write_gdt_entry(struct desc_struct *gdt, int entry, const void *desc, int type)
{
	unsigned int size;

	switch (type) {
	case DESC_TSS: size = sizeof(tss_desc); break;
	case DESC_LDT: size = sizeof(ldt_desc); break;
	default: size = sizeof(*gdt); break;
	}

	memcpy(&gdt[entry], desc, size);
}

static inline void set_tssldt_descriptor(void *d, unsigned long addr,
					 unsigned type, unsigned size)
{
	struct ldttss_desc *desc = d;

	memset(desc, 0, sizeof(*desc));

	desc->limit0 = (u16) size;
	desc->base0 = (u16) addr;
	desc->base1 = (addr >> 16) & 0xFF;
	desc->type = type;
	desc->p = 1;
	desc->limit1 = (size >> 16) & 0xF;
	desc->base2 = (addr >> 24) & 0xFF;
#ifdef CONFIG_X86_64
	desc->base3 = (u32) (addr >> 32);
#endif
}

static inline void __set_tss_desc(unsigned cpu, unsigned int entry, struct x86_hw_tss *addr)
{
	struct desc_struct *d = get_cpu_gdt_rw(cpu);
	tss_desc tss;

	set_tssldt_descriptor(&tss, (unsigned long)addr, DESC_TSS,
			      __KERNEL_TSS_LIMIT);
	write_gdt_entry(d, entry, &tss, DESC_TSS);
}

#define set_tss_desc(cpu, addr) __set_tss_desc(cpu, GDT_ENTRY_TSS, addr)

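/*
 * Install an LDT: entries == 0 loads a null selector (no LDT at all);
 * otherwise a transient LDT descriptor covering the table is written into
 * this CPU's GDT and then loaded with lldt.
 */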
static inline void native_set_ldt(const void *addr, unsigned int entries)
{
	if (likely(entries == 0))
		asm volatile("lldt %w0"::"q" (0));
	else {
		unsigned cpu = smp_processor_id();
		ldt_desc ldt;

		set_tssldt_descriptor(&ldt, (unsigned long)addr, DESC_LDT,
				      entries * LDT_ENTRY_SIZE - 1);
		write_gdt_entry(get_cpu_gdt_rw(cpu), GDT_ENTRY_LDT,
				&ldt, DESC_LDT);
		asm volatile("lldt %w0"::"q" (GDT_ENTRY_LDT*8));
	}
}

static inline void native_load_gdt(const struct desc_ptr *dtr)
{
	asm volatile("lgdt %0"::"m" (*dtr));
}

static __always_inline void native_load_idt(const struct desc_ptr *dtr)
{
	asm volatile("lidt %0"::"m" (*dtr));
}

static inline void native_store_gdt(struct desc_ptr *dtr)
{
	asm volatile("sgdt %0":"=m" (*dtr));
}

static inline void store_idt(struct desc_ptr *dtr)
{
	asm volatile("sidt %0":"=m" (*dtr));
}

/*
 * The LTR instruction marks the TSS GDT entry as busy. On 64-bit, the GDT is
 * a read-only remapping. To prevent a page fault, the GDT is switched to the
 * original writeable version when needed.
 */
#ifdef CONFIG_X86_64
static inline void native_load_tr_desc(void)
{
	struct desc_ptr gdt;
	int cpu = raw_smp_processor_id();
	bool restore = false;
	struct desc_struct *fixmap_gdt;

	native_store_gdt(&gdt);
	fixmap_gdt = get_cpu_gdt_ro(cpu);

	/*
	 * If the current GDT is the read-only fixmap, swap to the original
	 * writeable version. Swap back at the end.
	 */
	if (gdt.address == (unsigned long)fixmap_gdt) {
		load_direct_gdt(cpu);
		restore = true;
	}
	asm volatile("ltr %w0"::"q" (GDT_ENTRY_TSS*8));
	if (restore)
		load_fixmap_gdt(cpu);
}
#else
static inline void native_load_tr_desc(void)
{
	asm volatile("ltr %w0"::"q" (GDT_ENTRY_TSS*8));
}
#endif

static inline unsigned long native_store_tr(void)
{
	unsigned long tr;

	asm volatile("str %0":"=r" (tr));

	return tr;
}

static inline void native_load_tls(struct thread_struct *t, unsigned int cpu)
{
	struct desc_struct *gdt = get_cpu_gdt_rw(cpu);
	unsigned int i;

	for (i = 0; i < GDT_ENTRY_TLS_ENTRIES; i++)
		gdt[GDT_ENTRY_TLS_MIN + i] = t->tls_array[i];
}

DECLARE_PER_CPU(bool, __tss_limit_invalid);

static inline void force_reload_TR(void)
{
	struct desc_struct *d = get_current_gdt_rw();
	tss_desc tss;

	memcpy(&tss, &d[GDT_ENTRY_TSS], sizeof(tss_desc));

	/*
	 * LTR requires an available TSS, and the TSS is currently
	 * busy. Mark it available so that LTR will work.
	 */
	tss.type = DESC_TSS;
	write_gdt_entry(d, GDT_ENTRY_TSS, &tss, DESC_TSS);

	load_TR_desc();
	this_cpu_write(__tss_limit_invalid, false);
}

/*
 * Call this if you need the TSS limit to be correct, which should be the case
 * if and only if you have TIF_IO_BITMAP set or you're switching to a task
 * with TIF_IO_BITMAP set.
 */
static inline void refresh_tss_limit(void)
{
	DEBUG_LOCKS_WARN_ON(preemptible());

	if (unlikely(this_cpu_read(__tss_limit_invalid)))
		force_reload_TR();
}

/*
 * If you do something evil that corrupts the cached TSS limit (I'm looking
 * at you, VMX exits), call this function.
 *
 * The optimization here is that the TSS limit only matters for Linux if the
 * IO bitmap is in use. If the TSS limit gets forced to its minimum value,
 * everything works except that the IO bitmap will be ignored and all CPL 3
 * IO instructions will #GP, which is exactly what we want for normal tasks.
 */
static inline void invalidate_tss_limit(void)
{
	DEBUG_LOCKS_WARN_ON(preemptible());

	if (unlikely(test_thread_flag(TIF_IO_BITMAP)))
		force_reload_TR();
	else
		this_cpu_write(__tss_limit_invalid, true);
}
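/*
 * Usage sketch (illustrative): KVM's VMX code is one such caller, since a
 * VM exit hardware-reloads TR with a truncated limit behind the kernel's
 * back.
 */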

/* This intentionally ignores lm, since 32-bit apps don't have that field. */
#define LDT_empty(info) \
	((info)->base_addr == 0 && \
	 (info)->limit == 0 && \
	 (info)->contents == 0 && \
	 (info)->read_exec_only == 1 && \
	 (info)->seg_32bit == 0 && \
	 (info)->limit_in_pages == 0 && \
	 (info)->seg_not_present == 1 && \
	 (info)->useable == 0)

/* Lots of programs expect an all-zero user_desc to mean "no segment at all". */
static inline bool LDT_zero(const struct user_desc *info)
{
	return (info->base_addr == 0 &&
		info->limit == 0 &&
		info->contents == 0 &&
		info->read_exec_only == 0 &&
		info->seg_32bit == 0 &&
		info->limit_in_pages == 0 &&
		info->seg_not_present == 0 &&
		info->useable == 0);
}

static inline void clear_LDT(void)
{
	set_ldt(NULL, 0);
}

static inline unsigned long get_desc_base(const struct desc_struct *desc)
{
	return (unsigned)(desc->base0 | ((desc->base1) << 16) | ((desc->base2) << 24));
}

static inline void set_desc_base(struct desc_struct *desc, unsigned long base)
{
	desc->base0 = base & 0xffff;
	desc->base1 = (base >> 16) & 0xff;
	desc->base2 = (base >> 24) & 0xff;
}

static inline unsigned long get_desc_limit(const struct desc_struct *desc)
{
	return desc->limit0 | (desc->limit1 << 16);
}

static inline void set_desc_limit(struct desc_struct *desc, unsigned long limit)
{
	desc->limit0 = limit & 0xffff;
	desc->limit1 = (limit >> 16) & 0xf;
}
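/*
 * Illustrative example: set_desc_base(desc, 0x12345678) stores 0x5678 in
 * base0, 0x34 in base1 and 0x12 in base2; get_desc_base() then reassembles
 * the full 32-bit base.
 */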

void alloc_intr_gate(unsigned int n, const void *addr);

static inline void init_idt_data(struct idt_data *data, unsigned int n,
				 const void *addr)
{
	BUG_ON(n > 0xFF);

	memset(data, 0, sizeof(*data));
	data->vector = n;
	data->addr = addr;
	data->segment = __KERNEL_CS;
	data->bits.type = GATE_INTERRUPT;
	data->bits.p = 1;
}

static inline void idt_init_desc(gate_desc *gate, const struct idt_data *d)
{
	unsigned long addr = (unsigned long) d->addr;

	gate->offset_low = (u16) addr;
	gate->segment = (u16) d->segment;
	gate->bits = d->bits;
	gate->offset_middle = (u16) (addr >> 16);
#ifdef CONFIG_X86_64
	gate->offset_high = (u32) (addr >> 32);
	gate->reserved = 0;
#endif
}

extern unsigned long system_vectors[];

extern void load_current_idt(void);
extern void idt_setup_early_handler(void);
extern void idt_setup_early_traps(void);
extern void idt_setup_traps(void);
extern void idt_setup_apic_and_irq_gates(void);
extern bool idt_is_f00f_address(unsigned long address);

#ifdef CONFIG_X86_64
extern void idt_setup_early_pf(void);
extern void idt_setup_ist_traps(void);
#else
static inline void idt_setup_early_pf(void) { }
static inline void idt_setup_ist_traps(void) { }
#endif

extern void idt_invalidate(void *addr);

#endif /* _ASM_X86_DESC_H */