Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 1 | #!/usr/bin/env python3 |
| 2 | # |
| 3 | # Copyright (c) 2017 Intel Corporation |
| 4 | # |
| 5 | # SPDX-License-Identifier: Apache-2.0 |
| 6 | |
Andrew Boie | b8cbf21 | 2019-02-24 11:36:31 -0800 | [diff] [blame] | 7 | """Generate a Global Descriptor Table (GDT) for x86 CPUs. |
| 8 | |
| 9 | For additional detail on GDT and x86 memory management, please |
| 10 | consult the IA Architecture SW Developer Manual, vol. 3. |
| 11 | |
| 12 | This script accepts as input the zephyr_prebuilt.elf binary, |
| 13 | which is a link of the Zephyr kernel without various build-time |
| 14 | generated data structures (such as the GDT) inserted into it. |
| 15 | This kernel image has been properly padded such that inserting |
| 16 | these data structures will not disturb the memory addresses of |
| 17 | other symbols. |
| 18 | |
Andrew Boie | 98bcc51 | 2020-07-17 19:02:30 -0700 | [diff] [blame^] | 19 | The input kernel ELF binary is used to obtain the following |
| 20 | information: |
| 21 | |
| 22 | - Memory addresses of the Main and Double Fault TSS structures |
| 23 | so GDT descriptors can be created for them |
| 24 | - Memory addresses of where the GDT lives in memory, so that this |
| 25 | address can be populated in the GDT pseudo descriptor |
| 26 | - whether userspace or HW stack protection are enabled in Kconfig |
| 27 | |
Andrew Boie | b8cbf21 | 2019-02-24 11:36:31 -0800 | [diff] [blame] | 28 | The output is a GDT whose contents depend on the kernel |
| 29 | configuration. With no memory protection features enabled, |
| 30 | we generate flat 32-bit code and data segments. If hardware- |
| 31 | based stack overflow protection or userspace is enabled, |
| 32 | we additionally create descriptors for the main and double- |
| 33 | fault IA tasks, needed for userspace privilege elevation and |
| 34 | double-fault handling. If userspace is enabled, we also create |
| 35 | flat code/data segments for ring 3 execution. |
| 36 | """ |
| 37 | |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 38 | import argparse |
| 39 | import sys |
| 40 | import struct |
| 41 | import os |
Andrew Boie | 3aecba1 | 2017-07-25 09:44:30 -0700 | [diff] [blame] | 42 | import elftools |
| 43 | from distutils.version import LooseVersion |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 44 | from elftools.elf.elffile import ELFFile |
| 45 | from elftools.elf.sections import SymbolTableSection |
| 46 | |
Andrew Boie | 3aecba1 | 2017-07-25 09:44:30 -0700 | [diff] [blame] | 47 | if LooseVersion(elftools.__version__) < LooseVersion('0.24'): |
Ulf Magnusson | 50b9b12 | 2019-09-07 14:41:01 +0200 | [diff] [blame] | 48 | sys.exit("pyelftools is out of date, need version 0.24 or later") |
Andrew Boie | 3aecba1 | 2017-07-25 09:44:30 -0700 | [diff] [blame] | 49 | |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 50 | |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 51 | def debug(text): |
| 52 | if not args.verbose: |
| 53 | return |
| 54 | sys.stdout.write(os.path.basename(sys.argv[0]) + ": " + text + "\n") |
| 55 | |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 56 | |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 57 | def error(text): |
Ulf Magnusson | 50b9b12 | 2019-09-07 14:41:01 +0200 | [diff] [blame] | 58 | sys.exit(os.path.basename(sys.argv[0]) + ": " + text) |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 59 | |
| 60 | |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 61 | gdt_pd_fmt = "<HIH" |
| 62 | |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 63 | FLAGS_GRAN = 1 << 7 # page granularity |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 64 | ACCESS_EX = 1 << 3 # executable |
| 65 | ACCESS_DC = 1 << 2 # direction/conforming |
| 66 | ACCESS_RW = 1 << 1 # read or write permission |
| 67 | |
| 68 | # 6 byte pseudo descriptor, but we're going to actually use this as the |
| 69 | # zero descriptor and return 8 bytes |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 70 | |
| 71 | |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 72 | def create_gdt_pseudo_desc(addr, size): |
Andrew Boie | a705eae | 2017-11-03 10:39:08 -0700 | [diff] [blame] | 73 | debug("create pseudo decriptor: %x %x" % (addr, size)) |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 74 | # ...and take back one byte for the Intel god whose Ark this is... |
| 75 | size = size - 1 |
| 76 | return struct.pack(gdt_pd_fmt, size, addr, 0) |
| 77 | |
| 78 | |
| 79 | # Limit argument always in bytes |
| 80 | def chop_base_limit(base, limit): |
| 81 | base_lo = base & 0xFFFF |
| 82 | base_mid = (base >> 16) & 0xFF |
| 83 | base_hi = (base >> 24) & 0xFF |
| 84 | |
| 85 | limit_lo = limit & 0xFFFF |
| 86 | limit_hi = (limit >> 16) & 0xF |
| 87 | |
| 88 | return (base_lo, base_mid, base_hi, limit_lo, limit_hi) |
| 89 | |
| 90 | |
| 91 | gdt_ent_fmt = "<HHBBBB" |
| 92 | |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 93 | |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 94 | def create_code_data_entry(base, limit, dpl, flags, access): |
Andrew Boie | a705eae | 2017-11-03 10:39:08 -0700 | [diff] [blame] | 95 | debug("create code or data entry: %x %x %x %x %x" % |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 96 | (base, limit, dpl, flags, access)) |
Andrew Boie | a705eae | 2017-11-03 10:39:08 -0700 | [diff] [blame] | 97 | |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 98 | base_lo, base_mid, base_hi, limit_lo, limit_hi = chop_base_limit(base, |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 99 | limit) |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 100 | |
| 101 | # This is a valid descriptor |
| 102 | present = 1 |
| 103 | |
| 104 | # 32-bit protected mode |
| 105 | size = 1 |
| 106 | |
| 107 | # 1 = code or data, 0 = system type |
| 108 | desc_type = 1 |
| 109 | |
| 110 | # Just set accessed to 1 already so the CPU doesn't need it update it, |
| 111 | # prevents freakouts if the GDT is in ROM, we don't care about this |
| 112 | # bit in the OS |
| 113 | accessed = 1 |
| 114 | |
Andrew Boie | a0da632 | 2017-08-01 09:30:09 -0700 | [diff] [blame] | 115 | access = access | (present << 7) | (dpl << 5) | (desc_type << 4) | accessed |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 116 | flags = flags | (size << 6) | limit_hi |
| 117 | |
| 118 | return struct.pack(gdt_ent_fmt, limit_lo, base_lo, base_mid, |
| 119 | access, flags, base_hi) |
| 120 | |
| 121 | |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 122 | def create_tss_entry(base, limit, dpl): |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 123 | debug("create TSS entry: %x %x %x" % (base, limit, dpl)) |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 124 | present = 1 |
| 125 | |
| 126 | base_lo, base_mid, base_hi, limit_lo, limit_hi, = chop_base_limit(base, |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 127 | limit) |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 128 | |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 129 | type_code = 0x9 # non-busy 32-bit TSS descriptor |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 130 | gran = 0 |
| 131 | |
| 132 | flags = (gran << 7) | limit_hi |
| 133 | type_byte = ((present << 7) | (dpl << 5) | type_code) |
| 134 | |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 135 | return struct.pack(gdt_ent_fmt, limit_lo, base_lo, base_mid, |
| 136 | type_byte, flags, base_hi) |
| 137 | |
| 138 | |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 139 | def get_symbols(obj): |
| 140 | for section in obj.iter_sections(): |
| 141 | if isinstance(section, SymbolTableSection): |
| 142 | return {sym.name: sym.entry.st_value |
| 143 | for sym in section.iter_symbols()} |
| 144 | |
| 145 | raise LookupError("Could not find symbol table") |
| 146 | |
| 147 | |
| 148 | def parse_args(): |
| 149 | global args |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 150 | parser = argparse.ArgumentParser( |
| 151 | description=__doc__, |
| 152 | formatter_class=argparse.RawDescriptionHelpFormatter) |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 153 | |
| 154 | parser.add_argument("-k", "--kernel", required=True, |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 155 | help="Zephyr kernel image") |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 156 | parser.add_argument("-v", "--verbose", action="store_true", |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 157 | help="Print extra debugging information") |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 158 | parser.add_argument("-o", "--output-gdt", required=True, |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 159 | help="output GDT binary") |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 160 | args = parser.parse_args() |
Sebastian Bøe | 4971d2a | 2017-12-28 17:34:50 +0100 | [diff] [blame] | 161 | if "VERBOSE" in os.environ: |
| 162 | args.verbose = 1 |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 163 | |
| 164 | |
| 165 | def main(): |
| 166 | parse_args() |
| 167 | |
| 168 | with open(args.kernel, "rb") as fp: |
| 169 | kernel = ELFFile(fp) |
| 170 | syms = get_symbols(kernel) |
| 171 | |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 172 | # NOTE: use-cases are extremely limited; we always have a basic flat |
| 173 | # code/data segments. If we are doing stack protection, we are going to |
| 174 | # have two TSS to manage the main task and the special task for double |
| 175 | # fault exception handling |
Andrew Boie | a705eae | 2017-11-03 10:39:08 -0700 | [diff] [blame] | 176 | if "CONFIG_USERSPACE" in syms: |
| 177 | num_entries = 7 |
| 178 | elif "CONFIG_HW_STACK_PROTECTION" in syms: |
| 179 | num_entries = 5 |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 180 | else: |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 181 | num_entries = 3 |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 182 | |
| 183 | gdt_base = syms["_gdt"] |
| 184 | |
| 185 | with open(args.output_gdt, "wb") as fp: |
| 186 | # The pseudo descriptor is stuffed into the NULL descriptor |
| 187 | # since the CPU never looks at it |
| 188 | fp.write(create_gdt_pseudo_desc(gdt_base, num_entries * 8)) |
| 189 | |
| 190 | # Selector 0x08: code descriptor |
| 191 | fp.write(create_code_data_entry(0, 0xFFFFF, 0, |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 192 | FLAGS_GRAN, ACCESS_EX | ACCESS_RW)) |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 193 | |
| 194 | # Selector 0x10: data descriptor |
| 195 | fp.write(create_code_data_entry(0, 0xFFFFF, 0, |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 196 | FLAGS_GRAN, ACCESS_RW)) |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 197 | |
Andrew Boie | a705eae | 2017-11-03 10:39:08 -0700 | [diff] [blame] | 198 | if num_entries >= 5: |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 199 | main_tss = syms["_main_tss"] |
| 200 | df_tss = syms["_df_tss"] |
| 201 | |
| 202 | # Selector 0x18: main TSS |
| 203 | fp.write(create_tss_entry(main_tss, 0x67, 0)) |
| 204 | |
| 205 | # Selector 0x20: double-fault TSS |
| 206 | fp.write(create_tss_entry(df_tss, 0x67, 0)) |
| 207 | |
Andrew Boie | a705eae | 2017-11-03 10:39:08 -0700 | [diff] [blame] | 208 | if num_entries == 7: |
| 209 | # Selector 0x28: code descriptor, dpl = 3 |
| 210 | fp.write(create_code_data_entry(0, 0xFFFFF, 3, |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 211 | FLAGS_GRAN, ACCESS_EX | ACCESS_RW)) |
Andrew Boie | 424e993 | 2017-08-30 14:06:30 -0700 | [diff] [blame] | 212 | |
Andrew Boie | a705eae | 2017-11-03 10:39:08 -0700 | [diff] [blame] | 213 | # Selector 0x30: data descriptor, dpl = 3 |
| 214 | fp.write(create_code_data_entry(0, 0xFFFFF, 3, |
Anas Nashif | 7256553 | 2017-12-12 08:19:25 -0500 | [diff] [blame] | 215 | FLAGS_GRAN, ACCESS_RW)) |
Andrew Boie | 424e993 | 2017-08-30 14:06:30 -0700 | [diff] [blame] | 216 | |
Andrew Boie | bc666ae | 2017-07-14 16:35:17 -0700 | [diff] [blame] | 217 | |
Andrew Boie | 08c2913 | 2017-07-14 15:29:17 -0700 | [diff] [blame] | 218 | if __name__ == "__main__": |
| 219 | main() |