blob: 32124156de6ec8a31bf0861f4787b75436d3762f [file] [log] [blame]
Andrew Boie08c29132017-07-14 15:29:17 -07001#!/usr/bin/env python3
2#
3# Copyright (c) 2017 Intel Corporation
4#
5# SPDX-License-Identifier: Apache-2.0
6
Andrew Boieb8cbf212019-02-24 11:36:31 -08007"""Generate a Global Descriptor Table (GDT) for x86 CPUs.
8
9For additional detail on GDT and x86 memory management, please
10consult the IA Architecture SW Developer Manual, vol. 3.
11
12This script accepts as input the zephyr_prebuilt.elf binary,
13which is a link of the Zephyr kernel without various build-time
14generated data structures (such as the GDT) inserted into it.
15This kernel image has been properly padded such that inserting
16these data structures will not disturb the memory addresses of
17other symbols.
18
Andrew Boie98bcc512020-07-17 19:02:30 -070019The input kernel ELF binary is used to obtain the following
20information:
21
22- Memory addresses of the Main and Double Fault TSS structures
23 so GDT descriptors can be created for them
24- Memory addresses of where the GDT lives in memory, so that this
25 address can be populated in the GDT pseudo descriptor
26- whether userspace or HW stack protection are enabled in Kconfig
27
Andrew Boieb8cbf212019-02-24 11:36:31 -080028The output is a GDT whose contents depend on the kernel
29configuration. With no memory protection features enabled,
30we generate flat 32-bit code and data segments. If hardware-
31based stack overflow protection or userspace is enabled,
32we additionally create descriptors for the main and double-
33fault IA tasks, needed for userspace privilege elevation and
34double-fault handling. If userspace is enabled, we also create
35flat code/data segments for ring 3 execution.
36"""
37
Andrew Boie08c29132017-07-14 15:29:17 -070038import argparse
39import sys
40import struct
41import os
Andrew Boie3aecba12017-07-25 09:44:30 -070042import elftools
43from distutils.version import LooseVersion
Andrew Boie08c29132017-07-14 15:29:17 -070044from elftools.elf.elffile import ELFFile
45from elftools.elf.sections import SymbolTableSection
46
Andrew Boie3aecba12017-07-25 09:44:30 -070047if LooseVersion(elftools.__version__) < LooseVersion('0.24'):
Ulf Magnusson50b9b122019-09-07 14:41:01 +020048 sys.exit("pyelftools is out of date, need version 0.24 or later")
Andrew Boie3aecba12017-07-25 09:44:30 -070049
Anas Nashif72565532017-12-12 08:19:25 -050050
Andrew Boiebc666ae2017-07-14 16:35:17 -070051def debug(text):
52 if not args.verbose:
53 return
54 sys.stdout.write(os.path.basename(sys.argv[0]) + ": " + text + "\n")
55
Anas Nashif72565532017-12-12 08:19:25 -050056
Andrew Boiebc666ae2017-07-14 16:35:17 -070057def error(text):
Ulf Magnusson50b9b122019-09-07 14:41:01 +020058 sys.exit(os.path.basename(sys.argv[0]) + ": " + text)
Andrew Boiebc666ae2017-07-14 16:35:17 -070059
60
Andrew Boie08c29132017-07-14 15:29:17 -070061gdt_pd_fmt = "<HIH"
62
Anas Nashif72565532017-12-12 08:19:25 -050063FLAGS_GRAN = 1 << 7 # page granularity
Andrew Boie08c29132017-07-14 15:29:17 -070064ACCESS_EX = 1 << 3 # executable
65ACCESS_DC = 1 << 2 # direction/conforming
66ACCESS_RW = 1 << 1 # read or write permission
67
68# 6 byte pseudo descriptor, but we're going to actually use this as the
69# zero descriptor and return 8 bytes
Anas Nashif72565532017-12-12 08:19:25 -050070
71
Andrew Boie08c29132017-07-14 15:29:17 -070072def create_gdt_pseudo_desc(addr, size):
Andrew Boiea705eae2017-11-03 10:39:08 -070073 debug("create pseudo decriptor: %x %x" % (addr, size))
Andrew Boie08c29132017-07-14 15:29:17 -070074 # ...and take back one byte for the Intel god whose Ark this is...
75 size = size - 1
76 return struct.pack(gdt_pd_fmt, size, addr, 0)
77
78
79# Limit argument always in bytes
80def chop_base_limit(base, limit):
81 base_lo = base & 0xFFFF
82 base_mid = (base >> 16) & 0xFF
83 base_hi = (base >> 24) & 0xFF
84
85 limit_lo = limit & 0xFFFF
86 limit_hi = (limit >> 16) & 0xF
87
88 return (base_lo, base_mid, base_hi, limit_lo, limit_hi)
89
90
91gdt_ent_fmt = "<HHBBBB"
92
Anas Nashif72565532017-12-12 08:19:25 -050093
Andrew Boie08c29132017-07-14 15:29:17 -070094def create_code_data_entry(base, limit, dpl, flags, access):
Andrew Boiea705eae2017-11-03 10:39:08 -070095 debug("create code or data entry: %x %x %x %x %x" %
Anas Nashif72565532017-12-12 08:19:25 -050096 (base, limit, dpl, flags, access))
Andrew Boiea705eae2017-11-03 10:39:08 -070097
Andrew Boie08c29132017-07-14 15:29:17 -070098 base_lo, base_mid, base_hi, limit_lo, limit_hi = chop_base_limit(base,
Anas Nashif72565532017-12-12 08:19:25 -050099 limit)
Andrew Boie08c29132017-07-14 15:29:17 -0700100
101 # This is a valid descriptor
102 present = 1
103
104 # 32-bit protected mode
105 size = 1
106
107 # 1 = code or data, 0 = system type
108 desc_type = 1
109
110 # Just set accessed to 1 already so the CPU doesn't need it update it,
111 # prevents freakouts if the GDT is in ROM, we don't care about this
112 # bit in the OS
113 accessed = 1
114
Andrew Boiea0da6322017-08-01 09:30:09 -0700115 access = access | (present << 7) | (dpl << 5) | (desc_type << 4) | accessed
Andrew Boie08c29132017-07-14 15:29:17 -0700116 flags = flags | (size << 6) | limit_hi
117
118 return struct.pack(gdt_ent_fmt, limit_lo, base_lo, base_mid,
119 access, flags, base_hi)
120
121
Andrew Boiebc666ae2017-07-14 16:35:17 -0700122def create_tss_entry(base, limit, dpl):
Anas Nashif72565532017-12-12 08:19:25 -0500123 debug("create TSS entry: %x %x %x" % (base, limit, dpl))
Andrew Boiebc666ae2017-07-14 16:35:17 -0700124 present = 1
125
126 base_lo, base_mid, base_hi, limit_lo, limit_hi, = chop_base_limit(base,
Anas Nashif72565532017-12-12 08:19:25 -0500127 limit)
Andrew Boiebc666ae2017-07-14 16:35:17 -0700128
Anas Nashif72565532017-12-12 08:19:25 -0500129 type_code = 0x9 # non-busy 32-bit TSS descriptor
Andrew Boiebc666ae2017-07-14 16:35:17 -0700130 gran = 0
131
132 flags = (gran << 7) | limit_hi
133 type_byte = ((present << 7) | (dpl << 5) | type_code)
134
Andrew Boiebc666ae2017-07-14 16:35:17 -0700135 return struct.pack(gdt_ent_fmt, limit_lo, base_lo, base_mid,
136 type_byte, flags, base_hi)
137
138
Andrew Boie08c29132017-07-14 15:29:17 -0700139def get_symbols(obj):
140 for section in obj.iter_sections():
141 if isinstance(section, SymbolTableSection):
142 return {sym.name: sym.entry.st_value
143 for sym in section.iter_symbols()}
144
145 raise LookupError("Could not find symbol table")
146
147
148def parse_args():
149 global args
Anas Nashif72565532017-12-12 08:19:25 -0500150 parser = argparse.ArgumentParser(
151 description=__doc__,
152 formatter_class=argparse.RawDescriptionHelpFormatter)
Andrew Boie08c29132017-07-14 15:29:17 -0700153
154 parser.add_argument("-k", "--kernel", required=True,
Anas Nashif72565532017-12-12 08:19:25 -0500155 help="Zephyr kernel image")
Andrew Boie08c29132017-07-14 15:29:17 -0700156 parser.add_argument("-v", "--verbose", action="store_true",
Anas Nashif72565532017-12-12 08:19:25 -0500157 help="Print extra debugging information")
Andrew Boie08c29132017-07-14 15:29:17 -0700158 parser.add_argument("-o", "--output-gdt", required=True,
Anas Nashif72565532017-12-12 08:19:25 -0500159 help="output GDT binary")
Andrew Boie08c29132017-07-14 15:29:17 -0700160 args = parser.parse_args()
Sebastian Bøe4971d2a2017-12-28 17:34:50 +0100161 if "VERBOSE" in os.environ:
162 args.verbose = 1
Andrew Boie08c29132017-07-14 15:29:17 -0700163
164
165def main():
166 parse_args()
167
168 with open(args.kernel, "rb") as fp:
169 kernel = ELFFile(fp)
170 syms = get_symbols(kernel)
171
Andrew Boiebc666ae2017-07-14 16:35:17 -0700172 # NOTE: use-cases are extremely limited; we always have a basic flat
173 # code/data segments. If we are doing stack protection, we are going to
174 # have two TSS to manage the main task and the special task for double
175 # fault exception handling
Andrew Boiea705eae2017-11-03 10:39:08 -0700176 if "CONFIG_USERSPACE" in syms:
177 num_entries = 7
178 elif "CONFIG_HW_STACK_PROTECTION" in syms:
179 num_entries = 5
Andrew Boiebc666ae2017-07-14 16:35:17 -0700180 else:
Andrew Boiebc666ae2017-07-14 16:35:17 -0700181 num_entries = 3
Andrew Boie08c29132017-07-14 15:29:17 -0700182
183 gdt_base = syms["_gdt"]
184
185 with open(args.output_gdt, "wb") as fp:
186 # The pseudo descriptor is stuffed into the NULL descriptor
187 # since the CPU never looks at it
188 fp.write(create_gdt_pseudo_desc(gdt_base, num_entries * 8))
189
190 # Selector 0x08: code descriptor
191 fp.write(create_code_data_entry(0, 0xFFFFF, 0,
Anas Nashif72565532017-12-12 08:19:25 -0500192 FLAGS_GRAN, ACCESS_EX | ACCESS_RW))
Andrew Boie08c29132017-07-14 15:29:17 -0700193
194 # Selector 0x10: data descriptor
195 fp.write(create_code_data_entry(0, 0xFFFFF, 0,
Anas Nashif72565532017-12-12 08:19:25 -0500196 FLAGS_GRAN, ACCESS_RW))
Andrew Boie08c29132017-07-14 15:29:17 -0700197
Andrew Boiea705eae2017-11-03 10:39:08 -0700198 if num_entries >= 5:
Andrew Boiebc666ae2017-07-14 16:35:17 -0700199 main_tss = syms["_main_tss"]
200 df_tss = syms["_df_tss"]
201
202 # Selector 0x18: main TSS
203 fp.write(create_tss_entry(main_tss, 0x67, 0))
204
205 # Selector 0x20: double-fault TSS
206 fp.write(create_tss_entry(df_tss, 0x67, 0))
207
Andrew Boiea705eae2017-11-03 10:39:08 -0700208 if num_entries == 7:
209 # Selector 0x28: code descriptor, dpl = 3
210 fp.write(create_code_data_entry(0, 0xFFFFF, 3,
Anas Nashif72565532017-12-12 08:19:25 -0500211 FLAGS_GRAN, ACCESS_EX | ACCESS_RW))
Andrew Boie424e9932017-08-30 14:06:30 -0700212
Andrew Boiea705eae2017-11-03 10:39:08 -0700213 # Selector 0x30: data descriptor, dpl = 3
214 fp.write(create_code_data_entry(0, 0xFFFFF, 3,
Anas Nashif72565532017-12-12 08:19:25 -0500215 FLAGS_GRAN, ACCESS_RW))
Andrew Boie424e9932017-08-30 14:06:30 -0700216
Andrew Boiebc666ae2017-07-14 16:35:17 -0700217
Andrew Boie08c29132017-07-14 15:29:17 -0700218if __name__ == "__main__":
219 main()