blob: 0b05255204c9a7151c49611f74e1c674ab27349f [file] [log] [blame]
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -08001/*
2 * elf header parsing.
3 *
4 * Copyright (C) 2013 Google, Inc.
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; version 2 of the License.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA, 02110-1301 USA
18 */
19
20#include <stdio.h>
21#include <stdlib.h>
22#include <string.h>
23
Aaron Durbin54ef3062014-03-05 12:12:09 -060024#include "elfparsing.h"
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -080025#include "common.h"
26#include "cbfs.h"
27
28/*
29 * Short form: this is complicated, but we've tried making it simple
30 * and we keep hitting problems with our ELF parsing.
31 *
32 * The ELF parsing situation has always been a bit tricky. In fact,
33 * we (and most others) have been getting it wrong in small ways for
34 * years. Recently this has caused real trouble for the ARM V8 build.
35 * In this file we attempt to finally get it right for all variations
36 * of endian-ness and word size and target architectures and
 * architectures we might get run on. Phew! To do this we borrow a
38 * page from the FreeBSD NFS xdr model (see elf_ehdr and elf_phdr),
39 * the Plan 9 endianness functions (see xdr.c), and Go interfaces (see
40 * how we use buffer structs in this file). This ends up being a bit
41 * wordy at the lowest level, but greatly simplifies the elf parsing
42 * code and removes a common source of bugs, namely, forgetting to
43 * flip type endianness when referencing a struct member.
44 *
45 * ELF files can have four combinations of data layout: 32/64, and
46 * big/little endian. Further, to add to the fun, depending on the
47 * word size, the size of the ELF structs varies. The coreboot SELF
48 * format is simpler in theory: it's supposed to be always BE, and the
49 * various struct members allow room for growth: the entry point is
50 * always 64 bits, for example, so the size of a SELF struct is
51 * constant, regardless of target architecture word size. Hence, we
52 * need to do some transformation of the ELF files.
53 *
54 * A given architecture, realistically, only supports one of the four
55 * combinations at a time as the 'native' format. Hence, our code has
56 * been sprinkled with every variation of [nh]to[hn][sll] over the
57 * years. We've never quite gotten it all right, however, and a quick
58 * pass over this code revealed another bug. It's all worked because,
59 * until now, all the working platforms that had CBFS were 32 LE. Even then,
60 * however, bugs crept in: we recently realized that we're not
61 * transforming the entry point to big format when we store into the
62 * SELF image.
63 *
64 * The problem is essentially an XDR operation:
65 * we have something in a foreign format and need to transform it.
66 * It's most like XDR because:
67 * 1) the byte order can be wrong
68 * 2) the word size can be wrong
69 * 3) the size of elements in the stream depends on the value
70 * of other elements in the stream
71 * it's not like XDR because:
72 * 1) the byte order can be right
73 * 2) the word size can be right
74 * 3) the struct members are all on a natural alignment
75 *
76 * Hence, this new approach. To cover word size issues, we *always*
77 * transform the two structs we care about, the file header and
78 * program header, into a native struct in the 64 bit format:
79 *
80 * [32,little] -> [Elf64_Ehdr, Elf64_Phdr]
81 * [64,little] -> [Elf64_Ehdr, Elf64_Phdr]
82 * [32,big] -> [Elf64_Ehdr, Elf64_Phdr]
83 * [64,big] -> [Elf64_Ehdr, Elf64_Phdr]
84 * Then we just use those structs, and all the need for inline ntoh* goes away,
85 * as well as all the chances for error.
86 * This works because all the SELF structs have fields large enough for
87 * the largest ELF 64 struct members, and all the Elf64 struct members
88 * are at least large enough for all ELF 32 struct members.
89 * We end up with one function to do all our ELF parsing, and two functions
90 * to transform the headers. For the put case, we also have
91 * XDR functions, and hopefully we'll never again spend 5 years with the
92 * wrong endian-ness on an output value :-)
93 * This should work for all word sizes and endianness we hope to target.
94 * I *really* don't want to be here for 128 bit addresses.
95 *
96 * The parse functions are called with a pointer to an input buffer
97 * struct. One might ask: are there enough bytes in the input buffer?
98 * We know there need to be at *least* sizeof(Elf32_Ehdr) +
99 * sizeof(Elf32_Phdr) bytes. Realistically, there has to be some data
100 * too. If we start to worry, though we have not in the past, we
101 * might apply the simple test: the input buffer needs to be at least
102 * sizeof(Elf64_Ehdr) + sizeof(Elf64_Phdr) bytes because, even if it's
103 * ELF 32, there's got to be *some* data! This is not theoretically
104 * accurate but it is actually good enough in practice. It allows the
105 * header transformation code to ignore the possibility of underrun.
106 *
 * We also must accommodate different ELF files, and hence formats,
108 * in the same cbfs invocation. We might load a 64-bit payload
109 * on a 32-bit machine; we might even have a mixed armv7/armv8
110 * SOC or even a system with an x86/ARM!
111 *
112 * A possibly problematic (though unlikely to be so) assumption
113 * is that we expect the BIOS to remain in the lowest 32 bits
114 * of the physical address space. Since ARMV8 has standardized
115 * on that, and x86_64 also has, this seems a safe assumption.
116 *
117 * To repeat, ELF structs are different sizes because ELF struct
118 * members are different sizes, depending on values in the ELF file
119 * header. For this we use the functions defined in xdr.c, which
120 * consume bytes, convert the endianness, and advance the data pointer
121 * in the buffer struct.
122 */
123
Aaron Durbinaa8784c2014-03-05 12:01:36 -0600124
125static int iself(const void *input)
126{
127 const Elf32_Ehdr *ehdr = input;
128 return !memcmp(ehdr->e_ident, ELFMAG, 4);
129}
130
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800131/* Get the ident array, so we can figure out
132 * endian-ness, word size, and in future other useful
133 * parameters
134 */
135static void
136elf_eident(struct buffer *input, Elf64_Ehdr *ehdr)
137{
Aaron Durbina983cea2014-03-04 22:08:05 -0600138 bgets(input, ehdr->e_ident, sizeof(ehdr->e_ident));
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800139}
140
141
/*
 * Verify that a region of 'size' bytes starting at 'offset' lies entirely
 * inside buffer 'b'.
 *
 * b      - buffer whose size bounds the region
 * offset - start of the region, in bytes
 * size   - length of the region in bytes; an empty region always passes
 * desc   - human-readable name of the region, used in the error message
 *
 * Returns 0 when the region fits and -1, after logging an error, when it
 * does not.
 */
static int
check_size(const struct buffer *b, size_t offset, size_t size, const char *desc)
{
	size_t avail;

	if (size == 0)
		return 0;

	avail = buffer_size(b);

	/*
	 * Compare 'size' against the space remaining after 'offset' rather
	 * than computing offset + size, which could wrap around and make an
	 * out-of-range region look valid.
	 */
	if (offset >= avail || size > avail - offset) {
		ERROR("The file is not large enough for the '%s'. "
		      "%zu bytes @ offset %zu, input %zu bytes.\n",
		      desc, size, offset, avail);
		return -1;
	}
	return 0;
}
156
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800157static void
158elf_ehdr(struct buffer *input, Elf64_Ehdr *ehdr, struct xdr *xdr, int bit64)
159{
160 ehdr->e_type = xdr->get16(input);
161 ehdr->e_machine = xdr->get16(input);
162 ehdr->e_version = xdr->get32(input);
163 if (bit64){
164 ehdr->e_entry = xdr->get64(input);
165 ehdr->e_phoff = xdr->get64(input);
166 ehdr->e_shoff = xdr->get64(input);
167 } else {
168 ehdr->e_entry = xdr->get32(input);
169 ehdr->e_phoff = xdr->get32(input);
170 ehdr->e_shoff = xdr->get32(input);
171 }
172 ehdr->e_flags = xdr->get32(input);
173 ehdr->e_ehsize = xdr->get16(input);
174 ehdr->e_phentsize = xdr->get16(input);
175 ehdr->e_phnum = xdr->get16(input);
176 ehdr->e_shentsize = xdr->get16(input);
177 ehdr->e_shnum = xdr->get16(input);
178 ehdr->e_shstrndx = xdr->get16(input);
179}
180
181static void
182elf_phdr(struct buffer *pinput, Elf64_Phdr *phdr,
183 int entsize, struct xdr *xdr, int bit64)
184{
185 /*
186 * The entsize need not be sizeof(*phdr).
187 * Hence, it is easier to keep a copy of the input,
188 * as the xdr functions may not advance the input
189 * pointer the full entsize; rather than get tricky
190 * we just advance it below.
191 */
Aaron Durbina983cea2014-03-04 22:08:05 -0600192 struct buffer input;
193 buffer_clone(&input, pinput);
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800194 if (bit64){
195 phdr->p_type = xdr->get32(&input);
196 phdr->p_flags = xdr->get32(&input);
197 phdr->p_offset = xdr->get64(&input);
198 phdr->p_vaddr = xdr->get64(&input);
199 phdr->p_paddr = xdr->get64(&input);
200 phdr->p_filesz = xdr->get64(&input);
201 phdr->p_memsz = xdr->get64(&input);
202 phdr->p_align = xdr->get64(&input);
203 } else {
204 phdr->p_type = xdr->get32(&input);
205 phdr->p_offset = xdr->get32(&input);
206 phdr->p_vaddr = xdr->get32(&input);
207 phdr->p_paddr = xdr->get32(&input);
208 phdr->p_filesz = xdr->get32(&input);
209 phdr->p_memsz = xdr->get32(&input);
210 phdr->p_flags = xdr->get32(&input);
211 phdr->p_align = xdr->get32(&input);
212 }
Aaron Durbina983cea2014-03-04 22:08:05 -0600213 buffer_seek(pinput, entsize);
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800214}
215
216static void
217elf_shdr(struct buffer *pinput, Elf64_Shdr *shdr,
218 int entsize, struct xdr *xdr, int bit64)
219{
220 /*
221 * The entsize need not be sizeof(*shdr).
222 * Hence, it is easier to keep a copy of the input,
223 * as the xdr functions may not advance the input
224 * pointer the full entsize; rather than get tricky
225 * we just advance it below.
226 */
227 struct buffer input = *pinput;
228 if (bit64){
229 shdr->sh_name = xdr->get32(&input);
230 shdr->sh_type = xdr->get32(&input);
231 shdr->sh_flags = xdr->get64(&input);
232 shdr->sh_addr = xdr->get64(&input);
233 shdr->sh_offset = xdr->get64(&input);
234 shdr->sh_size= xdr->get64(&input);
235 shdr->sh_link = xdr->get32(&input);
236 shdr->sh_info = xdr->get32(&input);
237 shdr->sh_addralign = xdr->get64(&input);
238 shdr->sh_entsize = xdr->get64(&input);
239 } else {
240 shdr->sh_name = xdr->get32(&input);
241 shdr->sh_type = xdr->get32(&input);
242 shdr->sh_flags = xdr->get32(&input);
243 shdr->sh_addr = xdr->get32(&input);
244 shdr->sh_offset = xdr->get32(&input);
245 shdr->sh_size = xdr->get32(&input);
246 shdr->sh_link = xdr->get32(&input);
247 shdr->sh_info = xdr->get32(&input);
248 shdr->sh_addralign = xdr->get32(&input);
249 shdr->sh_entsize = xdr->get32(&input);
250 }
Aaron Durbina983cea2014-03-04 22:08:05 -0600251 buffer_seek(pinput, entsize);
252}
253
254static Elf64_Phdr *
255phdr_read(const struct buffer *in, Elf64_Ehdr *ehdr, struct xdr *xdr, int bit64)
256{
257 struct buffer b;
258 Elf64_Phdr *phdr;
259 int i;
260
261 /* cons up an input buffer for the headers.
262 * Note that the program headers can be anywhere,
263 * per the ELF spec, You'd be surprised how many ELF
264 * readers miss this little detail.
265 */
266 buffer_splice(&b, in, ehdr->e_phoff, ehdr->e_phentsize * ehdr->e_phnum);
267 if (check_size(in, ehdr->e_phoff, buffer_size(&b), "program headers"))
268 return NULL;
269
270 /* gather up all the phdrs.
271 * We do them all at once because there is more
272 * than one loop over all the phdrs.
273 */
274 phdr = calloc(sizeof(*phdr), ehdr->e_phnum);
275 for (i = 0; i < ehdr->e_phnum; i++)
276 elf_phdr(&b, &phdr[i], ehdr->e_phentsize, xdr, bit64);
277
278 return phdr;
279}
280
281static Elf64_Shdr *
282shdr_read(const struct buffer *in, Elf64_Ehdr *ehdr, struct xdr *xdr, int bit64)
283{
284 struct buffer b;
285 Elf64_Shdr *shdr;
286 int i;
287
288 /* cons up an input buffer for the section headers.
289 * Note that the section headers can be anywhere,
290 * per the ELF spec, You'd be surprised how many ELF
291 * readers miss this little detail.
292 */
293 buffer_splice(&b, in, ehdr->e_shoff, ehdr->e_shentsize * ehdr->e_shnum);
294 if (check_size(in, ehdr->e_shoff, buffer_size(&b), "section headers"))
295 return NULL;
296
297 /* gather up all the shdrs. */
298 shdr = calloc(sizeof(*shdr), ehdr->e_shnum);
299 for (i = 0; i < ehdr->e_shnum; i++)
300 elf_shdr(&b, &shdr[i], ehdr->e_shentsize, xdr, bit64);
301
302 return shdr;
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800303}
304
305/* Get the headers from the buffer.
306 * Return -1 in the event of an error.
307 * The section headers are optional; if NULL
308 * is passed in for pshdr they won't be parsed.
309 * We don't (yet) make payload parsing optional
310 * because we've never seen a use case.
311 */
312int
313elf_headers(const struct buffer *pinput,
Alexandru Gagniuc35850ae2014-02-02 22:37:28 -0600314 uint32_t arch,
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800315 Elf64_Ehdr *ehdr,
316 Elf64_Phdr **pphdr,
317 Elf64_Shdr **pshdr)
318{
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800319 struct xdr *xdr = &xdr_le;
320 int bit64 = 0;
Aaron Durbina983cea2014-03-04 22:08:05 -0600321 struct buffer input;
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800322
Aaron Durbina983cea2014-03-04 22:08:05 -0600323 buffer_clone(&input, pinput);
324
325 if (!iself(buffer_get(pinput))) {
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800326 ERROR("The stage file is not in ELF format!\n");
327 return -1;
328 }
329
330 elf_eident(&input, ehdr);
331 bit64 = ehdr->e_ident[EI_CLASS] == ELFCLASS64;
332 /* Assume LE unless we are sure otherwise.
333 * We're not going to take on the task of
334 * fully validating the ELF file. That way
335 * lies madness.
336 */
337 if (ehdr->e_ident[EI_DATA] == ELFDATA2MSB)
338 xdr = &xdr_be;
339
340 elf_ehdr(&input, ehdr, xdr, bit64);
341
342 // The tool may work in architecture-independent way.
343 if (arch != CBFS_ARCHITECTURE_UNKNOWN &&
344 !((ehdr->e_machine == EM_ARM) && (arch == CBFS_ARCHITECTURE_ARMV7)) &&
345 !((ehdr->e_machine == EM_386) && (arch == CBFS_ARCHITECTURE_X86))) {
346 ERROR("The stage file has the wrong architecture\n");
347 return -1;
348 }
349
Aaron Durbina983cea2014-03-04 22:08:05 -0600350 *pphdr = phdr_read(pinput, ehdr, xdr, bit64);
351 if (*pphdr == NULL)
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800352 return -1;
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800353
354 if (!pshdr)
355 return 0;
356
Aaron Durbina983cea2014-03-04 22:08:05 -0600357 *pshdr = shdr_read(pinput, ehdr, xdr, bit64);
358 if (*pshdr == NULL)
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800359 return -1;
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800360
361 return 0;
362}