blob: 78c864fa5275c543f009a1bbd348bf36d5700120 [file] [log] [blame]
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -08001/*
2 * elf header parsing.
3 *
4 * Copyright (C) 2013 Google, Inc.
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; version 2 of the License.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA, 02110-1301 USA
18 */
19
20#include <stdio.h>
21#include <stdlib.h>
22#include <string.h>
23
24#include "elf.h"
25#include "common.h"
26#include "cbfs.h"
27
28/*
29 * Short form: this is complicated, but we've tried making it simple
30 * and we keep hitting problems with our ELF parsing.
31 *
32 * The ELF parsing situation has always been a bit tricky. In fact,
33 * we (and most others) have been getting it wrong in small ways for
34 * years. Recently this has caused real trouble for the ARM V8 build.
35 * In this file we attempt to finally get it right for all variations
36 * of endian-ness and word size and target architectures and
37 * architectures we might get run on. Phew!. To do this we borrow a
38 * page from the FreeBSD NFS xdr model (see elf_ehdr and elf_phdr),
39 * the Plan 9 endianness functions (see xdr.c), and Go interfaces (see
40 * how we use buffer structs in this file). This ends up being a bit
41 * wordy at the lowest level, but greatly simplifies the elf parsing
42 * code and removes a common source of bugs, namely, forgetting to
43 * flip type endianness when referencing a struct member.
44 *
45 * ELF files can have four combinations of data layout: 32/64, and
46 * big/little endian. Further, to add to the fun, depending on the
47 * word size, the size of the ELF structs varies. The coreboot SELF
48 * format is simpler in theory: it's supposed to be always BE, and the
49 * various struct members allow room for growth: the entry point is
50 * always 64 bits, for example, so the size of a SELF struct is
51 * constant, regardless of target architecture word size. Hence, we
52 * need to do some transformation of the ELF files.
53 *
54 * A given architecture, realistically, only supports one of the four
55 * combinations at a time as the 'native' format. Hence, our code has
56 * been sprinkled with every variation of [nh]to[hn][sll] over the
57 * years. We've never quite gotten it all right, however, and a quick
58 * pass over this code revealed another bug. It's all worked because,
59 * until now, all the working platforms that had CBFS were 32 LE. Even then,
60 * however, bugs crept in: we recently realized that we're not
61 * transforming the entry point to big format when we store into the
62 * SELF image.
63 *
64 * The problem is essentially an XDR operation:
65 * we have something in a foreign format and need to transform it.
66 * It's most like XDR because:
67 * 1) the byte order can be wrong
68 * 2) the word size can be wrong
69 * 3) the size of elements in the stream depends on the value
70 * of other elements in the stream
71 * it's not like XDR because:
72 * 1) the byte order can be right
73 * 2) the word size can be right
74 * 3) the struct members are all on a natural alignment
75 *
76 * Hence, this new approach. To cover word size issues, we *always*
77 * transform the two structs we care about, the file header and
78 * program header, into a native struct in the 64 bit format:
79 *
80 * [32,little] -> [Elf64_Ehdr, Elf64_Phdr]
81 * [64,little] -> [Elf64_Ehdr, Elf64_Phdr]
82 * [32,big] -> [Elf64_Ehdr, Elf64_Phdr]
83 * [64,big] -> [Elf64_Ehdr, Elf64_Phdr]
84 * Then we just use those structs, and all the need for inline ntoh* goes away,
85 * as well as all the chances for error.
86 * This works because all the SELF structs have fields large enough for
87 * the largest ELF 64 struct members, and all the Elf64 struct members
88 * are at least large enough for all ELF 32 struct members.
89 * We end up with one function to do all our ELF parsing, and two functions
90 * to transform the headers. For the put case, we also have
91 * XDR functions, and hopefully we'll never again spend 5 years with the
92 * wrong endian-ness on an output value :-)
93 * This should work for all word sizes and endianness we hope to target.
94 * I *really* don't want to be here for 128 bit addresses.
95 *
96 * The parse functions are called with a pointer to an input buffer
97 * struct. One might ask: are there enough bytes in the input buffer?
98 * We know there need to be at *least* sizeof(Elf32_Ehdr) +
99 * sizeof(Elf32_Phdr) bytes. Realistically, there has to be some data
100 * too. If we start to worry, though we have not in the past, we
101 * might apply the simple test: the input buffer needs to be at least
102 * sizeof(Elf64_Ehdr) + sizeof(Elf64_Phdr) bytes because, even if it's
103 * ELF 32, there's got to be *some* data! This is not theoretically
104 * accurate but it is actually good enough in practice. It allows the
105 * header transformation code to ignore the possibility of underrun.
106 *
107 * We also must accommodate different ELF files, and hence formats,
108 * in the same cbfs invocation. We might load a 64-bit payload
109 * on a 32-bit machine; we might even have a mixed armv7/armv8
110 * SOC or even a system with an x86/ARM!
111 *
112 * A possibly problematic (though unlikely to be so) assumption
113 * is that we expect the BIOS to remain in the lowest 32 bits
114 * of the physical address space. Since ARMV8 has standardized
115 * on that, and x86_64 also has, this seems a safe assumption.
116 *
117 * To repeat, ELF structs are different sizes because ELF struct
118 * members are different sizes, depending on values in the ELF file
119 * header. For this we use the functions defined in xdr.c, which
120 * consume bytes, convert the endianness, and advance the data pointer
121 * in the buffer struct.
122 */
123
124/* Get the ident array, so we can figure out
125 * endian-ness, word size, and in future other useful
126 * parameters
127 */
128static void
129elf_eident(struct buffer *input, Elf64_Ehdr *ehdr)
130{
Aaron Durbina983cea2014-03-04 22:08:05 -0600131 bgets(input, ehdr->e_ident, sizeof(ehdr->e_ident));
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800132}
133
134
/*
 * Verify that the byte range [offset, offset + size) lies inside buffer b.
 *
 * b:      buffer the range must fit in
 * offset: start of the range, relative to the start of b
 * size:   length of the range in bytes
 * desc:   human-readable name of the range, used in the error message
 *
 * A zero-length range is always accepted, whatever the offset.
 * Returns 0 when the range fits, or -1 after logging an error when it
 * does not.
 */
static int
check_size(const struct buffer *b, size_t offset, size_t size, const char *desc)
{
	if (size == 0)
		return 0;

	const size_t avail = buffer_size(b);

	/* Compare size against the room left after offset rather than
	 * computing offset + size: the sum can wrap around for hostile
	 * header values and slip past the check.
	 */
	if (offset >= avail || size > avail - offset) {
		ERROR("The file is not large enough for the '%s'. "
		      "%zu bytes @ offset %zu, input %zu bytes.\n",
		      desc, size, offset, avail);
		return -1;
	}
	return 0;
}
149
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800150static void
151elf_ehdr(struct buffer *input, Elf64_Ehdr *ehdr, struct xdr *xdr, int bit64)
152{
153 ehdr->e_type = xdr->get16(input);
154 ehdr->e_machine = xdr->get16(input);
155 ehdr->e_version = xdr->get32(input);
156 if (bit64){
157 ehdr->e_entry = xdr->get64(input);
158 ehdr->e_phoff = xdr->get64(input);
159 ehdr->e_shoff = xdr->get64(input);
160 } else {
161 ehdr->e_entry = xdr->get32(input);
162 ehdr->e_phoff = xdr->get32(input);
163 ehdr->e_shoff = xdr->get32(input);
164 }
165 ehdr->e_flags = xdr->get32(input);
166 ehdr->e_ehsize = xdr->get16(input);
167 ehdr->e_phentsize = xdr->get16(input);
168 ehdr->e_phnum = xdr->get16(input);
169 ehdr->e_shentsize = xdr->get16(input);
170 ehdr->e_shnum = xdr->get16(input);
171 ehdr->e_shstrndx = xdr->get16(input);
172}
173
174static void
175elf_phdr(struct buffer *pinput, Elf64_Phdr *phdr,
176 int entsize, struct xdr *xdr, int bit64)
177{
178 /*
179 * The entsize need not be sizeof(*phdr).
180 * Hence, it is easier to keep a copy of the input,
181 * as the xdr functions may not advance the input
182 * pointer the full entsize; rather than get tricky
183 * we just advance it below.
184 */
Aaron Durbina983cea2014-03-04 22:08:05 -0600185 struct buffer input;
186 buffer_clone(&input, pinput);
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800187 if (bit64){
188 phdr->p_type = xdr->get32(&input);
189 phdr->p_flags = xdr->get32(&input);
190 phdr->p_offset = xdr->get64(&input);
191 phdr->p_vaddr = xdr->get64(&input);
192 phdr->p_paddr = xdr->get64(&input);
193 phdr->p_filesz = xdr->get64(&input);
194 phdr->p_memsz = xdr->get64(&input);
195 phdr->p_align = xdr->get64(&input);
196 } else {
197 phdr->p_type = xdr->get32(&input);
198 phdr->p_offset = xdr->get32(&input);
199 phdr->p_vaddr = xdr->get32(&input);
200 phdr->p_paddr = xdr->get32(&input);
201 phdr->p_filesz = xdr->get32(&input);
202 phdr->p_memsz = xdr->get32(&input);
203 phdr->p_flags = xdr->get32(&input);
204 phdr->p_align = xdr->get32(&input);
205 }
Aaron Durbina983cea2014-03-04 22:08:05 -0600206 buffer_seek(pinput, entsize);
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800207}
208
209static void
210elf_shdr(struct buffer *pinput, Elf64_Shdr *shdr,
211 int entsize, struct xdr *xdr, int bit64)
212{
213 /*
214 * The entsize need not be sizeof(*shdr).
215 * Hence, it is easier to keep a copy of the input,
216 * as the xdr functions may not advance the input
217 * pointer the full entsize; rather than get tricky
218 * we just advance it below.
219 */
220 struct buffer input = *pinput;
221 if (bit64){
222 shdr->sh_name = xdr->get32(&input);
223 shdr->sh_type = xdr->get32(&input);
224 shdr->sh_flags = xdr->get64(&input);
225 shdr->sh_addr = xdr->get64(&input);
226 shdr->sh_offset = xdr->get64(&input);
227 shdr->sh_size= xdr->get64(&input);
228 shdr->sh_link = xdr->get32(&input);
229 shdr->sh_info = xdr->get32(&input);
230 shdr->sh_addralign = xdr->get64(&input);
231 shdr->sh_entsize = xdr->get64(&input);
232 } else {
233 shdr->sh_name = xdr->get32(&input);
234 shdr->sh_type = xdr->get32(&input);
235 shdr->sh_flags = xdr->get32(&input);
236 shdr->sh_addr = xdr->get32(&input);
237 shdr->sh_offset = xdr->get32(&input);
238 shdr->sh_size = xdr->get32(&input);
239 shdr->sh_link = xdr->get32(&input);
240 shdr->sh_info = xdr->get32(&input);
241 shdr->sh_addralign = xdr->get32(&input);
242 shdr->sh_entsize = xdr->get32(&input);
243 }
Aaron Durbina983cea2014-03-04 22:08:05 -0600244 buffer_seek(pinput, entsize);
245}
246
247static Elf64_Phdr *
248phdr_read(const struct buffer *in, Elf64_Ehdr *ehdr, struct xdr *xdr, int bit64)
249{
250 struct buffer b;
251 Elf64_Phdr *phdr;
252 int i;
253
254 /* cons up an input buffer for the headers.
255 * Note that the program headers can be anywhere,
256 * per the ELF spec, You'd be surprised how many ELF
257 * readers miss this little detail.
258 */
259 buffer_splice(&b, in, ehdr->e_phoff, ehdr->e_phentsize * ehdr->e_phnum);
260 if (check_size(in, ehdr->e_phoff, buffer_size(&b), "program headers"))
261 return NULL;
262
263 /* gather up all the phdrs.
264 * We do them all at once because there is more
265 * than one loop over all the phdrs.
266 */
267 phdr = calloc(sizeof(*phdr), ehdr->e_phnum);
268 for (i = 0; i < ehdr->e_phnum; i++)
269 elf_phdr(&b, &phdr[i], ehdr->e_phentsize, xdr, bit64);
270
271 return phdr;
272}
273
274static Elf64_Shdr *
275shdr_read(const struct buffer *in, Elf64_Ehdr *ehdr, struct xdr *xdr, int bit64)
276{
277 struct buffer b;
278 Elf64_Shdr *shdr;
279 int i;
280
281 /* cons up an input buffer for the section headers.
282 * Note that the section headers can be anywhere,
283 * per the ELF spec, You'd be surprised how many ELF
284 * readers miss this little detail.
285 */
286 buffer_splice(&b, in, ehdr->e_shoff, ehdr->e_shentsize * ehdr->e_shnum);
287 if (check_size(in, ehdr->e_shoff, buffer_size(&b), "section headers"))
288 return NULL;
289
290 /* gather up all the shdrs. */
291 shdr = calloc(sizeof(*shdr), ehdr->e_shnum);
292 for (i = 0; i < ehdr->e_shnum; i++)
293 elf_shdr(&b, &shdr[i], ehdr->e_shentsize, xdr, bit64);
294
295 return shdr;
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800296}
297
298/* Get the headers from the buffer.
299 * Return -1 in the event of an error.
300 * The section headers are optional; if NULL
301 * is passed in for pshdr they won't be parsed.
302 * We don't (yet) make payload parsing optional
303 * because we've never seen a use case.
304 */
305int
306elf_headers(const struct buffer *pinput,
Alexandru Gagniuc35850ae2014-02-02 22:37:28 -0600307 uint32_t arch,
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800308 Elf64_Ehdr *ehdr,
309 Elf64_Phdr **pphdr,
310 Elf64_Shdr **pshdr)
311{
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800312 struct xdr *xdr = &xdr_le;
313 int bit64 = 0;
Aaron Durbina983cea2014-03-04 22:08:05 -0600314 struct buffer input;
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800315
Aaron Durbina983cea2014-03-04 22:08:05 -0600316 buffer_clone(&input, pinput);
317
318 if (!iself(buffer_get(pinput))) {
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800319 ERROR("The stage file is not in ELF format!\n");
320 return -1;
321 }
322
323 elf_eident(&input, ehdr);
324 bit64 = ehdr->e_ident[EI_CLASS] == ELFCLASS64;
325 /* Assume LE unless we are sure otherwise.
326 * We're not going to take on the task of
327 * fully validating the ELF file. That way
328 * lies madness.
329 */
330 if (ehdr->e_ident[EI_DATA] == ELFDATA2MSB)
331 xdr = &xdr_be;
332
333 elf_ehdr(&input, ehdr, xdr, bit64);
334
335 // The tool may work in architecture-independent way.
336 if (arch != CBFS_ARCHITECTURE_UNKNOWN &&
337 !((ehdr->e_machine == EM_ARM) && (arch == CBFS_ARCHITECTURE_ARMV7)) &&
338 !((ehdr->e_machine == EM_386) && (arch == CBFS_ARCHITECTURE_X86))) {
339 ERROR("The stage file has the wrong architecture\n");
340 return -1;
341 }
342
Aaron Durbina983cea2014-03-04 22:08:05 -0600343 *pphdr = phdr_read(pinput, ehdr, xdr, bit64);
344 if (*pphdr == NULL)
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800345 return -1;
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800346
347 if (!pshdr)
348 return 0;
349
Aaron Durbina983cea2014-03-04 22:08:05 -0600350 *pshdr = shdr_read(pinput, ehdr, xdr, bit64);
351 if (*pshdr == NULL)
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800352 return -1;
Ronald G. Minnicha8a133d2013-12-30 13:16:18 -0800353
354 return 0;
355}