blob: c3b0f9b7ee56bebf8981e6affcd1291fbd0fcef3 [file] [log] [blame]
Aaron Durbin4fde5a62014-03-07 15:11:53 -06001/*
2 ;* Copyright (C) 2014 Google, Inc.
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; version 2 of the License.
7 *
8 * This program is distributed in the hope that it will be useful,
9 * but WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 * GNU General Public License for more details.
12 *
13 * You should have received a copy of the GNU General Public License
14 * along with this program; if not, write to the Free Software
15 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA, 02110-1301 USA
16 */
17
18#include <stdio.h>
19#include <stdlib.h>
20#include <string.h>
21
22#include "elfparsing.h"
23#include "rmodule.h"
24#include "../../src/include/rmodule-defs.h"
25
26struct rmod_context;
27
28struct arch_ops {
29 int arch;
30 /* Determine if relocation is a valid type for the architecture. */
31 int (*valid_type)(struct rmod_context *ctx, Elf64_Rela *rel);
32 /* Determine if relocation should be emitted. */
33 int (*should_emit)(struct rmod_context *ctx, Elf64_Rela *rel);
34};
35
36struct rmod_context {
37 /* Ops to process relocations. */
38 struct arch_ops *ops;
39
40 /* endian conversion ops */
41 struct xdr *xdr;
42
43 /* Parsed ELF sturcture. */
44 struct parsed_elf pelf;
45 /* Program segment. */
46 Elf64_Phdr *phdr;
47
48 /* Collection of relocation addresses fixup in the module. */
49 Elf64_Xword nrelocs;
50 Elf64_Addr *emitted_relocs;
51
52 /* The following fields are addresses within the linked program. */
53 Elf64_Addr link_addr;
54 Elf64_Addr entry;
55 Elf64_Addr parameters_begin;
56 Elf64_Addr parameters_end;
57 Elf64_Addr bss_begin;
58 Elf64_Addr bss_end;
59 Elf64_Xword size;
60};
61
62/*
63 * Architecture specific support operations.
64 */
65static int valid_reloc_386(struct rmod_context *ctx, Elf64_Rela *rel)
66{
67 int type;
68
69 type = ELF64_R_TYPE(rel->r_info);
70
71 /* Only these 2 relocations are expected to be found. */
72 return (type == R_386_32 || type == R_386_PC32);
73}
74
75static int should_emit_386(struct rmod_context *ctx, Elf64_Rela *rel)
76{
77 int type;
78
79 type = ELF64_R_TYPE(rel->r_info);
80
81 /* R_386_32 relocations are absolute. Must emit these. */
82 return (type == R_386_32);
83}
84
Aaron Durbin785e47b2014-03-20 11:08:02 -050085static int valid_reloc_arm(struct rmod_context *ctx, Elf64_Rela *rel)
86{
87 int type;
88
89 type = ELF64_R_TYPE(rel->r_info);
90
Furquan Shaikhc4f08f72014-07-23 13:42:22 -070091 /* Only these 6 relocations are expected to be found. */
Aaron Durbin785e47b2014-03-20 11:08:02 -050092 return (type == R_ARM_ABS32 || type == R_ARM_THM_PC22 ||
Furquan Shaikhc4f08f72014-07-23 13:42:22 -070093 type == R_ARM_THM_JUMP24 || type == R_ARM_V4BX ||
94 type == R_ARM_CALL || type == R_ARM_JUMP24);
Aaron Durbin785e47b2014-03-20 11:08:02 -050095}
96
97static int should_emit_arm(struct rmod_context *ctx, Elf64_Rela *rel)
98{
99 int type;
100
101 type = ELF64_R_TYPE(rel->r_info);
102
103 /* R_ARM_ABS32 relocations are absolute. Must emit these. */
104 return (type == R_ARM_ABS32);
105}
106
Furquan Shaikhd2338ba2014-08-26 15:21:15 -0700107static int valid_reloc_aarch64(struct rmod_context *ctx, Elf64_Rela *rel)
108{
109 int type;
110
111 type = ELF64_R_TYPE(rel->r_info);
112
113 return (type == R_AARCH64_ADR_PREL_PG_HI21 ||
114 type == R_AARCH64_ADD_ABS_LO12_NC ||
115 type == R_AARCH64_JUMP26 ||
116 type == R_AARCH64_LDST32_ABS_LO12_NC ||
117 type == R_AARCH64_CALL26 ||
118 type == R_AARCH64_ABS64 ||
119 type == R_AARCH64_LD_PREL_LO19 ||
120 type == R_AARCH64_ADR_PREL_LO21);
121}
122
123static int should_emit_aarch64(struct rmod_context *ctx, Elf64_Rela *rel)
124{
125 int type;
126
127 type = ELF64_R_TYPE(rel->r_info);
128
129 return (type == R_AARCH64_ABS64);
130}
131
Aaron Durbin4fde5a62014-03-07 15:11:53 -0600132static struct arch_ops reloc_ops[] = {
133 {
134 .arch = EM_386,
135 .valid_type = valid_reloc_386,
136 .should_emit = should_emit_386,
137 },
Aaron Durbin785e47b2014-03-20 11:08:02 -0500138 {
139 .arch = EM_ARM,
140 .valid_type = valid_reloc_arm,
141 .should_emit = should_emit_arm,
142 },
Furquan Shaikhd2338ba2014-08-26 15:21:15 -0700143 {
144 .arch = EM_AARCH64,
145 .valid_type = valid_reloc_aarch64,
146 .should_emit = should_emit_aarch64,
147 },
Aaron Durbin4fde5a62014-03-07 15:11:53 -0600148};
149
150/*
151 * Relocation processing loops.
152 */
153
154static int for_each_reloc(struct rmod_context *ctx, int do_emit)
155{
156 Elf64_Half i;
157 struct parsed_elf *pelf = &ctx->pelf;
158
159 for (i = 0; i < pelf->ehdr.e_shnum; i++) {
160 Elf64_Shdr *shdr;
161 Elf64_Rela *relocs;
162 Elf64_Xword nrelocs;
163 Elf64_Xword j;
164
165 relocs = pelf->relocs[i];
166
167 /* No relocations in this section. */
168 if (relocs == NULL)
169 continue;
170
171 shdr = &pelf->shdr[i];
172 nrelocs = shdr->sh_size / shdr->sh_entsize;
173
174 for (j = 0; j < nrelocs; j++) {
175 Elf64_Rela *r = &relocs[j];
176
177 if (!ctx->ops->valid_type(ctx, r)) {
178 ERROR("Invalid reloc type: %u\n",
179 (unsigned int)ELF64_R_TYPE(r->r_info));
180 return -1;
181 }
182
183 if (ctx->ops->should_emit(ctx, r)) {
184 int n = ctx->nrelocs;
185 if (do_emit)
186 ctx->emitted_relocs[n] = r->r_offset;
187 ctx->nrelocs++;
188 }
189 }
190 }
191
192 return 0;
193}
194
195static int find_program_segment(struct rmod_context *ctx)
196{
197 int i;
198 int nsegments;
199 struct parsed_elf *pelf;
200 Elf64_Phdr *phdr;
201
202 pelf = &ctx->pelf;
203
204 /* There should only be a single loadable segment. */
205 nsegments = 0;
206 for (i = 0; i < pelf->ehdr.e_phnum; i++) {
207 if (pelf->phdr[i].p_type != PT_LOAD)
208 continue;
209 phdr = &pelf->phdr[i];
210 nsegments++;
211 }
212
213 if (nsegments != 1) {
214 ERROR("Unexepcted number of loadable segments: %d.\n",
215 nsegments);
216 return -1;
217 }
218
219 INFO("Segment at 0x%0llx, file size 0x%0llx, mem size 0x%0llx.\n",
220 (long long)phdr->p_vaddr, (long long)phdr->p_filesz,
221 (long long)phdr->p_memsz);
222
223 ctx->phdr = phdr;
224
225 return 0;
226}
227
228static int
229filter_relocation_sections(struct rmod_context *ctx)
230{
231 int i;
232 const char *shstrtab;
233 struct parsed_elf *pelf;
234 const Elf64_Phdr *phdr;
235
236 pelf = &ctx->pelf;
237 phdr = ctx->phdr;
238 shstrtab = buffer_get(pelf->strtabs[pelf->ehdr.e_shstrndx]);
239
240 /*
241 * Find all relocation sections that contain relocation entries
242 * for sections that fall within the bounds of the segment. For
243 * easier processing the pointer to the relocation array for the
244 * sections that don't fall within the loadable program are NULL'd
245 * out.
246 */
247 for (i = 0; i < pelf->ehdr.e_shnum; i++) {
248 Elf64_Shdr *shdr;
249 Elf64_Word sh_info;
250 const char *section_name;
251
252 shdr = &pelf->shdr[i];
253
254 /* Ignore non-relocation sections. */
255 if (shdr->sh_type != SHT_RELA && shdr->sh_type != SHT_REL)
256 continue;
257
258 /* Obtain section which relocations apply. */
259 sh_info = shdr->sh_info;
260 shdr = &pelf->shdr[sh_info];
261
262 section_name = &shstrtab[shdr->sh_name];
263 DEBUG("Relocation section found for '%s' section.\n",
264 section_name);
265
266 /* Do not process relocations for debug sections. */
267 if (strstr(section_name, ".debug") != NULL) {
268 pelf->relocs[i] = NULL;
269 continue;
270 }
271
272 /*
273 * If relocations apply to a non program section ignore the
274 * relocations for future processing.
275 */
276 if (shdr->sh_type != SHT_PROGBITS) {
277 pelf->relocs[i] = NULL;
278 continue;
279 }
280
281 if (shdr->sh_addr < phdr->p_vaddr ||
282 ((shdr->sh_addr + shdr->sh_size) >
283 (phdr->p_vaddr + phdr->p_memsz))) {
284 ERROR("Relocations being applied to section %d not "
285 "within segment region.\n", sh_info);
286 return -1;
287 }
288 }
289
290 return 0;
291}
292
293static int vaddr_cmp(const void *a, const void *b)
294{
295 const Elf64_Addr *pa = a;
296 const Elf64_Addr *pb = b;
297
298 if (*pa < *pb)
299 return -1;
300 if (*pa > *pb)
301 return 1;
302 return 0;
303}
304
305static int collect_relocations(struct rmod_context *ctx)
306{
307 int nrelocs;
308
309 /*
310 * The relocs array in the pelf should only contain relocations that
311 * apply to the program. Count the number relocations. Then collect
312 * them into the allocated buffer.
313 */
314 if (for_each_reloc(ctx, 0))
315 return -1;
316
317 nrelocs = ctx->nrelocs;
318 INFO("%d relocations to be emitted.\n", nrelocs);
Furquan Shaikhb237c102014-08-26 14:59:36 -0700319 if (!nrelocs)
320 return 0;
Aaron Durbin4fde5a62014-03-07 15:11:53 -0600321
322 /* Reset the counter for indexing into the array. */
323 ctx->nrelocs = 0;
324 ctx->emitted_relocs = calloc(nrelocs, sizeof(Elf64_Addr));
325 /* Write out the relocations into the emitted_relocs array. */
326 if (for_each_reloc(ctx, 1))
327 return -1;
328
329 if (ctx->nrelocs != nrelocs) {
330 ERROR("Mismatch counted and emitted relocations: %zu vs %zu.\n",
331 (size_t)nrelocs, (size_t)ctx->nrelocs);
332 return -1;
333 }
334
335 /* Sort the relocations by their address. */
336 qsort(ctx->emitted_relocs, nrelocs, sizeof(Elf64_Addr), vaddr_cmp);
337
338 return 0;
339}
340
341static int
342populate_sym(struct rmod_context *ctx, const char *sym_name, Elf64_Addr *addr,
343 int nsyms, const char *strtab)
344{
345 int i;
346 Elf64_Sym *syms;
347
348 syms = ctx->pelf.syms;
349
350 for (i = 0; i < nsyms; i++) {
351 if (syms[i].st_name == 0)
352 continue;
353 if (strcmp(sym_name, &strtab[syms[i].st_name]))
354 continue;
355 DEBUG("%s -> 0x%llx\n", sym_name, (long long)syms[i].st_value);
356 *addr = syms[i].st_value;
357 return 0;
358 }
359 ERROR("symbol '%s' not found.\n", sym_name);
360 return -1;
361}
362
363static int populate_program_info(struct rmod_context *ctx)
364{
365 int i;
366 const char *strtab;
367 struct parsed_elf *pelf;
368 Elf64_Ehdr *ehdr;
369 int nsyms;
370
371 pelf = &ctx->pelf;
372 ehdr = &pelf->ehdr;
373
374 /* Obtain the string table. */
375 strtab = NULL;
376 for (i = 0; i < ehdr->e_shnum; i++) {
377 if (ctx->pelf.strtabs[i] == NULL)
378 continue;
379 /* Don't use the section headers' string table. */
380 if (i == ehdr->e_shstrndx)
381 continue;
382 strtab = buffer_get(ctx->pelf.strtabs[i]);
383 break;
384 }
385
386 if (strtab == NULL) {
387 ERROR("No string table found.\n");
388 return -1;
389 }
390
391 /* Determine number of symbols. */
392 nsyms = 0;
393 for (i = 0; i < ehdr->e_shnum; i++) {
394 if (pelf->shdr[i].sh_type != SHT_SYMTAB)
395 continue;
396
397 nsyms = pelf->shdr[i].sh_size / pelf->shdr[i].sh_entsize;
398 break;
399 }
400
401 if (populate_sym(ctx, "_module_params_begin", &ctx->parameters_begin,
402 nsyms, strtab))
403 return -1;
404
405 if (populate_sym(ctx, "_module_params_end", &ctx->parameters_end,
406 nsyms, strtab))
407 return -1;
408
409 if (populate_sym(ctx, "_bss", &ctx->bss_begin, nsyms, strtab))
410 return -1;
411
412 if (populate_sym(ctx, "_ebss", &ctx->bss_end, nsyms, strtab))
413 return -1;
414
415 if (populate_sym(ctx, "__rmodule_entry", &ctx->entry, nsyms, strtab))
416 return -1;
417
418 /* Link address is the virtual address of the program segment. */
419 ctx->link_addr = ctx->phdr->p_vaddr;
420
421 /* The program size is the memsz of the program segment. */
422 ctx->size = ctx->phdr->p_memsz;
423
424 return 0;
425}
426
427static int
428add_section(struct elf_writer *ew, struct buffer *data, const char *name,
429 Elf64_Addr addr, Elf64_Word size)
430{
431 Elf64_Shdr shdr;
432 int ret;
433
434 memset(&shdr, 0, sizeof(shdr));
435 if (data != NULL) {
436 shdr.sh_type = SHT_PROGBITS;
437 shdr.sh_flags = SHF_ALLOC | SHF_WRITE | SHF_EXECINSTR;
438 } else {
439 shdr.sh_type = SHT_NOBITS;
440 shdr.sh_flags = SHF_ALLOC;
441 }
442 shdr.sh_addr = addr;
443 shdr.sh_offset = addr;
444 shdr.sh_size = size;
445
446 ret = elf_writer_add_section(ew, &shdr, data, name);
447
448 if (ret)
449 ERROR("Could not add '%s' section.\n", name);
450
451 return ret;
452}
453
454static int
455write_elf(const struct rmod_context *ctx, const struct buffer *in,
456 struct buffer *out)
457{
458 int i;
459 int ret;
460 int bit64;
461 size_t loc;
462 size_t rmod_data_size;
463 struct elf_writer *ew;
464 struct buffer rmod_data;
465 struct buffer rmod_header;
466 struct buffer program;
467 struct buffer relocs;
468 Elf64_Xword total_size;
469 Elf64_Addr addr;
470 Elf64_Ehdr ehdr;
471
472 bit64 = ctx->pelf.ehdr.e_ident[EI_CLASS] == ELFCLASS64;
473
474 /*
475 * 3 sections will be added to the ELF file.
476 * +------------------+
477 * | rmodule header |
478 * +------------------+
479 * | program |
480 * +------------------+
481 * | relocations |
482 * +------------------+
483 */
484
485 /* Create buffer for header and relocations. */
486 rmod_data_size = sizeof(struct rmodule_header);
487 if (bit64)
488 rmod_data_size += ctx->nrelocs * sizeof(Elf64_Addr);
489 else
490 rmod_data_size += ctx->nrelocs * sizeof(Elf32_Addr);
491
492 if (buffer_create(&rmod_data, rmod_data_size, "rmod"))
493 return -1;
494
495 buffer_splice(&rmod_header, &rmod_data,
496 0, sizeof(struct rmodule_header));
497 buffer_clone(&relocs, &rmod_data);
498 buffer_seek(&relocs, sizeof(struct rmodule_header));
499
500 /* Reset current location. */
501 buffer_set_size(&rmod_header, 0);
502 buffer_set_size(&relocs, 0);
503
504 /* Program contents. */
505 buffer_splice(&program, in, ctx->phdr->p_offset, ctx->phdr->p_filesz);
506
507 /* Create ELF writer with modified entry point. */
508 memcpy(&ehdr, &ctx->pelf.ehdr, sizeof(ehdr));
509 ehdr.e_entry = ctx->entry;
510 ew = elf_writer_init(&ehdr);
511
512 if (ew == NULL) {
513 ERROR("Failed to create ELF writer.\n");
514 buffer_delete(&rmod_data);
515 return -1;
516 }
517
518 /* Write out rmodule_header. */
519 ctx->xdr->put16(&rmod_header, RMODULE_MAGIC);
520 ctx->xdr->put8(&rmod_header, RMODULE_VERSION_1);
521 ctx->xdr->put8(&rmod_header, 0);
522 /* payload_begin_offset */
523 loc = sizeof(struct rmodule_header);
524 ctx->xdr->put32(&rmod_header, loc);
525 /* payload_end_offset */
526 loc += ctx->phdr->p_filesz;
527 ctx->xdr->put32(&rmod_header, loc);
528 /* relocations_begin_offset */
529 ctx->xdr->put32(&rmod_header, loc);
530 /* relocations_end_offset */
531 if (bit64)
532 loc += ctx->nrelocs * sizeof(Elf64_Addr);
533 else
534 loc += ctx->nrelocs * sizeof(Elf32_Addr);
535 ctx->xdr->put32(&rmod_header, loc);
536 /* module_link_start_address */
537 ctx->xdr->put32(&rmod_header, ctx->link_addr);
538 /* module_program_size */
539 ctx->xdr->put32(&rmod_header, ctx->size);
540 /* module_entry_point */
541 ctx->xdr->put32(&rmod_header, ctx->entry);
542 /* parameters_begin */
543 ctx->xdr->put32(&rmod_header, ctx->parameters_begin);
544 /* parameters_end */
545 ctx->xdr->put32(&rmod_header, ctx->parameters_end);
546 /* bss_begin */
547 ctx->xdr->put32(&rmod_header, ctx->bss_begin);
548 /* bss_end */
549 ctx->xdr->put32(&rmod_header, ctx->bss_end);
550 /* padding[4] */
551 ctx->xdr->put32(&rmod_header, 0);
552 ctx->xdr->put32(&rmod_header, 0);
553 ctx->xdr->put32(&rmod_header, 0);
554 ctx->xdr->put32(&rmod_header, 0);
555
556 /* Write the relocations. */
557 for (i = 0; i < ctx->nrelocs; i++) {
558 if (bit64)
559 ctx->xdr->put64(&relocs, ctx->emitted_relocs[i]);
560 else
561 ctx->xdr->put32(&relocs, ctx->emitted_relocs[i]);
562 }
563
564 total_size = 0;
565 addr = 0;
566
567 /*
568 * There are 2 cases to deal with. The program has a large NOBITS
569 * section and the relocations can fit entirely within occupied memory
570 * region for the program. The other is that the relocations increase
571 * the memory footprint of the program if it was loaded directly into
572 * the region it would run. The rmdoule header is a fixed cost that
573 * is considered a part of the program.
574 */
575 total_size += buffer_size(&rmod_header);
Aaron Durbin518a3222014-08-26 13:52:30 -0500576 if (buffer_size(&relocs) + ctx->phdr->p_filesz > ctx->phdr->p_memsz) {
Aaron Durbin4fde5a62014-03-07 15:11:53 -0600577 total_size += buffer_size(&relocs);
578 total_size += ctx->phdr->p_filesz;
Aaron Durbin518a3222014-08-26 13:52:30 -0500579 } else {
580 total_size += ctx->phdr->p_memsz;
Aaron Durbin4fde5a62014-03-07 15:11:53 -0600581 }
582
583 ret = add_section(ew, &rmod_header, ".header", addr,
584 buffer_size(&rmod_header));
585 if (ret < 0)
586 goto out;
587 addr += buffer_size(&rmod_header);
588
589 ret = add_section(ew, &program, ".program", addr, ctx->phdr->p_filesz);
590 if (ret < 0)
591 goto out;
592 addr += ctx->phdr->p_filesz;
593
Furquan Shaikhb237c102014-08-26 14:59:36 -0700594 if (ctx->nrelocs) {
595 ret = add_section(ew, &relocs, ".relocs", addr,
596 buffer_size(&relocs));
597 if (ret < 0)
598 goto out;
599 addr += buffer_size(&relocs);
600 }
Aaron Durbin4fde5a62014-03-07 15:11:53 -0600601
602 if (total_size != addr) {
603 ret = add_section(ew, NULL, ".empty", addr, total_size - addr);
604 if (ret < 0)
605 goto out;
606 }
607
608 /*
609 * Ensure last section has a memory usage that meets the required
610 * total size of the program in memory.
611 */
612
613 ret = elf_writer_serialize(ew, out);
614 if (ret < 0)
615 ERROR("Failed to serialize ELF to buffer.\n");
616
617out:
618 buffer_delete(&rmod_data);
619 elf_writer_destroy(ew);
620
621 return ret;
622}
623
624int rmodule_create(const struct buffer *elfin, struct buffer *elfout)
625{
626 struct rmod_context ctx;
627 struct parsed_elf *pelf;
628 int i;
629 int ret;
630
631 ret = -1;
632 memset(&ctx, 0, sizeof(ctx));
633 pelf = &ctx.pelf;
634
635 if (parse_elf(elfin, pelf, ELF_PARSE_ALL)) {
636 ERROR("Couldn't parse ELF!\n");
637 return -1;
638 }
639
640 /* Only allow executables to be turned into rmodules. */
641 if (pelf->ehdr.e_type != ET_EXEC) {
642 ERROR("ELF is not an executable: %u.\n", pelf->ehdr.e_type);
643 goto out;
644 }
645
646 /* Determine if architecture is supported. */
647 for (i = 0; i < ARRAY_SIZE(reloc_ops); i++) {
648 if (reloc_ops[i].arch == pelf->ehdr.e_machine) {
649 ctx.ops = &reloc_ops[i];
650 break;
651 }
652 }
653
654 if (ctx.ops == NULL) {
655 ERROR("ELF is unsupported arch: %u.\n", pelf->ehdr.e_machine);
656 goto out;
657 }
658
659 /* Set the endian ops. */
660 if (ctx.pelf.ehdr.e_ident[EI_DATA] == ELFDATA2MSB)
661 ctx.xdr = &xdr_be;
662 else
663 ctx.xdr = &xdr_le;
664
665 if (find_program_segment(&ctx))
666 goto out;
667
668 if (filter_relocation_sections(&ctx))
669 goto out;
670
671 if (collect_relocations(&ctx))
672 goto out;
673
674 if (populate_program_info(&ctx))
675 goto out;
676
677 if (write_elf(&ctx, elfin, elfout))
678 goto out;
679
680 ret = 0;
681
682out:
683 free(ctx.emitted_relocs);
684 parsed_elf_destroy(pelf);
685 return ret;
686}