blob: d0ca9a6505f907dcefd79d868d749cca41df541b [file] [log] [blame]
Kevin O'Connor202024a2009-01-17 10:41:28 -05001#!/usr/bin/env python
Kevin O'Connor5b8f8092009-09-20 19:47:45 -04002# Script to analyze code and arrange ld sections.
Kevin O'Connor202024a2009-01-17 10:41:28 -05003#
4# Copyright (C) 2008 Kevin O'Connor <kevin@koconnor.net>
5#
6# This file may be distributed under the terms of the GNU GPLv3 license.
7
8import sys
9
# Round 'pos' up to a multiple of 'alignbytes'
def alignpos(pos, alignbytes):
    """Return 'pos' rounded up to the next 'alignbytes' boundary.

    The rounding is done with bit masking, so the result is only a
    true multiple of 'alignbytes' when 'alignbytes' is a power of two.
    """
    # For integers, -alignbytes has the same bits as ~(alignbytes - 1).
    return (pos + alignbytes - 1) & -alignbytes
14
# LD script headers/trailers
# COMMONHEADER is written at the start of every generated linker script
# and opens the SECTIONS block; COMMONTRAILER closes that block.
COMMONHEADER = """
/* DO NOT EDIT! This is an autogenerated file. See tools/layoutrom.py. */
OUTPUT_FORMAT("elf32-i386")
OUTPUT_ARCH("i386")
SECTIONS
{
"""
COMMONTRAILER = """
}
"""
26
Kevin O'Connorc0693942009-06-10 21:56:01 -040027
28######################################################################
29# 16bit fixed address section fitting
30######################################################################
31
# Get the maximum start position for a list of sections that end at an
# address.
def getSectionsStart(sections, endaddr, minalign=1):
    """Return the highest aligned start address for 'sections'.

    sections is a list of (size, align, name) tuples that are packed
    one after another (each at its own alignment) so that the group
    ends no later than 'endaddr'.  The returned address is rounded down
    to the largest alignment found in the list, or to 'minalign' if
    that is larger.
    """
    totspace = 0
    for size, align, name in sections:
        if align > minalign:
            minalign = align
        totspace = alignpos(totspace, align) + size
    # Use explicit floor division: plain '/' only rounds down for
    # Python 2 integers and yields an unaligned float under true
    # division.
    return (endaddr - totspace) // minalign * minalign
Kevin O'Connordb802ad2009-01-17 19:35:10 -050041
# Emit one LD input-section pattern per section
def outSections(file, sections):
    """Write a '*(name)' line to 'file' for every section in order.

    sections is a list of (size, align, name) tuples; only the name is
    used.
    """
    for _size, _align, secname in sections:
        pattern = "*(%s)\n" % (secname,)
        file.write(pattern)
46
# The 16bit code can't exceed 64K of space.  doLayout16 uses this as
# the end address of the fixed-address area.
MAXPOS = 64*1024
49
# Layout the 16bit code. This ensures sections with fixed offset
# requirements are placed in the correct location. It also places the
# 16bit code as high as possible in the f-segment.
def doLayout16(sections, outname):
    """Lay out the 16bit sections and write the LD script 'outname'.

    sections is a list of (size, align, name) tuples.  Sections named
    '.fixedaddr.<hexaddr>' are pinned at that address.  '.text.'
    sections are used to fill the gaps after each fixed section where
    they fit; the remaining text sections end at the first fixed
    address, and the rodata and '.data16.' sections end where that
    text starts.

    Returns the start address chosen for the .data16 output section.
    Prints an error and exits with status 1 if a fixed section has an
    alignment other than 1.  Raises IndexError if there is no fixed
    section at all.
    """
    textsections = []
    rodatasections = []
    datasections = []
    # fixedsections = [(addr, sectioninfo, extrasectionslist), ...]
    fixedsections = []
    # canrelocate = [(sectioninfo, list), ...]
    canrelocate = []

    # Find desired sections.
    for section in sections:
        size, align, name = section
        if name[:11] == '.fixedaddr.':
            addr = int(name[11:], 16)
            fixedsections.append((addr, section, []))
            if align != 1:
                # Parenthesised so the same text is printed on Python 2
                # and the line also parses on Python 3.
                print("Error: Fixed section %s has non-zero alignment (%d)" % (
                    name, align))
                sys.exit(1)
        if name[:6] == '.text.':
            textsections.append(section)
            canrelocate.append((section, textsections))
        if name[:17] == '.rodata.__func__.' or name == '.rodata.str1.1':
            # rodata is not offered for relocation into the fixed area.
            rodatasections.append(section)
        if name[:8] == '.data16.':
            # data16 is not offered for relocation into the fixed area.
            datasections.append(section)

    # Find freespace in fixed address area
    fixedsections.sort()
    # fixedAddr = [(freespace, sectioninfo), ...]
    fixedAddr = []
    for i, fixedsectioninfo in enumerate(fixedsections):
        addr, section, extrasectionslist = fixedsectioninfo
        if i == len(fixedsections) - 1:
            nextaddr = MAXPOS
        else:
            nextaddr = fixedsections[i+1][0]
        avail = nextaddr - addr - section[0]
        fixedAddr.append((avail, fixedsectioninfo))

    # Attempt to fit other sections into fixed area.  Gaps are visited
    # smallest first and candidates are sorted by size, so the last
    # candidate that fits in a gap is the largest one that fits.
    fixedAddr.sort()
    canrelocate.sort()
    totalused = 0
    for freespace, fixedsectioninfo in fixedAddr:
        fixedaddr, fixedsection, extrasections = fixedsectioninfo
        addpos = fixedaddr + fixedsection[0]
        totalused += fixedsection[0]
        nextfixedaddr = addpos + freespace
        while 1:
            canfit = None
            for fixedaddrinfo in canrelocate:
                fitsection, inlist = fixedaddrinfo
                fitsize, fitalign, fitname = fitsection
                if addpos + fitsize > nextfixedaddr:
                    # Can't fit and nothing else will fit.
                    break
                fitnextaddr = alignpos(addpos, fitalign) + fitsize
                if fitnextaddr > nextfixedaddr:
                    # This item can't fit.
                    continue
                canfit = (fitnextaddr, fixedaddrinfo)
            if canfit is None:
                break
            # Found a section that can fit.
            fitnextaddr, fixedaddrinfo = canfit
            canrelocate.remove(fixedaddrinfo)
            fitsection, inlist = fixedaddrinfo
            inlist.remove(fitsection)
            extrasections.append(fitsection)
            addpos = fitnextaddr
            totalused += fitsection[0]
    firstfixed = fixedsections[0][0]

    # Report stats
    total = MAXPOS-firstfixed
    slack = total - totalused
    print("Fixed space: 0x%x-0x%x total: %d slack: %d"
          " Percent slack: %.1f%%" % (
              firstfixed, MAXPOS, total, slack,
              (float(slack) / total) * 100.0))

    # Find start positions
    text16_start = getSectionsStart(textsections, firstfixed)
    data16_start = getSectionsStart(rodatasections + datasections, text16_start)

    output = open(outname, 'wb')
    # Close the script explicitly so it is flushed to disk even if a
    # write fails part way through.
    try:
        # Write header and regular sections
        output.write(COMMONHEADER + """
        data16_start = 0x%x ;
        .data16 data16_start : {
""" % data16_start)
        outSections(output, datasections)
        output.write("code16_rodata = . ;\n")
        outSections(output, rodatasections)
        output.write("""
        }

        text16_start = 0x%x ;
        .text16 text16_start : {
""" % text16_start)
        outSections(output, textsections)

        # Write fixed sections
        for addr, section, extrasections in fixedsections:
            name = section[2]
            output.write(". = ( 0x%x - text16_start ) ;\n" % (addr,))
            output.write("*(%s)\n" % (name,))
            for extrasection in extrasections:
                output.write("*(%s)\n" % (extrasection[2],))

        # Write trailer
        output.write("""
                text16_end = ABSOLUTE(.) ;
        }

        /* Discard regular data sections to force a link error if
         * 16bit code attempts to access data not marked with VAR16
         */
        /DISCARD/ : { *(.text*) *(.rodata*) *(.data*) *(.bss*) *(COMMON) }
""" + COMMONTRAILER)
    finally:
        output.close()

    return data16_start
Kevin O'Connorb1a0d3a2009-05-23 17:49:44 -0400186
Kevin O'Connor202024a2009-01-17 10:41:28 -0500187
Kevin O'Connorc0693942009-06-10 21:56:01 -0400188######################################################################
189# 32bit section outputting
190######################################################################
191
# Select the sections whose name begins with a given prefix
def getSectionsPrefix(sections, prefix):
    """Return a new list of the (size, align, name) tuples in 'sections'
    whose name starts with 'prefix', in their original order.
    """
    return [(size, align, name)
            for size, align, name in sections
            if name.startswith(prefix)]
Kevin O'Connorc0693942009-06-10 21:56:01 -0400200
# Layout the 32bit segmented code. This places the code as high as possible.
def doLayout32seg(sections, outname, endat):
    """Write the LD script 'outname' for the 32bit segmented code.

    sections is a list of (size, align, name) tuples.  The '.text.',
    '.rodata.str1.1', '.rodata.__func__.' and '.data32seg.' sections
    are placed so that they end at 'endat'.

    Returns the start address chosen for the output section.
    """
    # Find sections to output
    textsections = getSectionsPrefix(sections, '.text.')
    rodatasections = (getSectionsPrefix(sections, '.rodata.str1.1')
                      + getSectionsPrefix(sections, '.rodata.__func__.'))
    datasections = getSectionsPrefix(sections, '.data32seg.')
    startat = getSectionsStart(
        textsections + rodatasections + datasections, endat)

    # Write sections
    output = open(outname, 'wb')
    # Close the script explicitly so it is flushed to disk even if a
    # write fails part way through.
    try:
        output.write(COMMONHEADER + """
        code32seg_start = 0x%x ;
        .text32seg code32seg_start : {
                freespace_end = . ;
""" % startat)

        outSections(output, textsections)
        output.write("code32seg_rodata = . ;\n")
        outSections(output, rodatasections)
        outSections(output, datasections)

        output.write("""
                code32seg_end = ABSOLUTE(.) ;
        }
        /DISCARD/ : { *(.text*) *(.rodata*) *(.data*) *(.bss*) *(COMMON) }
""" + COMMONTRAILER)
    finally:
        output.close()
    return startat
230
# Layout the 32bit flat code. This places the code as high as possible.
def doLayout32flat(sections, outname, endat):
    """Write the LD script 'outname' for the 32bit flat code.

    sections is a list of (size, align, name) tuples.  'endat' is
    offset by 0xf0000 before use, and the '.text.', '.rodata',
    '.data.' and '.bss.' sections are placed so that they end there,
    with the start rounded down to at least a 512 byte boundary.

    Returns the start address chosen for the output section.
    """
    endat += 0xf0000
    # Find sections to output
    textsections = getSectionsPrefix(sections, '.text.')
    rodatasections = getSectionsPrefix(sections, '.rodata')
    datasections = getSectionsPrefix(sections, '.data.')
    bsssections = getSectionsPrefix(sections, '.bss.')
    startat = getSectionsStart(
        textsections + rodatasections + datasections + bsssections, endat, 512)

    # Write sections
    output = open(outname, 'wb')
    # Close the script explicitly so it is flushed to disk even if a
    # write fails part way through.
    try:
        output.write(COMMONHEADER + """
        code32flat_start = 0x%x ;
        .text32flat code32flat_start : {
""" % startat)

        outSections(output, textsections)
        output.write("code32_rodata = . ;\n")
        outSections(output, rodatasections)
        outSections(output, datasections)
        outSections(output, bsssections)

        output.write("""
                freespace_start = . ;
                code32flat_end = ABSOLUTE(.) ;
        }
""" + COMMONTRAILER)
    finally:
        output.close()
    return startat
Kevin O'Connorc0693942009-06-10 21:56:01 -0400261
262
263######################################################################
264# Section garbage collection
265######################################################################
266
# Return the sections of an objdump info tuple whose names were kept.
def getSectionsList(info, names):
    """Filter info[0] down to the sections listed in 'names'.

    info[0] is a list of (size, align, name) tuples and 'names' is an
    iterable of section names to keep.  The original tuples are
    returned in their original order; sections not named are dropped.
    """
    # Build the lookup once; testing membership against the list for
    # every section would be quadratic.
    wanted = set(names)
    out = []
    for entry in info[0]:
        size, align, section = entry
        if section in wanted:
            out.append(entry)
    return out
276
# Look up a symbol's section and mark that section as kept.
def keepsymbol(symbol, infos, pos):
    """Keep the section that defines 'symbol' in infos[pos].

    infos[pos][1] maps symbol names to (addr, section) pairs.  Returns
    -1 without keeping anything when the symbol is unknown, or when its
    section name contains '*' or starts with '.discard.'.  Otherwise
    the section is passed to keepsection() and 0 is returned.
    """
    symboltable = infos[pos][1]
    _addr, secname = symboltable.get(symbol, (None, None))
    if secname is None:
        return -1
    if '*' in secname or secname.startswith('.discard.'):
        return -1
    keepsection(secname, infos, pos)
    return 0
284
# Mark a section as required, then follow its relocations so that every
# section it references is marked as required too.
def keepsection(name, infos, pos=0):
    """Record section 'name' in the keep list of infos[pos].

    infos[pos][3] is the keep list and infos[pos][2] maps a section
    name to the symbols it references.  Each referenced symbol is
    looked up in infos[pos] first and then in the other two infos
    entries, stopping at the first one where keepsymbol() succeeds.
    """
    kept = infos[pos][3]
    if name in kept:
        # Already kept - nothing to do.
        return
    kept.append(name)
    referenced = infos[pos][2].get(name)
    if referenced is None:
        return
    # Keep all sections that this section points to.  A symbol missing
    # from the primary sections may be a cross 16/32 reference, so the
    # other two entries are tried in turn.
    for symbol in referenced:
        for trypos in (pos, (pos + 1) % 3, (pos + 2) % 3):
            if not keepsymbol(symbol, infos, trypos):
                break
Kevin O'Connorc0693942009-06-10 21:56:01 -0400307
# Work out which sections are reachable and therefore have to be placed
# into the output files.
def gc(info16, info32seg, info32flat):
    """Return the kept sections of the 16bit, 32seg and 32flat inputs.

    Each argument is a (sections, symbols, relocs) tuple.  Every 16bit
    section whose name starts with '.fixedaddr.' or contains '.export.'
    is a root; keepsection() marks whatever the roots reference.
    Returns three lists of (size, align, name) tuples.
    """
    # infos = ((sections, symbols, relocs, keep sections), ...)
    infos = tuple([(info[0], info[1], info[2], [])
                   for info in (info16, info32seg, info32flat)])
    # Start by keeping sections that are globally visible.
    for _size, _align, secname in info16[0]:
        if secname.startswith('.fixedaddr.') or '.export.' in secname:
            keepsection(secname, infos)
    # Return sections found.
    kept16, kept32seg, kept32flat = [entry[3] for entry in infos]
    return (getSectionsList(info16, kept16),
            getSectionsList(info32seg, kept32seg),
            getSectionsList(info32flat, kept32flat))
Kevin O'Connorc0693942009-06-10 21:56:01 -0400324
325
326######################################################################
327# Startup and input parsing
328######################################################################
329
# Read in output from objdump
def parseObjDump(file):
    """Parse objdump text from the open file 'file'.

    Returns a (sections, symbols, relocs) tuple:
      sections = [(size, align, name), ...]
      symbols[symbol] = (addr, section)
      relocs[section] = [symbol, ...]

    Lines that do not match the expected layout of the current part of
    the dump (column headers, flag lines, blank lines) are skipped.
    """
    # sections = [(size, align, section), ...]
    sections = []
    # symbols[symbol] = (addr, section)
    symbols = {}
    # relocs[section] = [symbol, ...]
    relocs = {}

    state = None
    relocsection = None
    for line in file:
        line = line.rstrip()
        if line == 'Sections:':
            state = 'section'
            continue
        if line == 'SYMBOL TABLE:':
            state = 'symbol'
            continue
        if line[:24] == 'RELOCATION RECORDS FOR [':
            state = 'reloc'
            # Drop the trailing "]:" to get the section name.
            relocsection = line[24:-2]
            continue

        # Only ValueError (wrong field count, non-numeric field) marks
        # a line to skip; anything else is a real error and propagates.
        if state == 'section':
            try:
                idx, name, size, vma, lma, fileoff, align = line.split()
                if align[:3] != '2**':
                    continue
                sections.append((int(size, 16), 2**int(align[3:]), name))
            except ValueError:
                pass
            continue
        if state == 'symbol':
            try:
                section, off, symbol = line[17:].split()
                # Converted only to reject lines without a hex field.
                off = int(off, 16)
                addr = int(line[:8], 16)
                symbols[symbol] = addr, section
            except ValueError:
                pass
            continue
        if state == 'reloc':
            try:
                off, reloctype, symbol = line.split()
                # Converted only to reject the column header line.
                off = int(off, 16)
                relocs.setdefault(relocsection, []).append(symbol)
            except ValueError:
                pass
    return sections, symbols, relocs
379
def main():
    """Read three objdump listings and write three LD scripts.

    The command line must give exactly six names: the 16bit, 32seg and
    32flat objdump inputs followed by the 16bit, 32seg and 32flat
    linker script outputs.
    """
    # Get input and output names
    in16, in32seg, in32flat, out16, out32seg, out32flat = sys.argv[1:]

    # Parse each input and close it as soon as it has been read.
    infos = []
    for inname in (in16, in32seg, in32flat):
        infile = open(inname, 'rb')
        try:
            infos.append(parseObjDump(infile))
        finally:
            infile.close()
    info16, info32seg, info32flat = infos

    sections16, sections32seg, sections32flat = gc(
        info16, info32seg, info32flat)

    # Each layout ends where the previous one starts.
    start16 = doLayout16(sections16, out16)
    start32seg = doLayout32seg(sections32seg, out32seg, start16)
    doLayout32flat(sections32flat, out32flat, start32seg)
Kevin O'Connorc0693942009-06-10 21:56:01 -0400397
# Run the layout only when executed as a script, not when imported.
if __name__ == '__main__':
    main()