Merge remote-tracking branch

'origin/GP-3182_ryanmkurtz_PR-5004_colinbourassa_unix-aout-loader'
(Closes #4943, Closes #5004)
This commit is contained in:
Ryan Kurtz 2025-03-19 16:17:14 -04:00
commit 6cc201b572
9 changed files with 1697 additions and 0 deletions

View file

@ -0,0 +1,552 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.bin.format.unixaout;
import java.io.IOException;
import ghidra.app.util.bin.*;
import ghidra.program.model.address.Address;
import ghidra.program.model.data.*;
import ghidra.program.model.listing.Listing;
import ghidra.program.model.listing.Program;
import ghidra.program.model.util.CodeUnitInsertionException;
import ghidra.util.exception.DuplicateNameException;
public class UnixAoutHeader implements StructConverter {
public enum AoutType {
OMAGIC, NMAGIC, ZMAGIC, QMAGIC, CMAGIC, UNKNOWN
}
private BinaryReader reader;
private long binarySize;
private AoutType exeType;
private boolean machineTypeValid;
private String languageSpec;
private String compilerSpec = "default";
private long pageSize;
private boolean isNetBSD = false;
private boolean isSparc = false;
private long a_magic;
private long a_text;
private long a_data;
private long a_bss;
private long a_syms;
private long a_entry;
private long a_trsize;
private long a_drsize;
private long strSize;
private long txtOffset;
private long datOffset;
private long txtRelOffset;
private long datRelOffset;
private long symOffset;
private long strOffset;
private long txtAddr;
private long txtEndAddr;
private long datAddr;
private long bssAddr;
// The Linux implementation of a.out appears to start the .text content at
// file offset 0x400 (rather than immediately after the 0x20 bytes of header
// data). It's possible that there exist Linux a.out executabLes with other
// (unintended?) header sizes caused by a mixture of 32- and 64-bit integers
// being padded out in the struct. The intended size is eight 32-bit words
// (32 bytes total.)
private static final int SIZE_OF_EXEC_HEADER = 0x20;
private static final int SIZE_OF_LONG_EXEC_HEADER = 0x400;
/**
* Interprets binary data as an exec header from a UNIX-style a.out executable, and validates
* the contained fields.
*
* @param provider Source of header binary data
* @param isLittleEndian Flag indicating whether to interpret the data as little-endian.
* @throws IOException if an IO-related error occurred
*/
public UnixAoutHeader(ByteProvider provider, boolean isLittleEndian) throws IOException {
reader = new BinaryReader(provider, isLittleEndian);
a_magic = reader.readNextUnsignedInt();
a_text = reader.readNextUnsignedInt();
a_data = reader.readNextUnsignedInt();
a_bss = reader.readNextUnsignedInt();
a_syms = reader.readNextUnsignedInt();
a_entry = reader.readNextUnsignedInt();
a_trsize = reader.readNextUnsignedInt();
a_drsize = reader.readNextUnsignedInt();
binarySize = reader.length();
setExecutableType(a_magic);
// NOTE: In NetBSD/i386 examples of a.out, the "new-style" 32-bit a_magic/midmag word is
// written in big-endian regardless of the data endianness in the rest of the file.
if ((exeType == AoutType.UNKNOWN) && isLittleEndian) {
a_magic = Integer.reverseBytes((int) a_magic);
setExecutableType(a_magic);
}
checkMachineTypeValidity(isLittleEndian);
determineTextOffset();
datOffset = txtOffset + a_text;
txtRelOffset = datOffset + a_data;
datRelOffset = txtRelOffset + a_trsize;
symOffset = datRelOffset + a_drsize;
strOffset = symOffset + a_syms;
strSize = 0;
if (strOffset != 0 && (strOffset + 4) <= binarySize) {
strSize = reader.readUnsignedInt(strOffset);
}
determineTextAddr();
txtEndAddr = txtAddr + a_text;
datAddr = (exeType == AoutType.OMAGIC) ? txtEndAddr : segmentRound(txtEndAddr);
bssAddr = datAddr + a_data;
}
public BinaryReader getReader() {
return reader;
}
/**
* {@return the processor/language specified by this header.}
*/
public String getLanguageSpec() {
return languageSpec;
}
/**
* {@return the compiler used by this executable. This is left as 'default' for
* all machine types other than i386, where it is assumed to be gcc.}
*/
public String getCompilerSpec() {
return compilerSpec;
}
/**
* {@return the enumerated type of executable contained in this A.out file.}
*/
public AoutType getExecutableType() {
return exeType;
}
/**
* {@return an indication of whether this header's fields are all valid; this
* includes the machine type, executable type, and section offsets.}
*/
public boolean isValid() {
return isMachineTypeValid() &&
(exeType != AoutType.UNKNOWN) &&
areOffsetsValid();
}
public long getTextSize() {
return a_text;
}
public long getDataSize() {
return a_data;
}
public long getBssSize() {
return a_bss;
}
public long getSymSize() {
return a_syms;
}
public long getStrSize() {
return strSize;
}
public long getEntryPoint() {
return a_entry;
}
public long getTextRelocSize() {
return a_trsize;
}
public long getDataRelocSize() {
return a_drsize;
}
public long getTextOffset() {
return txtOffset;
}
public long getDataOffset() {
return datOffset;
}
public long getTextRelocOffset() {
return txtRelOffset;
}
public long getDataRelocOffset() {
return datRelOffset;
}
public long getSymOffset() {
return symOffset;
}
public long getStrOffset() {
return strOffset;
}
public long getTextAddr() {
return txtAddr;
}
public long getDataAddr() {
return datAddr;
}
public long getBssAddr() {
return bssAddr;
}
/**
* Checks the magic word in the header for a known machine type ID, and sets the
* languageSpec string accordingly.
*/
private void checkMachineTypeValidity(boolean readingAsLittleEndian) {
machineTypeValid = true;
pageSize = 4096;
final short machtype = (short) ((a_magic >> 16) & 0xFF);
final String readEndianness = readingAsLittleEndian ? "LE" : "BE";
switch (machtype) {
/**
* Motorola 68K family
*/
case UnixAoutMachineType.M_68010:
languageSpec = "68000:BE:32:MC68010";
break;
case UnixAoutMachineType.M_68020:
languageSpec = "68000:BE:32:MC68020";
break;
case UnixAoutMachineType.M_M68K_NETBSD:
pageSize = 8192;
case UnixAoutMachineType.M_M68K4K_NETBSD:
isNetBSD = true;
languageSpec = "68000:BE:32:default";
break;
/**
* SPARC family
*/
case UnixAoutMachineType.M_SPARC_NETBSD:
isNetBSD = true;
case UnixAoutMachineType.M_SPARC:
case UnixAoutMachineType.M_SPARCLET:
isSparc = true;
pageSize = 8192;
languageSpec = "sparc:BE:32:default";
break;
case UnixAoutMachineType.M_SPARC64_NETBSD:
isNetBSD = true;
isSparc = true;
languageSpec = "sparc:BE:64:default";
break;
/**
* MIPS family
*/
case UnixAoutMachineType.M_PMAX_NETBSD:
isNetBSD = true;
case UnixAoutMachineType.M_MIPS1:
case UnixAoutMachineType.M_MIPS2:
case UnixAoutMachineType.M_R3000:
languageSpec = "MIPS:LE:32:default";
break;
case UnixAoutMachineType.M_MIPS:
languageSpec = "MIPS:BE:32:default";
break;
/**
* National Semiconductor NS32000 family
*/
case UnixAoutMachineType.M_532_NETBSD:
isNetBSD = true;
case UnixAoutMachineType.M_NS32032:
case UnixAoutMachineType.M_NS32532:
languageSpec = "UNKNOWN:LE:32:default";
break;
/**
* x86 family
*/
case UnixAoutMachineType.M_386_NETBSD:
isNetBSD = true;
case UnixAoutMachineType.M_386:
case UnixAoutMachineType.M_386_DYNIX:
compilerSpec = "gcc";
languageSpec = "x86:LE:32:default";
break;
case UnixAoutMachineType.M_X86_64_NETBSD:
compilerSpec = "gcc";
languageSpec = "x86:LE:64:default";
break;
/**
* ARM family
*/
case UnixAoutMachineType.M_ARM6_NETBSD:
isNetBSD = true;
case UnixAoutMachineType.M_ARM:
languageSpec = "ARM:" + readEndianness + ":32:default";
break;
case UnixAoutMachineType.M_AARCH64:
languageSpec = "AARCH64:" + readEndianness + ":64:default";
break;
/**
* RISC family
*/
case UnixAoutMachineType.M_OR1K:
languageSpec = "UNKNOWN:BE:32:default";
break;
case UnixAoutMachineType.M_RISCV:
languageSpec = "RISCV:LE:32:default";
break;
case UnixAoutMachineType.M_HPPA_OPENBSD:
languageSpec = "pa-risc:BE:32:default";
break;
/**
* PowerPC family
*/
case UnixAoutMachineType.M_POWERPC_NETBSD:
isNetBSD = true;
languageSpec = "PowerPC:" + readEndianness + ":32:default";
break;
case UnixAoutMachineType.M_POWERPC64:
languageSpec = "PowerPC:" + readEndianness + ":64:default";
break;
/**
* SuperH family
* NOTE: It's unclear if there is support for SuperH SH-3 or SH-5 cores;
* the primary SuperH language seems to support SH-1 and SH-2 variants
* and the alternative is the SuperH4 language.
*/
case UnixAoutMachineType.M_SH3:
case UnixAoutMachineType.M_SH5_32:
languageSpec = "SuperH:BE:32:default";
break;
case UnixAoutMachineType.M_SH5_64:
languageSpec = "SuperH:BE:64:default";
break;
/**
* VAX family
*/
case UnixAoutMachineType.M_VAX_NETBSD:
pageSize = 512;
case UnixAoutMachineType.M_VAX4K_NETBSD:
isNetBSD = true;
languageSpec = "UNKNOWN:LE:32:default";
break;
/**
* Other
*/
case UnixAoutMachineType.M_CRIS:
languageSpec = "UNKNOWN:LE:32:default";
break;
case UnixAoutMachineType.M_ALPHA_NETBSD:
isNetBSD = true;
case UnixAoutMachineType.M_IA64:
languageSpec = "UNKNOWN:" + readEndianness + ":64:default";
break;
case UnixAoutMachineType.M_29K:
case UnixAoutMachineType.M_88K_OPENBSD:
languageSpec = "UNKNOWN:" + readEndianness + ":32:default";
break;
case UnixAoutMachineType.M_UNKNOWN:
languageSpec = "UNKNOWN:" + readEndianness + ":32:default";
break;
default:
machineTypeValid = false;
}
// Check that the detected architecture's endianness matches the endianness
// with which we're reading the file; if there's a mismatch, clear the
// machineTypeValid flag because this was evidently a false reading.
if (machineTypeValid) {
String[] languageTokens = languageSpec.split(":");
if ((languageTokens.length < 2) ||
!languageTokens[1].equalsIgnoreCase(readEndianness)) {
machineTypeValid = false;
}
}
}
/**
* Returns a flag indicating whether the header contains a known machine type
* ID.
*/
private boolean isMachineTypeValid() {
return machineTypeValid;
}
/**
* Sets the executable type based on the given magic
*
* @param magic The magic
*/
private void setExecutableType(long magic) {
exeType = switch ((short) (magic & 0xFFFF)) {
case 0x111 -> AoutType.CMAGIC; // 0421: core file
case 0x108 -> AoutType.NMAGIC; // 0410: pure executable
case 0x107 -> AoutType.OMAGIC; // 0407: object file or impure executable
case 0x0CC -> AoutType.QMAGIC; // 0314: demand-paged exe w/ header in .text
case 0x10B -> AoutType.ZMAGIC; // 0413: demand-paged executable
default -> AoutType.UNKNOWN;
};
}
/**
* Determines the offset in the binary file at which the .text segment begins.
* This routine should attempt to replicate the logic from the N_TXTOFF macro
* that appears in the different incarnations of a.out.h.
*
* NOTE: The FreeBSD imgact_aout.h implies that, if the a_magic word contains
* ZMAGIC when read as little endian, the file offset for .text is __LDPGSZ;
* otherwise, if a_magic contains ZMAGIC when read as big endian, the file
* offset
* for .text is 0. Indeed, it looks like NetBSD uses big-endian ordering for
* the a_magic word even when the file contains code for a little-endian
* processor.
*/
private void determineTextOffset() {
boolean isLinuxStyle = false;
final long fixedContentSize = a_text + a_data + a_syms + a_trsize + a_drsize;
// If the file is large enough to read at least one word beyond a long-style
// header
// of 0x400 bytes plus all the sections whose sizes are specified in the
// header...
if (reader.isValidIndex(SIZE_OF_LONG_EXEC_HEADER + fixedContentSize)) {
try {
// The word that immediately follows the symbol table will contain the size of
// the string table.
final long stringTableLength =
reader.readUnsignedInt(SIZE_OF_LONG_EXEC_HEADER + fixedContentSize);
final long longHeaderExpectedFileSize =
SIZE_OF_LONG_EXEC_HEADER + fixedContentSize + stringTableLength;
// If the size of the file exactly matches what we'd expect if the .text content
// starts at offset 0x400 rather than 0, this implies that the a.out is a
// Linux-style binary.
if (binarySize == longHeaderExpectedFileSize) {
isLinuxStyle = true;
}
}
catch (IOException e) {
e.printStackTrace();
}
}
if (isLinuxStyle && (exeType == AoutType.ZMAGIC)) {
// Linux ZMAGICs don't start the .text content until 0x400
txtOffset = SIZE_OF_LONG_EXEC_HEADER;
}
else if ((exeType == AoutType.QMAGIC) ||
(exeType == AoutType.ZMAGIC)) {
// ZMAGIC for other platforms (as well as QMAGIC) include the file header itself
// in the .text content
txtOffset = 0;
}
else {
// Otherwise, the .text content starts immediately after the 0x20-byte header
txtOffset = SIZE_OF_EXEC_HEADER;
}
}
/**
* Uses the combination of executable type and architecture to set the
* appropriate
* base address of the .text segment when loaded.
*/
private void determineTextAddr() {
txtAddr = (isSparc && exeType == AoutType.NMAGIC) || isNetBSD || exeType == AoutType.QMAGIC
? pageSize
: 0;
}
/**
* Returns a flag indicating whether all the file offsets in the header
* (for the segments of nonzero size) fall within the size of the file.
*/
private boolean areOffsetsValid() {
// Note that we can't check the string table validity because, if it
// doesn't exist, its offset will be computed to be beyond the end of
// the file. The string table is also not given an explicit size in
// the header.
boolean status = ((a_text == 0) || (txtOffset < binarySize) &&
((a_data == 0) || (datOffset < binarySize)) &&
((a_trsize == 0) || (txtRelOffset < binarySize)) &&
((a_drsize == 0) || (datRelOffset < binarySize)) &&
((a_syms == 0) || (symOffset < binarySize)));
return status;
}
/**
* Rounds the provided address up to the next page boundary.
*/
private long segmentRound(long addr) {
final long mask = pageSize - 1;
long rounded = ((addr + mask) & ~mask);
return rounded;
}
@Override
public DataType toDataType() throws DuplicateNameException, IOException {
Structure struct = new StructureDataType(new CategoryPath("/AOUT"), "exec", 0);
struct.add(DWORD, "a_midmag", "magic (network byte order)");
struct.add(DWORD, "a_text", "the size of the text segment in bytes");
struct.add(DWORD, "a_data", "the size of the data segment in bytes");
struct.add(DWORD, "a_bss", "the number of bytes in the bss segment");
struct.add(DWORD, "a_syms", "the size in bytes of the symbol table section");
struct.add(DWORD, "a_entry", "the address of the entry point");
struct.add(DWORD, "a_trsize", "the size in bytes of the text relocation table");
struct.add(DWORD, "a_drsize", "the size in bytes of the data relocation table");
return struct;
}
public void markup(Program program, Address headerAddress)
throws CodeUnitInsertionException, DuplicateNameException, IOException {
Listing listing = program.getListing();
listing.createData(headerAddress, toDataType());
}
}

View file

@ -0,0 +1,78 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.bin.format.unixaout;
public class UnixAoutMachineType {
// These values come from a combination of sources, including NetBSD's aout_mids.h and the GNU
// BFD Library's libaout.h.
//
// Note: some a.out header files list a few HP values (for the 300 Series, 800 Series, etc.)
// and these values exceed a full eight-bit count. Occasionally, this is accounted for by
// extending the Machine ID field of the a_magic word two bits higher, leaving only six bits in
// the MSB for other flags. This may not be correct, because those high-value HP machine IDs
// probably only appear in HP UX binaries, which use a different format. (This format is still
// named "a.out", but has a completely different header and internal organization.) The 10-bit
// Machine ID field would also interfere with flags used by VxWorks, NetBSD, and probably
// others.
public final static short M_UNKNOWN = 0x00;
public final static short M_68010 = 0x01;
public final static short M_68020 = 0x02;
public final static short M_SPARC = 0x03;
public final static short M_R3000 = 0x04;
public final static short M_NS32032 = 0x40;
public final static short M_NS32532 = 0x45;
public final static short M_386 = 0x64;
public final static short M_29K = 0x65; // AMD 29000
public final static short M_386_DYNIX = 0x66; // i386-based Sequet machine running DYNIX
public final static short M_ARM = 0x67;
public final static short M_SPARCLET = 0x83; // Sparclet = M_SPARC + 128
public final static short M_386_NETBSD = 0x86; // NetBSD/i386
public final static short M_M68K_NETBSD = 0x87; // NetBSD/m68k, 8K pages
public final static short M_M68K4K_NETBSD = 0x88; // NetBSD/m68k, 4K pages
public final static short M_532_NETBSD = 0x89; // NetBSD/ns32k
public final static short M_SPARC_NETBSD = 0x8a; // NetBSD/sparc
public final static short M_PMAX_NETBSD = 0x8b; // NetBSD/pmax (MIPS little-endian)
public final static short M_VAX_NETBSD = 0x8c; // NetBSD/VAX (1K pages?)
public final static short M_ALPHA_NETBSD = 0x8d; // NetBSD/Alpha
public final static short M_MIPS = 0x8e; // big-endian
public final static short M_ARM6_NETBSD = 0x8f; // NetBSD/arm32
public final static short M_SH3 = 0x91;
public final static short M_POWERPC64 = 0x94; // PowerPC 64
public final static short M_POWERPC_NETBSD = 0x95; // NetBSD/PowerPC (big-endian)
public final static short M_VAX4K_NETBSD = 0x96; // NetBSD/VAX (4K pages)
public final static short M_MIPS1 = 0x97; // MIPS R2000/R3000
public final static short M_MIPS2 = 0x98; // MIPS R4000/R6000
public final static short M_88K_OPENBSD = 0x99; // OpenBSD/m88k
public final static short M_HPPA_OPENBSD = 0x9a; // OpenBSD/hppa (PA-RISC)
public final static short M_SH5_64 = 0x9b; // SuperH 64-bit
public final static short M_SPARC64_NETBSD = 0x9c; // NetBSD/sparc64
public final static short M_X86_64_NETBSD = 0x9d; // NetBSD/amd64
public final static short M_SH5_32 = 0x9e; // SuperH 32-bit (ILP 32)
public final static short M_IA64 = 0x9f; // Itanium
public final static short M_AARCH64 = 0xb7; // ARM AARCH64
public final static short M_OR1K = 0xb8; // OpenRISC 1000
public final static short M_RISCV = 0xb9; // RISC-V
public final static short M_CRIS = 0xff; // Axis ETRAX CRIS
// Machine IDs that should only appear in the incompatible HP UX a.out format:
//
// HP300 (68020+68881): 0x12c
// HP200/300 : 0x20c
// HP800 : 0x20b
}

View file

@ -0,0 +1,85 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.bin.format.unixaout;
import ghidra.app.util.opinion.UnixAoutProgramLoader;
/**
* Represents the content of a single entry in the relocation table format used
* by the UNIX a.out executable.
*/
public class UnixAoutRelocation {
public long address;
public int symbolNum;
public byte flags;
public boolean pcRelativeAddressing;
public byte pointerLength;
public boolean extern;
public boolean baseRelative;
public boolean jmpTable;
public boolean relative;
public boolean copy;
/**
*
* @param address First of the two words in the table entry (a 32-bit address)
* @param flags Second of the two words in the table entry (containing several bitfields)
* @param bigEndian True if big endian; otherwise, false
*/
public UnixAoutRelocation(long address, long flags, boolean bigEndian) {
this.address = (0xFFFFFFFF & address);
if (bigEndian) {
this.symbolNum = (int) ((flags & 0xFFFFFF00) >> 8);
this.flags = (byte) (flags & 0xFF);
this.pcRelativeAddressing = ((flags & 0x80) != 0);
this.pointerLength = (byte) (1 << ((flags & 0x60) >> 5));
this.extern = ((flags & 0x10) != 0);
this.baseRelative = ((flags & 0x8) != 0);
this.jmpTable = ((flags & 0x4) != 0);
this.relative = ((flags & 0x2) != 0);
this.copy = ((flags & 0x1) != 0);
}
else {
this.symbolNum = (int) (flags & 0x00FFFFFF);
this.flags = (byte) ((flags & 0xFF000000) >> 24);
this.pcRelativeAddressing = ((this.flags & 0x01) != 0);
this.pointerLength = (byte) (1 << ((this.flags & 0x06) >> 1));
this.extern = ((this.flags & 0x08) != 0);
this.baseRelative = ((this.flags & 0x10) != 0);
this.jmpTable = ((this.flags & 0x20) != 0);
this.relative = ((this.flags & 0x40) != 0);
this.copy = ((this.flags & 0x80) != 0);
}
}
public String getSymbolName(UnixAoutSymbolTable symtab) {
if (extern && symbolNum < symtab.size()) {
return symtab.get(symbolNum).name;
}
else if (!extern) {
return switch (symbolNum) {
case 4 -> UnixAoutProgramLoader.dot_text;
case 6 -> UnixAoutProgramLoader.dot_data;
case 8 -> UnixAoutProgramLoader.dot_bss;
default -> null;
};
}
return null;
}
}

View file

@ -0,0 +1,102 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.bin.format.unixaout;
import java.io.IOException;
import java.util.*;
import org.apache.commons.lang3.StringUtils;
import ghidra.app.util.bin.BinaryReader;
import ghidra.app.util.bin.StructConverter;
import ghidra.program.model.data.*;
import ghidra.program.model.listing.*;
import ghidra.program.model.mem.MemoryBlock;
import ghidra.program.model.util.CodeUnitInsertionException;
import ghidra.util.exception.DuplicateNameException;
public class UnixAoutRelocationTable implements Iterable<UnixAoutRelocation>, StructConverter {
private static final int ENTRY_SIZE = 8;
private final long fileSize;
private final List<UnixAoutRelocation> relocations;
private final UnixAoutSymbolTable symtab;
public UnixAoutRelocationTable(BinaryReader reader, long fileOffset, long fileSize,
UnixAoutSymbolTable symtab) throws IOException {
this.fileSize = fileSize;
this.relocations = new ArrayList<>();
this.symtab = symtab;
reader.setPointerIndex(fileOffset);
// read each relocation table entry
while (reader.getPointerIndex() < (fileOffset + fileSize)) {
long address = reader.readNextUnsignedInt();
long flags = reader.readNextUnsignedInt();
UnixAoutRelocation relocation =
new UnixAoutRelocation(address, flags, reader.isBigEndian());
relocations.add(relocation);
}
}
@Override
public Iterator<UnixAoutRelocation> iterator() {
return relocations.iterator();
}
@Override
public DataType toDataType() throws DuplicateNameException, IOException {
String dtName = "relocation_info";
Structure struct = new StructureDataType(new CategoryPath("/AOUT"), dtName, 0);
struct.setPackingEnabled(true);
try {
struct.add(DWORD, "r_address", null);
struct.addBitField(DWORD, 24, "r_symbolnum", null);
struct.addBitField(BYTE, 1, "r_pcrel", null);
struct.addBitField(BYTE, 2, "r_length", null);
struct.addBitField(BYTE, 1, "r_extern", null);
struct.addBitField(BYTE, 1, "r_baserel", null);
struct.addBitField(BYTE, 1, "r_jmptable", null);
struct.addBitField(BYTE, 1, "r_relative", null);
struct.addBitField(BYTE, 1, "r_copy", null);
}
catch (InvalidDataTypeException e) {
throw new RuntimeException(e);
}
return new ArrayDataType(struct, (int) (fileSize / ENTRY_SIZE), ENTRY_SIZE);
}
public void markup(Program program, MemoryBlock block)
throws CodeUnitInsertionException, DuplicateNameException, IOException {
Listing listing = program.getListing();
Data array = listing.createData(block.getStart(), toDataType());
int idx = 0;
for (UnixAoutRelocation relocation : this) {
String name = relocation.getSymbolName(symtab);
if (!StringUtils.isBlank(name)) {
Data structData = array.getComponent(idx);
structData.setComment(CommentType.EOL, name);
}
idx++;
}
}
}

View file

@ -0,0 +1,62 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.bin.format.unixaout;
import java.io.IOException;
import ghidra.app.util.bin.BinaryReader;
import ghidra.app.util.bin.StructConverter;
import ghidra.program.model.address.Address;
import ghidra.program.model.data.TerminatedStringDataType;
import ghidra.program.model.listing.*;
import ghidra.program.model.mem.MemoryBlock;
import ghidra.program.model.util.CodeUnitInsertionException;
public class UnixAoutStringTable {
private final BinaryReader reader;
private final long fileOffset;
public UnixAoutStringTable(BinaryReader reader, long fileOffset, long fileSize) {
this.reader = reader;
this.fileOffset = fileOffset;
}
public String readString(long stringOffset) {
if (fileOffset < 0) {
return null;
}
try {
return reader.readUtf8String(fileOffset + stringOffset).trim();
}
catch (IOException e) {
// FIXME
}
return null;
}
public void markup(Program program, MemoryBlock block) throws CodeUnitInsertionException {
Listing listing = program.getListing();
Address address = block.getStart();
listing.createData(address, StructConverter.DWORD);
int strlen = 4;
while ((address.getOffset() + strlen) < block.getEnd().getOffset()) {
address = address.add(strlen);
Data str = listing.createData(address, TerminatedStringDataType.dataType, -1);
strlen = str.getLength();
}
}
}

View file

@ -0,0 +1,66 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.bin.format.unixaout;
/**
* Represents the content of a single entry in the symbol table format used by
* the UNIX a.out executable.
*/
public class UnixAoutSymbol {
public enum SymbolType {
N_UNDF, N_ABS, N_TEXT, N_DATA, N_BSS, N_INDR, N_FN, N_STAB, UNKNOWN
}
public enum SymbolKind {
AUX_FUNC, AUX_OBJECT, AUX_LABEL, UNKNOWN
}
public long nameStringOffset;
public String name;
public SymbolType type;
public SymbolKind kind;
public byte otherByte;
public short desc;
public long value;
public boolean isExt;
public UnixAoutSymbol(long nameStringOffset, byte typeByte, byte otherByte, short desc,
long value) {
this.nameStringOffset = nameStringOffset;
this.otherByte = otherByte;
this.desc = desc;
this.value = value;
this.isExt = (typeByte & 1) == 1;
this.type = switch (typeByte & 0xfe) {
case 0 -> SymbolType.N_UNDF;
case 2 -> SymbolType.N_ABS;
case 4 -> SymbolType.N_TEXT;
case 6 -> SymbolType.N_DATA;
case 8 -> SymbolType.N_BSS;
case 10 -> SymbolType.N_INDR;
default -> (typeByte & 0xfe) >= 0x20 ? SymbolType.N_STAB : SymbolType.UNKNOWN;
};
this.kind = switch (otherByte & 0x0f) {
case 1 -> SymbolKind.AUX_OBJECT;
case 2 -> SymbolKind.AUX_FUNC;
case 3 -> SymbolKind.AUX_LABEL;
default -> SymbolKind.UNKNOWN;
};
}
}

View file

@ -0,0 +1,114 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.bin.format.unixaout;
import java.io.IOException;
import java.util.*;
import org.apache.commons.lang3.StringUtils;
import ghidra.app.util.bin.BinaryReader;
import ghidra.app.util.bin.StructConverter;
import ghidra.app.util.importer.MessageLog;
import ghidra.app.util.opinion.UnixAoutProgramLoader;
import ghidra.program.model.data.*;
import ghidra.program.model.listing.*;
import ghidra.program.model.mem.MemoryBlock;
import ghidra.program.model.util.CodeUnitInsertionException;
import ghidra.util.exception.DuplicateNameException;
public class UnixAoutSymbolTable implements Iterable<UnixAoutSymbol>, StructConverter {
private static final int ENTRY_SIZE = 12;
private final long fileSize;
private List<UnixAoutSymbol> symbols;
public UnixAoutSymbolTable(BinaryReader reader, long fileOffset, long fileSize,
UnixAoutStringTable strtab, MessageLog log) throws IOException {
this.fileSize = fileSize;
this.symbols = new ArrayList<>();
reader.setPointerIndex(fileOffset);
int idx = 0;
// read each symbol table entry
while (reader.getPointerIndex() < (fileOffset + fileSize)) {
long strOffset = reader.readNextUnsignedInt();
byte typeByte = reader.readNextByte();
byte otherByte = reader.readNextByte();
short desc = reader.readNextShort();
long value = reader.readNextUnsignedInt();
UnixAoutSymbol symbol = new UnixAoutSymbol(strOffset, typeByte, otherByte, desc, value);
if (symbol.type == UnixAoutSymbol.SymbolType.UNKNOWN) {
log.appendMsg(UnixAoutProgramLoader.dot_symtab,
String.format("Unknown symbol type 0x%02x at symbol index %d", typeByte, idx));
}
symbols.add(symbol);
idx++;
}
// lookup and set each string table symbol name
for (UnixAoutSymbol symbol : this) {
symbol.name = strtab.readString(symbol.nameStringOffset);
}
}
@Override
public Iterator<UnixAoutSymbol> iterator() {
return symbols.iterator();
}
@Override
public DataType toDataType() throws DuplicateNameException, IOException {
String dtName = "nlist";
Structure struct = new StructureDataType(new CategoryPath("/AOUT"), dtName, 0);
struct.add(DWORD, "n_strx", null);
struct.add(BYTE, "n_type", null);
struct.add(BYTE, "n_other", null);
struct.add(WORD, "n_desc", null);
struct.add(DWORD, "n_value", null);
return new ArrayDataType(struct, (int) (fileSize / ENTRY_SIZE), ENTRY_SIZE);
}
public UnixAoutSymbol get(int symbolNum) {
return symbols.get(symbolNum);
}
public long size() {
return symbols.size();
}
public void markup(Program program, MemoryBlock block)
throws CodeUnitInsertionException, DuplicateNameException, IOException {
Listing listing = program.getListing();
Data array = listing.createData(block.getStart(), toDataType());
int idx = 0;
for (UnixAoutSymbol symbol : this) {
if (!StringUtils.isBlank(symbol.name)) {
Data structData = array.getComponent(idx);
if (structData != null) {
structData.setComment(CommentType.EOL, symbol.name);
}
}
idx++;
}
}
}

View file

@ -0,0 +1,165 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.opinion;
import java.io.IOException;
import java.util.*;
import ghidra.app.util.Option;
import ghidra.app.util.OptionException;
import ghidra.app.util.bin.ByteProvider;
import ghidra.app.util.bin.format.unixaout.UnixAoutHeader;
import ghidra.app.util.importer.MessageLog;
import ghidra.framework.model.DomainObject;
import ghidra.program.model.address.*;
import ghidra.program.model.lang.LanguageCompilerSpecPair;
import ghidra.program.model.listing.Program;
import ghidra.util.exception.CancelledException;
import ghidra.util.task.TaskMonitor;
/**
* A {@link Loader} for processing UNIX-style A.out executables
* <p>
* This style was also used by UNIX-like systems such as SunOS, BSD, and VxWorks, as well as some
* early distributions of Linux. Although there do exist implementations of A.out with 64-bit and \
* GNU extensions, this loader does not currently support them.
*
* @see <a href="https://wiki.osdev.org/A.out">OSDev.org A.out</a>
* @see <a href="https://man.freebsd.org/cgi/man.cgi?a.out(5)">FreeBSD manpage</a>
*/
public class UnixAoutLoader extends AbstractProgramWrapperLoader {
public final static String UNIX_AOUT_NAME = "UNIX A.out";
public static final String OPTION_NAME_BASE_ADDR = "Base Address";
@Override
public Collection<LoadSpec> findSupportedLoadSpecs(ByteProvider provider) throws IOException {
List<LoadSpec> loadSpecs = new ArrayList<>();
// Attempt to parse the header as both little- and big-endian.
// It is likely that only one of these will produce sensible values.
UnixAoutHeader hdrBE = new UnixAoutHeader(provider, false);
UnixAoutHeader hdrLE = new UnixAoutHeader(provider, true);
boolean beValid = false;
if (hdrBE.isValid()) {
final String lang = hdrBE.getLanguageSpec();
final String comp = hdrBE.getCompilerSpec();
loadSpecs.add(new LoadSpec(this, 0, new LanguageCompilerSpecPair(lang, comp), true));
beValid = true;
}
if (hdrLE.isValid()) {
final String lang = hdrLE.getLanguageSpec();
final String comp = hdrLE.getCompilerSpec();
loadSpecs
.add(new LoadSpec(this, 0, new LanguageCompilerSpecPair(lang, comp), !beValid));
}
return loadSpecs;
}
@Override
protected void load(ByteProvider provider, LoadSpec loadSpec, List<Option> options,
Program program, TaskMonitor monitor, MessageLog log)
throws CancelledException, IOException {
final boolean isLittleEndian = !program.getLanguage().isBigEndian();
final UnixAoutHeader header = new UnixAoutHeader(provider, isLittleEndian);
final UnixAoutProgramLoader loader =
new UnixAoutProgramLoader(program, header, monitor, log);
loader.loadAout(getBaseAddrOffset(options));
}
@Override
public String validateOptions(ByteProvider provider, LoadSpec loadSpec, List<Option> options,
Program program) {
Address baseAddr = null;
for (Option option : options) {
String optName = option.getName();
try {
if (optName.equals(OPTION_NAME_BASE_ADDR)) {
baseAddr = (Address) option.getValue();
}
}
catch (Exception e) {
if (e instanceof OptionException) {
return e.getMessage();
}
return "Invalid value for " + optName + " - " + option.getValue();
}
}
if (baseAddr == null) {
return "Invalid base address";
}
return super.validateOptions(provider, loadSpec, options, program);
}
@Override
public List<Option> getDefaultOptions(ByteProvider provider, LoadSpec loadSpec,
DomainObject domainObject, boolean loadIntoProgram) {
Address baseAddr = null;
if (domainObject instanceof Program) {
Program program = (Program) domainObject;
AddressFactory addressFactory = program.getAddressFactory();
if (addressFactory != null) {
AddressSpace defaultAddressSpace = addressFactory.getDefaultAddressSpace();
if (defaultAddressSpace != null) {
baseAddr = defaultAddressSpace.getAddress(0);
}
}
}
List<Option> list = new ArrayList<Option>();
list.add(new Option(OPTION_NAME_BASE_ADDR, baseAddr, Address.class,
Loader.COMMAND_LINE_ARG_PREFIX + "-baseAddr"));
list.addAll(super.getDefaultOptions(provider, loadSpec, domainObject, loadIntoProgram));
return list;
}
@Override
public String getName() {
return UNIX_AOUT_NAME;
}
/**
* Retrieves the Address offset given in the "Base Address" option.
* Returns 0 if the option could not be found or contains an invalid value.
*/
private long getBaseAddrOffset(List<Option> options) {
Address baseAddr = null;
if (options != null) {
for (Option option : options) {
String optName = option.getName();
if (optName.equals(OPTION_NAME_BASE_ADDR)) {
baseAddr = (Address) option.getValue();
}
}
}
long offset = 0;
if (baseAddr != null) {
offset = baseAddr.getOffset();
}
return offset;
}
}

View file

@ -0,0 +1,473 @@
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ghidra.app.util.opinion;
import java.io.IOException;
import java.io.InputStream;
import java.util.*;
import ghidra.app.util.MemoryBlockUtils;
import ghidra.app.util.bin.ByteProvider;
import ghidra.app.util.bin.format.unixaout.*;
import ghidra.app.util.importer.MessageLog;
import ghidra.program.database.function.OverlappingFunctionException;
import ghidra.program.database.mem.FileBytes;
import ghidra.program.model.address.*;
import ghidra.program.model.listing.FunctionManager;
import ghidra.program.model.listing.Program;
import ghidra.program.model.mem.*;
import ghidra.program.model.reloc.Relocation.Status;
import ghidra.program.model.reloc.RelocationTable;
import ghidra.program.model.symbol.*;
import ghidra.program.model.util.CodeUnitInsertionException;
import ghidra.util.DataConverter;
import ghidra.util.MonitoredInputStream;
import ghidra.util.exception.*;
import ghidra.util.task.TaskMonitor;
public class UnixAoutProgramLoader {
private final int EXTERNAL_BLOCK_MIN_SIZE = 0x10000; // 64K
public final static String dot_text = ".text";
public final static String dot_data = ".data";
public final static String dot_bss = ".bss";
public final static String dot_rel_text = ".rel.text";
public final static String dot_rel_data = ".rel.data";
public final static String dot_strtab = ".strtab";
public final static String dot_symtab = ".symtab";
private final Program program;
private final TaskMonitor monitor;
private final MessageLog log;
private final UnixAoutHeader header;
private FileBytes fileBytes;
private UnixAoutRelocationTable relText;
private UnixAoutRelocationTable relData;
private UnixAoutSymbolTable symtab;
private UnixAoutStringTable strtab;
private Map<String, Long> possibleBssSymbols = new HashMap<>();
private int extraBssSize = 0;
private int undefinedSymbolCount = 0;
public UnixAoutProgramLoader(Program program, UnixAoutHeader header, TaskMonitor monitor,
MessageLog log) {
this.program = program;
this.monitor = monitor;
this.log = log;
this.header = header;
}
public void loadAout(long baseAddr) throws IOException, CancelledException {
log.appendMsg(String.format("----- Loading %s -----",
header.getReader().getByteProvider().getAbsolutePath()));
log.appendMsg(String.format("Found a.out type %s.", header.getExecutableType().name()));
ByteProvider byteProvider = header.getReader().getByteProvider();
try {
buildTables(byteProvider);
preprocessSymbolTable();
loadSections(baseAddr, byteProvider);
loadSymbols();
applyRelocations(baseAddr, program.getMemory().getBlock(dot_text), relText);
applyRelocations(baseAddr, program.getMemory().getBlock(dot_data), relData);
markupSections();
}
catch (AddressOverflowException | InvalidInputException | CodeUnitInsertionException
| DuplicateNameException
| MemoryAccessException e) {
throw new RuntimeException(e);
}
}
private void buildTables(ByteProvider byteProvider) throws IOException {
if (header.getStrSize() > 0) {
strtab = new UnixAoutStringTable(header.getReader(), header.getStrOffset(),
header.getStrSize());
}
if (header.getSymSize() > 0) {
symtab = new UnixAoutSymbolTable(header.getReader(), header.getSymOffset(),
header.getSymSize(),
strtab, log);
}
if (header.getTextRelocSize() > 0) {
relText = new UnixAoutRelocationTable(header.getReader(), header.getTextRelocOffset(),
header.getTextRelocSize(), symtab);
}
if (header.getDataRelocSize() > 0) {
relData = new UnixAoutRelocationTable(header.getReader(), header.getDataRelocOffset(),
header.getDataRelocSize(), symtab);
}
}
private void preprocessSymbolTable() {
if (symtab == null) {
return;
}
boolean foundStabs = false;
for (UnixAoutSymbol symbol : symtab) {
switch (symbol.type) {
case N_UNDF:
if (symbol.value > 0) {
// This is a special case given by the A.out spec: if the linker cannot find
// this symbol in any of the other binary files, then the fact that it is
// marked as N_UNDF but has a non-zero value means that its value should be
// interpreted as a size, and the linker should reserve space in .bss for it.
possibleBssSymbols.put(symbol.name, symbol.value);
}
else {
undefinedSymbolCount++;
}
break;
case N_STAB:
if (!foundStabs) {
foundStabs = true;
log.appendMsg(dot_symtab, "File contains STABS.");
}
break;
default:
break;
}
}
for (Long value : possibleBssSymbols.values()) {
extraBssSize += value;
}
if (extraBssSize > 0) {
log.appendMsg(dot_bss,
String.format("Added %d bytes for N_UNDF symbols.", extraBssSize));
}
}
private void loadSections(long baseAddr, ByteProvider byteProvider)
throws AddressOverflowException, IOException, CancelledException {
monitor.setMessage("Loading FileBytes...");
try (InputStream fileIn = byteProvider.getInputStream(0);
MonitoredInputStream mis = new MonitoredInputStream(fileIn, monitor)) {
// Indicate that cleanup is not neccessary for cancelled import operation.
mis.setCleanupOnCancel(false);
fileBytes = program.getMemory()
.createFileBytes(byteProvider.getName(), 0, byteProvider.length(), mis,
monitor);
}
final AddressSpace defaultAddressSpace =
program.getAddressFactory().getDefaultAddressSpace();
final Address otherAddress = AddressSpace.OTHER_SPACE.getMinAddress();
Address address;
Address nextFreeAddress = defaultAddressSpace.getAddress(0);
if (header.getTextOffset() != 0 || header.getTextSize() < 32) {
MemoryBlockUtils.createInitializedBlock(program, true, "_aoutHeader", otherAddress,
fileBytes, 0, 32, null, null, false, false, false, log);
}
if (header.getTextSize() > 0) {
address = defaultAddressSpace.getAddress(baseAddr + header.getTextAddr());
nextFreeAddress = address.add(header.getTextSize());
MemoryBlockUtils.createInitializedBlock(program, false, dot_text, address, fileBytes,
header.getTextOffset(), header.getTextSize(), null, null, true, true, true, log);
}
if (header.getDataSize() > 0) {
address = defaultAddressSpace.getAddress(baseAddr + header.getDataAddr());
nextFreeAddress = address.add(header.getDataSize());
MemoryBlockUtils.createInitializedBlock(program, false, dot_data, address, fileBytes,
header.getDataOffset(), header.getDataSize(), null, null, true, true, false, log);
}
if ((header.getBssSize() + extraBssSize) > 0) {
address = defaultAddressSpace.getAddress(baseAddr + header.getBssAddr());
nextFreeAddress = address.add(header.getBssSize() + extraBssSize);
MemoryBlockUtils.createUninitializedBlock(program, false, dot_bss, address,
header.getBssSize() + extraBssSize, null, null, true, true, false, log);
}
if (undefinedSymbolCount > 0) {
int externalSectionSize = undefinedSymbolCount * 4;
if (externalSectionSize < EXTERNAL_BLOCK_MIN_SIZE) {
externalSectionSize = EXTERNAL_BLOCK_MIN_SIZE;
}
MemoryBlock externalBlock = MemoryBlockUtils.createUninitializedBlock(program, false,
MemoryBlock.EXTERNAL_BLOCK_NAME, nextFreeAddress, externalSectionSize, null, null,
false, false, false, log);
if (externalBlock != null) {
externalBlock.setArtificial(true);
}
}
if (header.getStrSize() > 0) {
MemoryBlockUtils.createInitializedBlock(program, true, dot_strtab, otherAddress,
fileBytes, header.getStrOffset(), header.getStrSize(), null, null, false, false,
false, log);
}
if (header.getSymSize() > 0) {
MemoryBlockUtils.createInitializedBlock(program, true, dot_symtab, otherAddress,
fileBytes, header.getSymOffset(), header.getSymSize(), null, null, false, false,
false, log);
}
if (header.getTextRelocSize() > 0) {
MemoryBlockUtils.createInitializedBlock(program, true, dot_rel_text, otherAddress,
fileBytes, header.getTextRelocOffset(), header.getTextRelocSize(), null, null,
false, false, false, log);
}
if (header.getDataRelocSize() > 0) {
MemoryBlockUtils.createInitializedBlock(program, true, dot_rel_data, otherAddress,
fileBytes, header.getDataRelocOffset(), header.getDataRelocSize(), null, null,
false, false, false, log);
}
}
private void loadSymbols() throws InvalidInputException {
monitor.setMessage("Loading symbols...");
if (symtab == null) {
return;
}
SymbolTable symbolTable = program.getSymbolTable();
FunctionManager functionManager = program.getFunctionManager();
MemoryBlock textBlock = program.getMemory().getBlock(dot_text);
MemoryBlock dataBlock = program.getMemory().getBlock(dot_data);
MemoryBlock bssBlock = program.getMemory().getBlock(dot_bss);
MemoryBlock externalBlock = program.getMemory().getBlock(MemoryBlock.EXTERNAL_BLOCK_NAME);
int extraBssOffset = 0;
int undefinedSymbolIdx = 0;
List<String> aliases = new ArrayList<>();
for (UnixAoutSymbol symbol : symtab) {
Address address = null;
MemoryBlock block = null;
switch (symbol.type) {
case N_TEXT:
address = textBlock != null ? textBlock.getStart().add(symbol.value) : null;
block = textBlock;
break;
case N_DATA:
address = dataBlock != null ? dataBlock.getStart().add(symbol.value) : null;
block = dataBlock;
break;
case N_BSS:
address = bssBlock != null ? bssBlock.getStart().add(symbol.value) : null;
block = bssBlock;
break;
case N_UNDF:
if (symbol.value > 0) {
address = bssBlock.getEnd().add(extraBssOffset);
block = bssBlock;
extraBssOffset += symbol.value;
}
else {
address = externalBlock.getStart().add(undefinedSymbolIdx++ * 4);
block = externalBlock;
symbolTable.addExternalEntryPoint(address);
}
break;
case N_INDR:
aliases.add(symbol.name);
break;
case N_ABS:
case N_FN:
case N_STAB:
case UNKNOWN:
aliases.clear();
break;
}
if (address == null || block == null) {
continue;
}
switch (symbol.kind) {
case AUX_FUNC:
try {
functionManager.createFunction(symbol.name, address,
new AddressSet(address),
SourceType.IMPORTED);
}
catch (OverlappingFunctionException e) {
log.appendMsg(block.getName(), String.format(
"Failed to create function %s @ %s, creating symbol instead.",
symbol.name, address));
symbolTable.createLabel(address, symbol.name, SourceType.IMPORTED);
}
break;
default:
Symbol label =
symbolTable.createLabel(address, symbol.name, SourceType.IMPORTED);
if (symbol.isExt) {
label.setPrimary();
}
break;
}
for (String alias : aliases) {
symbolTable.createLabel(address, alias, SourceType.IMPORTED);
}
aliases.clear();
}
}
private void applyRelocations(long baseAddr, MemoryBlock targetBlock,
UnixAoutRelocationTable relTable) throws MemoryAccessException {
if (targetBlock == null || relTable == null) {
return;
}
monitor.setMessage(
String.format("Applying relocations for section %s...", targetBlock.getName()));
DataConverter dc = DataConverter.getInstance(program.getLanguage().isBigEndian());
SymbolTable symbolTable = program.getSymbolTable();
RelocationTable relocationTable = program.getRelocationTable();
Memory memory = program.getMemory();
MemoryBlock textBlock = memory.getBlock(dot_text);
MemoryBlock dataBlock = memory.getBlock(dot_data);
MemoryBlock bssBlock = memory.getBlock(dot_bss);
int idx = 0;
for (UnixAoutRelocation relocation : relTable) {
Address targetAddress = targetBlock.getStart().add(relocation.address);
byte originalBytes[] = new byte[relocation.pointerLength];
targetBlock.getBytes(targetAddress, originalBytes);
long addend = dc.getValue(originalBytes, 0, relocation.pointerLength);
Long value = null;
Status status = Status.FAILURE;
if (relocation.baseRelative || relocation.jmpTable || relocation.relative ||
relocation.copy) {
status = Status.UNSUPPORTED;
}
else {
if (relocation.extern == true && relocation.symbolNum < symtab.size()) {
SymbolIterator symbolIterator =
symbolTable.getSymbols(symtab.get(relocation.symbolNum).name);
if (symbolIterator.hasNext()) {
value = symbolIterator.next().getAddress().getOffset();
}
}
else if (relocation.extern == false) {
switch (relocation.symbolNum) {
case 4:
value = textBlock.getStart().getOffset();
break;
case 6:
value = dataBlock.getStart().getOffset();
break;
case 8:
value = bssBlock.getStart().getOffset();
break;
}
}
}
if (value != null) {
if (relocation.pcRelativeAddressing) {
// Addend is relative to start of target section.
value -= targetBlock.getStart().getOffset();
}
// Apply relocation.
byte newBytes[] = new byte[relocation.pointerLength];
dc.putValue(value + addend, relocation.pointerLength, newBytes, 0);
targetBlock.putBytes(targetAddress, newBytes);
status = Status.APPLIED;
}
if (status != Status.APPLIED) {
log.appendMsg(targetBlock.getName(),
String.format("Failed to apply relocation entry %d with type 0x%02x @ %s.", idx,
relocation.flags, targetAddress));
}
relocationTable.add(targetAddress, status, relocation.flags,
new long[] { relocation.symbolNum },
originalBytes, relocation.getSymbolName(symtab));
idx++;
}
}
private void markupSections() throws InvalidInputException, CodeUnitInsertionException,
DuplicateNameException, IOException {
final AddressSpace defaultAddressSpace =
program.getAddressFactory().getDefaultAddressSpace();
final FunctionManager functionManager = program.getFunctionManager();
final SymbolTable symbolTable = program.getSymbolTable();
monitor.setMessage("Marking up header...");
// Markup header.
Address headerAddress = null;
MemoryBlock aoutHeader = program.getMemory().getBlock("_aoutHeader");
MemoryBlock textBlock = program.getMemory().getBlock(dot_text);
if (aoutHeader != null) {
headerAddress = aoutHeader.getStart();
}
else if (textBlock != null && header.getTextOffset() == 0 && header.getTextSize() >= 32) {
headerAddress = textBlock.getStart();
}
if (headerAddress != null) {
header.markup(program, headerAddress);
}
// Markup entrypoint.
if (header.getEntryPoint() != 0) {
Address address = defaultAddressSpace.getAddress(header.getEntryPoint());
try {
functionManager.createFunction("entry", address, new AddressSet(address),
SourceType.IMPORTED);
}
catch (OverlappingFunctionException e) {
log.appendMsg(dot_text,
"Failed to create entrypoint function @ %s, creating symbol instead.");
symbolTable.createLabel(address, "entry", SourceType.IMPORTED);
}
}
monitor.setMessage("Marking up relocation tables...");
MemoryBlock relTextBlock = program.getMemory().getBlock(dot_rel_text);
if (relTextBlock != null) {
relText.markup(program, relTextBlock);
}
MemoryBlock relDataBlock = program.getMemory().getBlock(dot_rel_data);
if (relDataBlock != null) {
relData.markup(program, relDataBlock);
}
monitor.setMessage("Marking up symbol table...");
MemoryBlock symtabBlock = program.getMemory().getBlock(dot_symtab);
if (symtabBlock != null) {
symtab.markup(program, symtabBlock);
}
monitor.setMessage("Marking up string table...");
MemoryBlock strtabBlock = program.getMemory().getBlock(dot_strtab);
if (strtabBlock != null) {
strtab.markup(program, strtabBlock);
}
}
}