Begin REL analysis & rework lots of code to be section-address aware

This commit is contained in:
Luke Street 2023-08-17 22:09:45 -04:00
parent 347889773d
commit 5843ee021e
27 changed files with 1813 additions and 1227 deletions

View File

@ -29,8 +29,10 @@ impl AnalyzerState {
if end == 0 { if end == 0 {
continue; continue;
} }
let section_index = let (section_index, _) = obj
obj.section_for(start..end).context("Failed to locate section for function")?.index; .sections
.with_range(start..end)
.context("Failed to locate section for function")?;
obj.add_symbol( obj.add_symbol(
ObjSymbol { ObjSymbol {
name: format!("fn_{:08X}", start), name: format!("fn_{:08X}", start),
@ -48,10 +50,10 @@ impl AnalyzerState {
)?; )?;
} }
for (&addr, &size) in &self.jump_tables { for (&addr, &size) in &self.jump_tables {
let section_index = obj let (section_index, _) = obj
.section_for(addr..addr + size) .sections
.context("Failed to locate section for jump table")? .with_range(addr..addr + size)
.index; .context("Failed to locate section for jump table")?;
obj.add_symbol( obj.add_symbol(
ObjSymbol { ObjSymbol {
name: format!("jumptable_{:08X}", addr), name: format!("jumptable_{:08X}", addr),
@ -89,7 +91,7 @@ impl AnalyzerState {
} }
} }
// Also check the beginning of every code section // Also check the beginning of every code section
for section in obj.sections.iter().filter(|s| s.kind == ObjSectionKind::Code) { for (_, section) in obj.sections.by_kind(ObjSectionKind::Code) {
self.function_entries.insert(section.address as u32); self.function_entries.insert(section.address as u32);
} }
@ -266,11 +268,7 @@ impl AnalyzerState {
fn detect_new_functions(&mut self, obj: &ObjInfo) -> Result<bool> { fn detect_new_functions(&mut self, obj: &ObjInfo) -> Result<bool> {
let mut found_new = false; let mut found_new = false;
for section in &obj.sections { for (_, section) in obj.sections.by_kind(ObjSectionKind::Code) {
if section.kind != ObjSectionKind::Code {
continue;
}
let section_start = section.address as u32; let section_start = section.address as u32;
let section_end = (section.address + section.size) as u32; let section_end = (section.address + section.size) as u32;
let mut iter = self.function_bounds.range(section_start..section_end).peekable(); let mut iter = self.function_bounds.range(section_start..section_end).peekable();
@ -280,7 +278,7 @@ impl AnalyzerState {
if first_end == 0 || first_end > second_begin { if first_end == 0 || first_end > second_begin {
continue; continue;
} }
let addr = match skip_alignment(obj, first_end, second_begin) { let addr = match skip_alignment(section, first_end, second_begin) {
Some(addr) => addr, Some(addr) => addr,
None => continue, None => continue,
}; };
@ -298,7 +296,7 @@ impl AnalyzerState {
} }
(Some((&last_begin, &last_end)), None) => { (Some((&last_begin, &last_end)), None) => {
if last_end > 0 && last_end < section_end { if last_end > 0 && last_end < section_end {
let addr = match skip_alignment(obj, last_end, section_end) { let addr = match skip_alignment(section, last_end, section_end) {
Some(addr) => addr, Some(addr) => addr,
None => continue, None => continue,
}; };
@ -329,7 +327,7 @@ pub fn locate_sda_bases(obj: &mut ObjInfo) -> Result<bool> {
executor.push(obj.entry as u32, VM::new(), false); executor.push(obj.entry as u32, VM::new(), false);
let result = executor.run( let result = executor.run(
obj, obj,
|ExecCbData { executor, vm, result, section: _, ins, block_start: _ }| { |ExecCbData { executor, vm, result, section_index: _, section: _, ins, block_start: _ }| {
match result { match result {
StepResult::Continue | StepResult::LoadStore { .. } => { StepResult::Continue | StepResult::LoadStore { .. } => {
return Ok(ExecCbResult::Continue); return Ok(ExecCbResult::Continue);

View File

@ -17,8 +17,8 @@ struct VisitedAddresses {
impl VisitedAddresses { impl VisitedAddresses {
pub fn new(obj: &ObjInfo) -> Self { pub fn new(obj: &ObjInfo) -> Self {
let mut inner = Vec::with_capacity(obj.sections.len()); let mut inner = Vec::with_capacity(obj.sections.count());
for section in &obj.sections { for (_, section) in obj.sections.iter() {
if section.kind == ObjSectionKind::Code { if section.kind == ObjSectionKind::Code {
let size = (section.size / 4) as usize; let size = (section.size / 4) as usize;
inner.push(FixedBitSet::with_capacity(size)); inner.push(FixedBitSet::with_capacity(size));
@ -30,17 +30,17 @@ impl VisitedAddresses {
Self { inner } Self { inner }
} }
pub fn contains(&self, section: &ObjSection, address: u32) -> bool { pub fn contains(&self, section_index: usize, section_address: u32, address: u32) -> bool {
self.inner[section.index].contains(Self::bit_for(section, address)) self.inner[section_index].contains(Self::bit_for(section_address, address))
} }
pub fn insert(&mut self, section: &ObjSection, address: u32) { pub fn insert(&mut self, section_index: usize, section_address: u32, address: u32) {
self.inner[section.index].insert(Self::bit_for(section, address)); self.inner[section_index].insert(Self::bit_for(section_address, address));
} }
#[inline] #[inline]
fn bit_for(section: &ObjSection, address: u32) -> usize { fn bit_for(section_address: u32, address: u32) -> usize {
((address as u64 - section.address) / 4) as usize ((address - section_address) / 4) as usize
} }
} }
@ -59,6 +59,7 @@ pub struct ExecCbData<'a> {
pub executor: &'a mut Executor, pub executor: &'a mut Executor,
pub vm: &'a mut VM, pub vm: &'a mut VM,
pub result: StepResult, pub result: StepResult,
pub section_index: usize,
pub section: &'a ObjSection, pub section: &'a ObjSection,
pub ins: &'a Ins, pub ins: &'a Ins,
pub block_start: u32, pub block_start: u32,
@ -79,8 +80,8 @@ impl Executor {
pub fn run<Cb, R>(&mut self, obj: &ObjInfo, mut cb: Cb) -> Result<Option<R>> pub fn run<Cb, R>(&mut self, obj: &ObjInfo, mut cb: Cb) -> Result<Option<R>>
where Cb: FnMut(ExecCbData) -> Result<ExecCbResult<R>> { where Cb: FnMut(ExecCbData) -> Result<ExecCbResult<R>> {
while let Some(mut state) = self.vm_stack.pop() { while let Some(mut state) = self.vm_stack.pop() {
let section = match obj.section_at(state.address) { let (section_index, section) = match obj.sections.at_address(state.address) {
Ok(section) => section, Ok(ret) => ret,
Err(e) => { Err(e) => {
log::error!("{}", e); log::error!("{}", e);
// return Ok(None); // return Ok(None);
@ -93,13 +94,14 @@ impl Executor {
} }
// Already visited block // Already visited block
if self.visited.contains(section, state.address) { let section_address = section.address as u32;
if self.visited.contains(section_index, section_address, state.address) {
continue; continue;
} }
let mut block_start = state.address; let mut block_start = state.address;
loop { loop {
self.visited.insert(section, state.address); self.visited.insert(section_index, section_address, state.address);
let ins = match disassemble(section, state.address) { let ins = match disassemble(section, state.address) {
Some(ins) => ins, Some(ins) => ins,
@ -110,6 +112,7 @@ impl Executor {
executor: self, executor: self,
vm: &mut state.vm, vm: &mut state.vm,
result, result,
section_index,
section, section,
ins: &ins, ins: &ins,
block_start, block_start,
@ -118,7 +121,7 @@ impl Executor {
state.address += 4; state.address += 4;
} }
ExecCbResult::Jump(addr) => { ExecCbResult::Jump(addr) => {
if self.visited.contains(section, addr) { if self.visited.contains(section_index, section_address, addr) {
break; break;
} }
block_start = addr; block_start = addr;
@ -140,7 +143,7 @@ impl Executor {
} }
} }
pub fn visited(&self, section: &ObjSection, address: u32) -> bool { pub fn visited(&self, section_index: usize, section_address: u32, address: u32) -> bool {
self.visited.contains(section, address) self.visited.contains(section_index, section_address, address)
} }
} }

View File

@ -3,7 +3,10 @@ use std::{collections::BTreeSet, num::NonZeroU32};
use anyhow::{Context, Result}; use anyhow::{Context, Result};
use ppc750cl::Ins; use ppc750cl::Ins;
use crate::obj::{ObjInfo, ObjSection, ObjSectionKind}; use crate::{
array_ref,
obj::{ObjInfo, ObjSection, ObjSectionKind},
};
pub mod cfa; pub mod cfa;
pub mod executor; pub mod executor;
@ -23,11 +26,11 @@ pub fn read_u32(data: &[u8], address: u32, section_address: u32) -> Option<u32>
if data.len() < offset + 4 { if data.len() < offset + 4 {
return None; return None;
} }
Some(u32::from_be_bytes(data[offset..offset + 4].try_into().unwrap())) Some(u32::from_be_bytes(*array_ref!(data, offset, 4)))
} }
fn is_valid_jump_table_addr(obj: &ObjInfo, addr: u32) -> bool { fn is_valid_jump_table_addr(obj: &ObjInfo, addr: u32) -> bool {
matches!(obj.section_at(addr), Ok(section) if section.kind != ObjSectionKind::Bss) matches!(obj.sections.at_address(addr), Ok((_, section)) if section.kind != ObjSectionKind::Bss)
} }
fn get_jump_table_entries( fn get_jump_table_entries(
@ -38,7 +41,7 @@ fn get_jump_table_entries(
function_start: u32, function_start: u32,
function_end: u32, function_end: u32,
) -> Result<(Vec<u32>, u32)> { ) -> Result<(Vec<u32>, u32)> {
let section = obj.section_at(addr).with_context(|| { let (_, section) = obj.sections.at_address(addr).with_context(|| {
format!("Failed to get jump table entries @ {:#010X} size {:?}", addr, size) format!("Failed to get jump table entries @ {:#010X} size {:?}", addr, size)
})?; })?;
let offset = (addr as u64 - section.address) as usize; let offset = (addr as u64 - section.address) as usize;
@ -90,9 +93,9 @@ pub fn uniq_jump_table_entries(
Ok((BTreeSet::from_iter(entries.iter().cloned().filter(|&addr| addr != 0)), size)) Ok((BTreeSet::from_iter(entries.iter().cloned().filter(|&addr| addr != 0)), size))
} }
pub fn skip_alignment(obj: &ObjInfo, mut addr: u32, end: u32) -> Option<u32> { pub fn skip_alignment(section: &ObjSection, mut addr: u32, end: u32) -> Option<u32> {
let mut data = match obj.section_data(addr, end) { let mut data = match section.data_range(addr, end) {
Ok((_, data)) => data, Ok(data) => data,
Err(_) => return None, Err(_) => return None,
}; };
loop { loop {

View File

@ -1,16 +1,18 @@
use anyhow::Result; use anyhow::Result;
use crate::obj::{ use crate::{
split::is_linker_generated_label, ObjDataKind, ObjInfo, ObjSectionKind, ObjSymbolKind, obj::{ObjDataKind, ObjInfo, ObjSectionKind, ObjSymbolKind},
util::split::is_linker_generated_label,
}; };
pub fn detect_object_boundaries(obj: &mut ObjInfo) -> Result<()> { pub fn detect_object_boundaries(obj: &mut ObjInfo) -> Result<()> {
for section in obj.sections.iter().filter(|s| s.kind != ObjSectionKind::Code) { for (section_index, section) in
let section_start = section.address as u32; obj.sections.iter_mut().filter(|(_, s)| s.kind != ObjSectionKind::Code)
{
let section_end = (section.address + section.size) as u32; let section_end = (section.address + section.size) as u32;
let mut replace_symbols = vec![]; let mut replace_symbols = vec![];
for (idx, symbol) in obj.symbols.for_range(section_start..section_end) { for (idx, symbol) in obj.symbols.for_section(section_index) {
let mut symbol = symbol.clone(); let mut symbol = symbol.clone();
if is_linker_generated_label(&symbol.name) { if is_linker_generated_label(&symbol.name) {
continue; continue;
@ -25,7 +27,7 @@ pub fn detect_object_boundaries(obj: &mut ObjInfo) -> Result<()> {
if !symbol.size_known { if !symbol.size_known {
let next_addr = obj let next_addr = obj
.symbols .symbols
.for_range(symbol.address as u32 + 1..section_end) .for_section_range(section_index, symbol.address as u32 + 1..)
.next() .next()
.map_or(section_end, |(_, symbol)| symbol.address as u32); .map_or(section_end, |(_, symbol)| symbol.address as u32);
let new_size = next_addr - symbol.address as u32; let new_size = next_addr - symbol.address as u32;
@ -35,9 +37,9 @@ pub fn detect_object_boundaries(obj: &mut ObjInfo) -> Result<()> {
(2 | 4, 2) => expected_size, (2 | 4, 2) => expected_size,
(..=8, 1 | 2 | 4) => { (..=8, 1 | 2 | 4) => {
// alignment to double // alignment to double
if obj.symbols.at_address(next_addr).any(|(_, sym)| sym.data_kind == ObjDataKind::Double) if obj.symbols.at_section_address(section_index, next_addr).any(|(_, sym)| sym.data_kind == ObjDataKind::Double)
// If we're at a TU boundary, we can assume it's just padding // If we're at a TU boundary, we can assume it's just padding
|| obj.splits.contains_key(&(symbol.address as u32 + new_size)) || section.splits.has_split_at(symbol.address as u32 + new_size)
{ {
expected_size expected_size
} else { } else {
@ -63,10 +65,10 @@ pub fn detect_object_boundaries(obj: &mut ObjInfo) -> Result<()> {
pub fn detect_strings(obj: &mut ObjInfo) -> Result<()> { pub fn detect_strings(obj: &mut ObjInfo) -> Result<()> {
let mut symbols_set = Vec::<(usize, ObjDataKind, usize)>::new(); let mut symbols_set = Vec::<(usize, ObjDataKind, usize)>::new();
for section in obj for (section_index, section) in obj
.sections .sections
.iter() .iter()
.filter(|s| matches!(s.kind, ObjSectionKind::Data | ObjSectionKind::ReadOnlyData)) .filter(|(_, s)| matches!(s.kind, ObjSectionKind::Data | ObjSectionKind::ReadOnlyData))
{ {
enum StringResult { enum StringResult {
None, None,
@ -119,11 +121,10 @@ pub fn detect_strings(obj: &mut ObjInfo) -> Result<()> {
} }
for (symbol_idx, symbol) in obj for (symbol_idx, symbol) in obj
.symbols .symbols
.for_section(section) .for_section(section_index)
.filter(|(_, sym)| sym.data_kind == ObjDataKind::Unknown) .filter(|(_, sym)| sym.data_kind == ObjDataKind::Unknown)
{ {
let (_section, data) = let data = section.symbol_data(symbol)?;
obj.section_data(symbol.address as u32, (symbol.address + symbol.size) as u32)?;
match is_string(data) { match is_string(data) {
StringResult::None => {} StringResult::None => {}
StringResult::String { length, terminated } => { StringResult::String { length, terminated } => {
@ -146,7 +147,7 @@ pub fn detect_strings(obj: &mut ObjInfo) -> Result<()> {
} }
for (symbol_idx, data_kind, size) in symbols_set { for (symbol_idx, data_kind, size) in symbols_set {
let mut symbol = obj.symbols.at(symbol_idx).clone(); let mut symbol = obj.symbols[symbol_idx].clone();
log::debug!("Setting {} ({:#010X}) to size {:#X}", symbol.name, symbol.address, size); log::debug!("Setting {} ({:#010X}) to size {:#X}", symbol.name, symbol.address, size);
symbol.data_kind = data_kind; symbol.data_kind = data_kind;
symbol.size = size as u64; symbol.size = size as u64;

View File

@ -21,8 +21,9 @@ pub const TRK_TABLE_SIZE: u32 = 0x1F34; // always?
impl AnalysisPass for FindTRKInterruptVectorTable { impl AnalysisPass for FindTRKInterruptVectorTable {
fn execute(state: &mut AnalyzerState, obj: &ObjInfo) -> Result<()> { fn execute(state: &mut AnalyzerState, obj: &ObjInfo) -> Result<()> {
for (&start, _) in state.function_bounds.iter().filter(|&(_, &end)| end == 0) { for (&start, _) in state.function_bounds.iter().filter(|&(_, &end)| end == 0) {
let (section, data) = match obj.section_data(start, 0) { let (section_index, section) = obj.sections.at_address(start)?;
Ok((section, data)) => (section, data), let data = match section.data_range(start, 0) {
Ok(ret) => ret,
Err(_) => continue, Err(_) => continue,
}; };
if data.starts_with(TRK_TABLE_HEADER.as_bytes()) if data.starts_with(TRK_TABLE_HEADER.as_bytes())
@ -33,7 +34,7 @@ impl AnalysisPass for FindTRKInterruptVectorTable {
name: "gTRKInterruptVectorTable".to_string(), name: "gTRKInterruptVectorTable".to_string(),
demangled_name: None, demangled_name: None,
address: start as u64, address: start as u64,
section: Some(section.index), section: Some(section_index),
size: 0, size: 0,
size_known: true, size_known: true,
flags: ObjSymbolFlagSet(FlagSet::from(ObjSymbolFlags::Global)), flags: ObjSymbolFlagSet(FlagSet::from(ObjSymbolFlags::Global)),
@ -46,7 +47,7 @@ impl AnalysisPass for FindTRKInterruptVectorTable {
name: "gTRKInterruptVectorTableEnd".to_string(), name: "gTRKInterruptVectorTableEnd".to_string(),
demangled_name: None, demangled_name: None,
address: end as u64, address: end as u64,
section: Some(section.index), section: Some(section_index),
size: 0, size: 0,
size_known: true, size_known: true,
flags: ObjSymbolFlagSet(FlagSet::from(ObjSymbolFlags::Global)), flags: ObjSymbolFlagSet(FlagSet::from(ObjSymbolFlags::Global)),
@ -78,7 +79,11 @@ impl AnalysisPass for FindSaveRestSleds {
const SLED_SIZE: usize = 19 * 4; // registers 14-31 + blr const SLED_SIZE: usize = 19 * 4; // registers 14-31 + blr
let mut clear_ranges: Vec<Range<u32>> = vec![]; let mut clear_ranges: Vec<Range<u32>> = vec![];
for (&start, _) in state.function_bounds.iter().filter(|&(_, &end)| end != 0) { for (&start, _) in state.function_bounds.iter().filter(|&(_, &end)| end != 0) {
let (section, data) = obj.section_data(start, 0)?; let (section_index, section) = obj.sections.at_address(start)?;
let data = match section.data_range(start, 0) {
Ok(ret) => ret,
Err(_) => continue,
};
for (needle, func, label) in &SLEDS { for (needle, func, label) in &SLEDS {
if data.starts_with(needle) { if data.starts_with(needle) {
log::debug!("Found {} @ {:#010X}", func, start); log::debug!("Found {} @ {:#010X}", func, start);
@ -87,7 +92,7 @@ impl AnalysisPass for FindSaveRestSleds {
name: func.to_string(), name: func.to_string(),
demangled_name: None, demangled_name: None,
address: start as u64, address: start as u64,
section: Some(section.index), section: Some(section_index),
size: SLED_SIZE as u64, size: SLED_SIZE as u64,
size_known: true, size_known: true,
flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()), flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()),
@ -101,7 +106,7 @@ impl AnalysisPass for FindSaveRestSleds {
name: format!("{}{}", label, i), name: format!("{}{}", label, i),
demangled_name: None, demangled_name: None,
address: addr as u64, address: addr as u64,
section: Some(section.index), section: Some(section_index),
size: 0, size: 0,
size_known: true, size_known: true,
flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()), flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()),

View File

@ -3,12 +3,10 @@ use anyhow::{anyhow, Result};
use crate::{ use crate::{
analysis::{cfa::AnalyzerState, read_u32}, analysis::{cfa::AnalyzerState, read_u32},
obj::{ obj::{
signatures::{ ObjInfo, ObjSectionKind, ObjSplit, ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags,
apply_signature, check_signatures, check_signatures_str, parse_signatures, ObjSymbolKind,
FunctionSignature,
},
ObjInfo, ObjSplit, ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags, ObjSymbolKind,
}, },
util::signatures::{apply_signature, check_signatures, check_signatures_str, parse_signatures},
}; };
const SIGNATURES: &[(&str, &str)] = &[ const SIGNATURES: &[(&str, &str)] = &[
@ -197,17 +195,23 @@ const POST_SIGNATURES: &[(&str, &str)] = &[
pub fn apply_signatures(obj: &mut ObjInfo) -> Result<()> { pub fn apply_signatures(obj: &mut ObjInfo) -> Result<()> {
let entry = obj.entry as u32; let entry = obj.entry as u32;
if let Some(signature) = let (entry_section_index, entry_section) = obj.sections.at_address(entry)?;
check_signatures_str(obj, entry, include_str!("../../assets/signatures/__start.yml"))? if let Some(signature) = check_signatures_str(
{ entry_section,
apply_signature(obj, entry, &signature)?; entry,
include_str!("../../assets/signatures/__start.yml"),
)? {
apply_signature(obj, entry_section_index, entry, &signature)?;
} }
for &(name, sig_str) in SIGNATURES { for &(name, sig_str) in SIGNATURES {
if let Some((_, symbol)) = obj.symbols.by_name(name)? { if let Some((_, symbol)) = obj.symbols.by_name(name)? {
let addr = symbol.address as u32; let addr = symbol.address as u32;
if let Some(signature) = check_signatures_str(obj, addr, sig_str)? { let section_index =
apply_signature(obj, addr, &signature)?; symbol.section.ok_or_else(|| anyhow!("Symbol '{}' missing section", name))?;
let section = &obj.sections[section_index];
if let Some(signature) = check_signatures_str(section, addr, sig_str)? {
apply_signature(obj, section_index, addr, &signature)?;
} }
} }
} }
@ -217,12 +221,13 @@ pub fn apply_signatures(obj: &mut ObjInfo) -> Result<()> {
let mut analyzer = AnalyzerState::default(); let mut analyzer = AnalyzerState::default();
analyzer.process_function_at(obj, symbol.address as u32)?; analyzer.process_function_at(obj, symbol.address as u32)?;
for addr in analyzer.function_entries { for addr in analyzer.function_entries {
let (section_index, section) = obj.sections.at_address(addr)?;
if let Some(signature) = check_signatures_str( if let Some(signature) = check_signatures_str(
obj, section,
addr, addr,
include_str!("../../assets/signatures/__init_cpp.yml"), include_str!("../../assets/signatures/__init_cpp.yml"),
)? { )? {
apply_signature(obj, addr, &signature)?; apply_signature(obj, section_index, addr, &signature)?;
break; break;
} }
} }
@ -230,24 +235,27 @@ pub fn apply_signatures(obj: &mut ObjInfo) -> Result<()> {
if let Some((_, symbol)) = obj.symbols.by_name("_ctors")? { if let Some((_, symbol)) = obj.symbols.by_name("_ctors")? {
// First entry of ctors is __init_cpp_exceptions // First entry of ctors is __init_cpp_exceptions
let section = obj.section_at(symbol.address as u32)?; let ctors_section_index =
let target = read_u32(&section.data, symbol.address as u32, section.address as u32) symbol.section.ok_or_else(|| anyhow!("Missing _ctors symbol section"))?;
let ctors_section = &obj.sections[ctors_section_index];
let target =
read_u32(&ctors_section.data, symbol.address as u32, ctors_section.address as u32)
.ok_or_else(|| anyhow!("Failed to read _ctors data"))?; .ok_or_else(|| anyhow!("Failed to read _ctors data"))?;
if target != 0 { if target != 0 {
let (target_section_index, target_section) = obj.sections.at_address(target)?;
if let Some(signature) = check_signatures_str( if let Some(signature) = check_signatures_str(
obj, target_section,
target, target,
include_str!("../../assets/signatures/__init_cpp_exceptions.yml"), include_str!("../../assets/signatures/__init_cpp_exceptions.yml"),
)? { )? {
let address = symbol.address; let address = symbol.address;
let section_index = section.index; apply_signature(obj, target_section_index, target, &signature)?;
apply_signature(obj, target, &signature)?; obj.symbols.add(
obj.add_symbol(
ObjSymbol { ObjSymbol {
name: "__init_cpp_exceptions_reference".to_string(), name: "__init_cpp_exceptions_reference".to_string(),
demangled_name: None, demangled_name: None,
address, address,
section: Some(section_index), section: Some(ctors_section_index),
size: 4, size: 4,
size_known: true, size_known: true,
flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()), flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()),
@ -257,8 +265,8 @@ pub fn apply_signatures(obj: &mut ObjInfo) -> Result<()> {
}, },
true, true,
)?; )?;
if obj.split_for(address as u32).is_none() { if obj.sections[ctors_section_index].splits.for_address(address as u32).is_none() {
obj.add_split(address as u32, ObjSplit { obj.add_split(ctors_section_index, address as u32, ObjSplit {
unit: "__init_cpp_exceptions.cpp".to_string(), unit: "__init_cpp_exceptions.cpp".to_string(),
end: address as u32 + 4, end: address as u32 + 4,
align: None, align: None,
@ -271,30 +279,32 @@ pub fn apply_signatures(obj: &mut ObjInfo) -> Result<()> {
} }
if let Some((_, symbol)) = obj.symbols.by_name("_dtors")? { if let Some((_, symbol)) = obj.symbols.by_name("_dtors")? {
let section = obj.section_at(symbol.address as u32)?; let dtors_section_index =
symbol.section.ok_or_else(|| anyhow!("Missing _dtors symbol section"))?;
let dtors_section = &obj.sections[dtors_section_index];
let address = symbol.address; let address = symbol.address;
let section_address = section.address; let section_address = dtors_section.address;
let section_index = section.index;
// First entry of dtors is __destroy_global_chain // First entry of dtors is __destroy_global_chain
let dgc_target = read_u32(&section.data, address as u32, section_address as u32) let dgc_target = read_u32(&dtors_section.data, address as u32, section_address as u32)
.ok_or_else(|| anyhow!("Failed to read _dtors data"))?; .ok_or_else(|| anyhow!("Failed to read _dtors data"))?;
let fce_target = read_u32(&section.data, address as u32 + 4, section_address as u32) let fce_target = read_u32(&dtors_section.data, address as u32 + 4, section_address as u32)
.ok_or_else(|| anyhow!("Failed to read _dtors data"))?; .ok_or_else(|| anyhow!("Failed to read _dtors data"))?;
let mut found_dgc = false; let mut found_dgc = false;
let mut found_fce = false; let mut found_fce = false;
if dgc_target != 0 { if dgc_target != 0 {
let (target_section_index, target_section) = obj.sections.at_address(dgc_target)?;
if let Some(signature) = check_signatures_str( if let Some(signature) = check_signatures_str(
obj, target_section,
dgc_target, dgc_target,
include_str!("../../assets/signatures/__destroy_global_chain.yml"), include_str!("../../assets/signatures/__destroy_global_chain.yml"),
)? { )? {
apply_signature(obj, dgc_target, &signature)?; apply_signature(obj, target_section_index, dgc_target, &signature)?;
obj.add_symbol( obj.add_symbol(
ObjSymbol { ObjSymbol {
name: "__destroy_global_chain_reference".to_string(), name: "__destroy_global_chain_reference".to_string(),
demangled_name: None, demangled_name: None,
address, address,
section: Some(section_index), section: Some(dtors_section_index),
size: 4, size: 4,
size_known: true, size_known: true,
flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()), flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()),
@ -314,18 +324,19 @@ pub fn apply_signatures(obj: &mut ObjInfo) -> Result<()> {
} }
// Second entry of dtors is __fini_cpp_exceptions // Second entry of dtors is __fini_cpp_exceptions
if fce_target != 0 { if fce_target != 0 {
let (target_section_index, target_section) = obj.sections.at_address(fce_target)?;
if let Some(signature) = check_signatures_str( if let Some(signature) = check_signatures_str(
obj, target_section,
fce_target, fce_target,
include_str!("../../assets/signatures/__fini_cpp_exceptions.yml"), include_str!("../../assets/signatures/__fini_cpp_exceptions.yml"),
)? { )? {
apply_signature(obj, fce_target, &signature)?; apply_signature(obj, target_section_index, fce_target, &signature)?;
obj.add_symbol( obj.add_symbol(
ObjSymbol { ObjSymbol {
name: "__fini_cpp_exceptions_reference".to_string(), name: "__fini_cpp_exceptions_reference".to_string(),
demangled_name: None, demangled_name: None,
address: address + 4, address: address + 4,
section: Some(section_index), section: Some(dtors_section_index),
size: 4, size: 4,
size_known: true, size_known: true,
flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()), flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()),
@ -344,8 +355,8 @@ pub fn apply_signatures(obj: &mut ObjInfo) -> Result<()> {
if found_fce { if found_fce {
end += 4; end += 4;
} }
if obj.split_for(address as u32).is_none() { if obj.sections[dtors_section_index].splits.for_address(address as u32).is_none() {
obj.add_split(address as u32, ObjSplit { obj.add_split(dtors_section_index, address as u32, ObjSplit {
unit: "__init_cpp_exceptions.cpp".to_string(), unit: "__init_cpp_exceptions.cpp".to_string(),
end, end,
align: None, align: None,
@ -363,19 +374,28 @@ pub fn apply_signatures_post(obj: &mut ObjInfo) -> Result<()> {
log::info!("Checking post CFA signatures..."); log::info!("Checking post CFA signatures...");
for &(_name, sig_str) in POST_SIGNATURES { for &(_name, sig_str) in POST_SIGNATURES {
let signatures = parse_signatures(sig_str)?; let signatures = parse_signatures(sig_str)?;
let mut iter = obj.symbols.by_kind(ObjSymbolKind::Function); let mut found_signature = None;
let opt = loop { 'outer: for (section_index, section) in obj.sections.by_kind(ObjSectionKind::Code) {
let Some((_, symbol)) = iter.next() else { for (symbol_index, symbol) in obj
break Option::<(u32, FunctionSignature)>::None; .symbols
}; .for_section(section_index)
if let Some(signature) = check_signatures(obj, symbol.address as u32, &signatures)? { .filter(|(_, sym)| sym.kind == ObjSymbolKind::Function)
break Some((symbol.address as u32, signature)); {
if let Some(signature) =
check_signatures(section, symbol.address as u32, &signatures)?
{
found_signature = Some((symbol_index, signature));
break 'outer;
} }
}; }
if let Some((addr, signature)) = opt { }
drop(iter); if let Some((symbol_index, signature)) = found_signature {
apply_signature(obj, addr, &signature)?; let symbol = &obj.symbols[symbol_index];
break; let section_index = symbol
.section
.ok_or_else(|| anyhow!("Symbol '{}' missing section", symbol.name))?;
let address = symbol.address as u32;
apply_signature(obj, section_index, address, &signature)?;
} }
} }
log::info!("Done!"); log::info!("Done!");

View File

@ -164,7 +164,7 @@ impl FunctionSlices {
function_end: Option<u32>, function_end: Option<u32>,
known_functions: &BTreeSet<u32>, known_functions: &BTreeSet<u32>,
) -> Result<ExecCbResult<bool>> { ) -> Result<ExecCbResult<bool>> {
let ExecCbData { executor, vm, result, section, ins, block_start } = data; let ExecCbData { executor, vm, result, section_index, section, ins, block_start } = data;
// Track discovered prologue(s) and epilogue(s) // Track discovered prologue(s) and epilogue(s)
self.check_prologue(section, ins) self.check_prologue(section, ins)
@ -187,7 +187,7 @@ impl FunctionSlices {
StepResult::Continue | StepResult::LoadStore { .. } => { StepResult::Continue | StepResult::LoadStore { .. } => {
let next_address = ins.addr + 4; let next_address = ins.addr + 4;
// If we already visited the next address, connect the blocks and end // If we already visited the next address, connect the blocks and end
if executor.visited(section, next_address) { if executor.visited(section_index, section.address as u32, next_address) {
self.blocks.insert(block_start, next_address); self.blocks.insert(block_start, next_address);
self.branches.insert(ins.addr, vec![next_address]); self.branches.insert(ins.addr, vec![next_address]);
Ok(ExecCbResult::EndBlock) Ok(ExecCbResult::EndBlock)
@ -233,7 +233,7 @@ impl FunctionSlices {
if self.add_block_start(addr) { if self.add_block_start(addr) {
return Ok(ExecCbResult::Jump(addr)); return Ok(ExecCbResult::Jump(addr));
} }
} else if matches!(obj.section_data(ins.addr, ins.addr + 4), Ok((_, data)) if data == [0u8; 4]) } else if matches!(section.data_range(ins.addr, ins.addr + 4), Ok(data) if data == [0u8; 4])
{ {
// If this branch has zeroed padding after it, assume tail call. // If this branch has zeroed padding after it, assume tail call.
self.function_references.insert(addr); self.function_references.insert(addr);
@ -385,8 +385,10 @@ impl FunctionSlices {
} }
let end = self.end(); let end = self.end();
match (obj.section_at(end), obj.section_at(end - 4)) { match (obj.sections.at_address(end), obj.sections.at_address(end - 4)) {
(Ok(section), Ok(other_section)) if section.index == other_section.index => { (Ok((section_index, section)), Ok((other_section_index, _other_section)))
if section_index == other_section_index =>
{
// FIXME this is real bad // FIXME this is real bad
if !self.has_conditional_blr { if !self.has_conditional_blr {
if let Some(ins) = disassemble(section, end - 4) { if let Some(ins) = disassemble(section, end - 4) {
@ -453,15 +455,15 @@ impl FunctionSlices {
return TailCallResult::Is; return TailCallResult::Is;
} }
// If the jump target is in a different section, known tail call. // If the jump target is in a different section, known tail call.
let section = match obj.section_at(function_start) { let (_, target_section) = match obj.sections.at_address(addr) {
Ok(section) => section, Ok(section) => section,
Err(e) => return TailCallResult::Error(e), Err(e) => return TailCallResult::Error(e),
}; };
if !section.contains(addr) { if !target_section.contains(function_start) {
return TailCallResult::Is; return TailCallResult::Is;
} }
// If the jump target has 0'd padding before it, known tail call. // If the jump target has 0'd padding before it, known tail call.
if matches!(obj.section_data(addr - 4, addr), Ok((_, data)) if data == [0u8; 4]) { if matches!(target_section.data_range(addr - 4, addr), Ok(data) if data == [0u8; 4]) {
return TailCallResult::Is; return TailCallResult::Is;
} }
// If we're not sure where the function ends yet, mark as possible tail call. // If we're not sure where the function ends yet, mark as possible tail call.

View File

@ -73,8 +73,8 @@ impl Tracker {
// Stack ends after all BSS sections // Stack ends after all BSS sections
obj.sections obj.sections
.iter() .iter()
.rfind(|s| s.kind == ObjSectionKind::Bss) .rfind(|&(_, s)| s.kind == ObjSectionKind::Bss)
.map(|s| (s.address + s.size) as u32) .map(|(_, s)| (s.address + s.size) as u32)
}), }),
db_stack_addr: obj.db_stack_addr, db_stack_addr: obj.db_stack_addr,
arena_lo: obj arena_lo: obj
@ -92,21 +92,23 @@ impl Tracker {
pub fn process(&mut self, obj: &ObjInfo) -> Result<()> { pub fn process(&mut self, obj: &ObjInfo) -> Result<()> {
log::debug!("Processing code sections"); log::debug!("Processing code sections");
self.process_code(obj)?; self.process_code(obj)?;
for section in &obj.sections { for (section_index, section) in obj
if matches!(section.kind, ObjSectionKind::Data | ObjSectionKind::ReadOnlyData) { .sections
log::debug!("Processing section {}, address {:#X}", section.index, section.address); .iter()
.filter(|(_, s)| matches!(s.kind, ObjSectionKind::Data | ObjSectionKind::ReadOnlyData))
{
log::debug!("Processing section {}, address {:#X}", section_index, section.address);
self.process_data(obj, section)?; self.process_data(obj, section)?;
} }
}
Ok(()) Ok(())
} }
fn process_code(&mut self, obj: &ObjInfo) -> Result<()> { fn process_code(&mut self, obj: &ObjInfo) -> Result<()> {
self.process_function_by_address(obj, obj.entry as u32)?; self.process_function_by_address(obj, obj.entry as u32)?;
for section in obj.sections.iter().filter(|s| s.kind == ObjSectionKind::Code) { for (section_index, _) in obj.sections.by_kind(ObjSectionKind::Code) {
for (_, symbol) in obj for (_, symbol) in obj
.symbols .symbols
.for_range(section.address as u32..(section.address + section.size) as u32) .for_section(section_index)
.filter(|(_, symbol)| symbol.kind == ObjSymbolKind::Function && symbol.size_known) .filter(|(_, symbol)| symbol.kind == ObjSymbolKind::Function && symbol.size_known)
{ {
let addr = symbol.address as u32; let addr = symbol.address as u32;
@ -124,9 +126,10 @@ impl Tracker {
return Ok(()); return Ok(());
} }
self.processed_functions.insert(addr); self.processed_functions.insert(addr);
let (section_index, _) = obj.sections.at_address(addr)?;
if let Some((_, symbol)) = obj if let Some((_, symbol)) = obj
.symbols .symbols
.at_address(addr) .at_section_address(section_index, addr)
.find(|(_, symbol)| symbol.kind == ObjSymbolKind::Function && symbol.size_known) .find(|(_, symbol)| symbol.kind == ObjSymbolKind::Function && symbol.size_known)
{ {
self.process_function(obj, symbol)?; self.process_function(obj, symbol)?;
@ -144,7 +147,8 @@ impl Tracker {
function_end: u32, function_end: u32,
possible_missed_branches: &mut BTreeMap<u32, Box<VM>>, possible_missed_branches: &mut BTreeMap<u32, Box<VM>>,
) -> Result<ExecCbResult<()>> { ) -> Result<ExecCbResult<()>> {
let ExecCbData { executor, vm, result, section: _, ins, block_start: _ } = data; let ExecCbData { executor, vm, result, section_index: _, section: _, ins, block_start: _ } =
data;
let is_function_addr = |addr: u32| addr >= function_start && addr < function_end; let is_function_addr = |addr: u32| addr >= function_start && addr < function_end;
match result { match result {
@ -344,11 +348,11 @@ impl Tracker {
} }
let mut added = false; let mut added = false;
for (addr, vm) in take(&mut possible_missed_branches) { for (addr, vm) in take(&mut possible_missed_branches) {
let section = match obj.section_at(addr) { let (section_index, section) = match obj.sections.at_address(addr) {
Ok(section) => section, Ok(section) => section,
Err(_) => continue, Err(_) => continue,
}; };
if !executor.visited(section, addr) { if !executor.visited(section_index, section.address as u32, addr) {
executor.push(addr, vm, true); executor.push(addr, vm, true);
added = true; added = true;
} }
@ -397,7 +401,7 @@ impl Tracker {
// if addr > 0x80000000 && addr < 0x80003100 { // if addr > 0x80000000 && addr < 0x80003100 {
// return true; // return true;
// } // }
if let Ok(section) = obj.section_at(addr) { if let Ok((_, section)) = obj.sections.at_address(addr) {
// References to code sections will never be unaligned // References to code sections will never be unaligned
return section.kind != ObjSectionKind::Code || addr & 3 == 0; return section.kind != ObjSectionKind::Code || addr & 3 == 0;
} }
@ -450,7 +454,7 @@ impl Tracker {
section.name = new_name; section.name = new_name;
} }
for section in &mut obj.sections { for (_, section) in obj.sections.iter_mut() {
if !section.section_known { if !section.section_known {
if section.kind == ObjSectionKind::Code { if section.kind == ObjSectionKind::Code {
apply_section_name(section, ".text"); apply_section_name(section, ".text");
@ -485,7 +489,7 @@ impl Tracker {
} }
let mut relocation_maps = Vec::new(); let mut relocation_maps = Vec::new();
for section in &obj.sections { for (_, section) in obj.sections.iter() {
relocation_maps.push(section.build_relocation_map()?); relocation_maps.push(section.build_relocation_map()?);
} }
@ -516,7 +520,7 @@ impl Tracker {
if let Some(symbol) = self.special_symbol(obj, target, reloc_kind) { if let Some(symbol) = self.special_symbol(obj, target, reloc_kind) {
(symbol, 0) (symbol, 0)
} else { } else {
let target_section = match obj.sections.iter().find(|s| { let (target_section_index, _) = match obj.sections.iter().find(|&(_, s)| {
target >= s.address as u32 && target < (s.address + s.size) as u32 target >= s.address as u32 && target < (s.address + s.size) as u32
}) { }) {
Some(v) => v, Some(v) => v,
@ -541,7 +545,7 @@ impl Tracker {
name: format!("lbl_{:08X}", target), name: format!("lbl_{:08X}", target),
demangled_name: None, demangled_name: None,
address: target as u64, address: target as u64,
section: Some(target_section.index), section: Some(target_section_index),
size: 0, size: 0,
size_known: false, size_known: false,
flags: Default::default(), flags: Default::default(),
@ -552,12 +556,15 @@ impl Tracker {
(symbol_idx, 0) (symbol_idx, 0)
} }
}; };
let reloc = ObjReloc { kind: reloc_kind, address: addr as u64, target_symbol, addend }; let reloc = ObjReloc {
let section = match obj kind: reloc_kind,
.sections address: addr as u64,
.iter_mut() target_symbol,
.find(|s| addr >= s.address as u32 && addr < (s.address + s.size) as u32) addend,
{ module: None,
};
let (section_index, section) =
match obj.sections.iter_mut().find(|(_, s)| s.contains(addr)) {
Some(v) => v, Some(v) => v,
None => bail!( None => bail!(
"Failed to locate source section for relocation @ {:#010X} {:#010X?}", "Failed to locate source section for relocation @ {:#010X} {:#010X?}",
@ -566,17 +573,17 @@ impl Tracker {
), ),
}; };
let reloc_map = &mut relocation_maps[section.index]; let reloc_map = &mut relocation_maps[section_index];
match reloc_map.entry(addr) { match reloc_map.entry(addr) {
Entry::Vacant(e) => { Entry::Vacant(e) => {
e.insert(section.relocations.len()); e.insert(section.relocations.len());
section.relocations.push(reloc); section.relocations.push(reloc);
} }
Entry::Occupied(e) => { Entry::Occupied(e) => {
let reloc_symbol = obj.symbols.at(reloc.target_symbol); let reloc_symbol = &obj.symbols[reloc.target_symbol];
if reloc_symbol.name != "_unresolved" { if reloc_symbol.name != "_unresolved" {
let v = &mut section.relocations[*e.get()]; let v = &mut section.relocations[*e.get()];
let iter_symbol = obj.symbols.at(v.target_symbol); let iter_symbol = &obj.symbols[v.target_symbol];
if iter_symbol.address as i64 + v.addend if iter_symbol.address as i64 + v.addend
!= reloc_symbol.address as i64 + reloc.addend != reloc_symbol.address as i64 + reloc.addend
{ {

View File

@ -5,6 +5,7 @@ use std::{
io::Write, io::Write,
path::{Path, PathBuf}, path::{Path, PathBuf},
}; };
use std::mem::take;
use anyhow::{anyhow, bail, Context, Result}; use anyhow::{anyhow, bail, Context, Result};
use argp::FromArgs; use argp::FromArgs;
@ -21,14 +22,15 @@ use crate::{
}, },
cmd::shasum::file_sha1, cmd::shasum::file_sha1,
obj::{ obj::{
split::{is_linker_generated_object, split_obj, update_splits}, ObjDataKind, ObjInfo, ObjReloc, ObjRelocKind, ObjSectionKind, ObjSymbol, ObjSymbolFlagSet,
ObjDataKind, ObjInfo, ObjRelocKind, ObjSectionKind, ObjSymbol, ObjSymbolFlagSet,
ObjSymbolFlags, ObjSymbolKind, ObjSymbolScope, SymbolIndex, ObjSymbolFlags, ObjSymbolKind, ObjSymbolScope, SymbolIndex,
}, },
util::{ util::{
asm::write_asm, asm::write_asm,
comment::MWComment, comment::MWComment,
config::{apply_splits, apply_symbols_file, write_splits_file, write_symbols_file}, config::{
apply_splits, apply_symbols_file, is_auto_symbol, write_splits_file, write_symbols_file,
},
dep::DepFile, dep::DepFile,
dol::process_dol, dol::process_dol,
elf::{process_elf, write_elf}, elf::{process_elf, write_elf},
@ -37,6 +39,7 @@ use crate::{
map::apply_map_file, map::apply_map_file,
rel::process_rel, rel::process_rel,
rso::{process_rso, DOL_SECTION_ABS, DOL_SECTION_NAMES}, rso::{process_rso, DOL_SECTION_ABS, DOL_SECTION_NAMES},
split::{is_linker_generated_object, split_obj, update_splits},
}, },
}; };
@ -150,6 +153,8 @@ pub struct ProjectConfig {
pub struct ModuleConfig { pub struct ModuleConfig {
pub object: PathBuf, pub object: PathBuf,
pub hash: Option<String>, pub hash: Option<String>,
pub splits: Option<PathBuf>,
pub symbols: Option<PathBuf>,
} }
#[derive(Serialize, Deserialize, Debug, Clone)] #[derive(Serialize, Deserialize, Debug, Clone)]
@ -159,9 +164,18 @@ pub struct OutputUnit {
pub autogenerated: bool, pub autogenerated: bool,
} }
/// Serializable description of the output produced for a single module.
///
/// NOTE(review): nothing in the visible code constructs this type yet; the field notes
/// below are inferred from the matching fields on `OutputConfig` — confirm against the
/// code that fills `OutputConfig::modules`.
#[derive(Serialize, Deserialize, Debug, Clone)]
pub struct OutputModule {
/// Name identifying the module (presumably derived from the module's object file — TODO confirm).
pub name: String,
/// Path to the module's linker script (presumably generated like the main `ldscript.lcf` — TODO confirm).
pub ldscript: PathBuf,
/// Output units belonging to this module.
pub units: Vec<OutputUnit>,
}
#[derive(Serialize, Deserialize, Debug, Clone, Default)] #[derive(Serialize, Deserialize, Debug, Clone, Default)]
pub struct OutputConfig { pub struct OutputConfig {
pub ldscript: PathBuf,
pub units: Vec<OutputUnit>, pub units: Vec<OutputUnit>,
pub modules: Vec<OutputModule>,
} }
pub fn run(args: Args) -> Result<()> { pub fn run(args: Args) -> Result<()> {
@ -174,6 +188,7 @@ pub fn run(args: Args) -> Result<()> {
} }
fn apply_selfile(obj: &mut ObjInfo, selfile: &Path) -> Result<()> { fn apply_selfile(obj: &mut ObjInfo, selfile: &Path) -> Result<()> {
log::info!("Loading {}", selfile.display());
let rso = process_rso(selfile)?; let rso = process_rso(selfile)?;
for symbol in rso.symbols.iter() { for symbol in rso.symbols.iter() {
let dol_section_index = match symbol.section { let dol_section_index = match symbol.section {
@ -191,13 +206,13 @@ fn apply_selfile(obj: &mut ObjInfo, selfile: &Path) -> Result<()> {
DOL_SECTION_NAMES.get(dol_section_index).and_then(|&opt| opt).ok_or_else(|| { DOL_SECTION_NAMES.get(dol_section_index).and_then(|&opt| opt).ok_or_else(|| {
anyhow!("Can't add symbol for unknown DOL section {}", dol_section_index) anyhow!("Can't add symbol for unknown DOL section {}", dol_section_index)
})?; })?;
let dol_section = obj let (dol_section_index, dol_section) = obj
.sections .sections
.iter() .iter()
.find(|section| section.name == dol_section_name) .find(|&(_, section)| section.name == dol_section_name)
.ok_or_else(|| anyhow!("Failed to locate DOL section {}", dol_section_name))?; .ok_or_else(|| anyhow!("Failed to locate DOL section {}", dol_section_name))?;
( (
Some(dol_section.index), Some(dol_section_index),
dol_section.address as u32 + symbol.address as u32, dol_section.address as u32 + symbol.address as u32,
Some(dol_section.kind), Some(dol_section.kind),
) )
@ -208,17 +223,17 @@ fn apply_selfile(obj: &mut ObjInfo, selfile: &Path) -> Result<()> {
Some(_) => ObjSymbolKind::Object, Some(_) => ObjSymbolKind::Object,
None => ObjSymbolKind::Unknown, None => ObjSymbolKind::Unknown,
}; };
let existing_symbols = obj.symbols.at_address(address).collect_vec(); let existing_symbols = if let Some(section_index) = section {
obj.symbols.at_section_address(section_index, address).collect_vec()
} else {
// TODO hmmm
obj.symbols.iter_abs().filter(|(_, s)| s.address == address as u64).collect_vec()
};
let existing_symbol = existing_symbols let existing_symbol = existing_symbols
.iter() .iter()
.find(|(_, s)| s.section == section && s.name == symbol.name) .find(|(_, s)| s.name == symbol.name)
.cloned() .cloned()
.or_else(|| { .or_else(|| existing_symbols.iter().find(|(_, s)| s.kind == symbol_kind).cloned());
existing_symbols
.iter()
.find(|(_, s)| s.section == section && s.kind == symbol_kind)
.cloned()
});
if let Some((existing_symbol_idx, existing_symbol)) = existing_symbol { if let Some((existing_symbol_idx, existing_symbol)) = existing_symbol {
log::debug!("Mapping symbol {} to {}", symbol.name, existing_symbol.name); log::debug!("Mapping symbol {} to {}", symbol.name, existing_symbol.name);
obj.symbols.replace(existing_symbol_idx, ObjSymbol { obj.symbols.replace(existing_symbol_idx, ObjSymbol {
@ -273,7 +288,7 @@ fn info(args: InfoArgs) -> Result<()> {
println!("Entry point: {:#010X}", obj.entry); println!("Entry point: {:#010X}", obj.entry);
println!("\nSections:"); println!("\nSections:");
println!("\t{: >10} | {: <10} | {: <10} | {: <10}", "Name", "Address", "Size", "File Off"); println!("\t{: >10} | {: <10} | {: <10} | {: <10}", "Name", "Address", "Size", "File Off");
for section in &obj.sections { for (_, section) in obj.sections.iter() {
println!( println!(
"\t{: >10} | {:#010X} | {: <#10X} | {: <#10X}", "\t{: >10} | {:#010X} | {: <#10X} | {: <#10X}",
section.name, section.address, section.size, section.file_offset section.name, section.address, section.size, section.file_offset
@ -281,8 +296,8 @@ fn info(args: InfoArgs) -> Result<()> {
} }
println!("\nDiscovered symbols:"); println!("\nDiscovered symbols:");
println!("\t{: >23} | {: <10} | {: <10}", "Name", "Address", "Size"); println!("\t{: >23} | {: <10} | {: <10}", "Name", "Address", "Size");
for (_, symbol) in obj.symbols.iter_ordered() { for (_, symbol) in obj.symbols.iter_ordered().chain(obj.symbols.iter_abs()) {
if symbol.name.starts_with('@') || symbol.name.starts_with("fn_") { if symbol.name.starts_with('@') || is_auto_symbol(&symbol.name) {
continue; continue;
} }
if symbol.size_known { if symbol.size_known {
@ -314,6 +329,214 @@ fn verify_hash<P: AsRef<Path>>(path: P, hash_str: &str) -> Result<()> {
} }
} }
/// Ensures every location in `obj` that is targeted by a module relocation has a
/// force-active symbol.
///
/// The relocations considered are `obj`'s own unresolved relocations plus the unresolved
/// relocations of every object in `modules`, restricted to those whose `module_id` equals
/// `obj.module_id`. For each one:
///
/// * if exactly one symbol at the target section/address is `referenced_by` the relocation
///   kind, that symbol is flagged force-active;
/// * if none exists, a new force-active label named
///   `lbl_mod{module}_{section}_{address}` is added.
///
/// # Errors
///
/// Returns an error if the relocation's target section cannot be found in `obj`, if more
/// than one candidate symbol matches, or if adding the new label fails.
fn update_symbols(obj: &mut ObjInfo, modules: &BTreeMap<u32, ObjInfo>) -> Result<()> {
    log::info!("Updating symbols for module {}", obj.module_id);

    // Find all references to this module, both from itself and from other modules
    for rel_reloc in obj
        .unresolved_relocations
        .iter()
        .chain(modules.values().flat_map(|module| module.unresolved_relocations.iter()))
        .filter(|r| r.module_id == obj.module_id)
    {
        // The lookup is keyed on the *target* section, so that is the index the error
        // must report (the source section index would be misleading here).
        let (target_section_index, target_section) = obj
            .sections
            .get_elf_index(rel_reloc.target_section as usize)
            .ok_or_else(|| {
                anyhow!("Failed to locate REL section {}", rel_reloc.target_section)
            })?;

        let target_symbol = obj
            .symbols
            .at_section_address(target_section_index, rel_reloc.addend)
            .filter(|(_, s)| s.referenced_by(rel_reloc.kind))
            .at_most_one()
            .map_err(|e| {
                // List every ambiguous candidate before failing
                for (_, symbol) in e {
                    log::warn!(
                        "Multiple symbols found for {:#010X}: {}",
                        rel_reloc.addend,
                        symbol.name
                    );
                }
                anyhow!("Multiple symbols found for {:#010X}", rel_reloc.addend)
            })?;

        if let Some((symbol_index, symbol)) = target_symbol {
            // Update symbol
            log::trace!(
                "Found symbol in section {} at {:#010X}: {}",
                rel_reloc.target_section,
                rel_reloc.addend,
                symbol.name
            );
            obj.symbols.flags(symbol_index).set_force_active(true);
        } else {
            // Add label
            log::trace!(
                "Creating label in section {} at {:#010X}",
                rel_reloc.target_section,
                rel_reloc.addend
            );
            obj.symbols.add_direct(ObjSymbol {
                name: format!(
                    "lbl_mod{}_{}_{:08X}",
                    obj.module_id,
                    target_section.name.trim_start_matches('.'),
                    rel_reloc.addend
                ),
                demangled_name: None,
                address: rel_reloc.addend as u64,
                section: Some(target_section_index),
                size: 0,
                size_known: false,
                flags: ObjSymbolFlagSet(ObjSymbolFlags::ForceActive.into()),
                kind: Default::default(),
                align: None,
                data_kind: ObjDataKind::Unknown,
            })?;
        }
    }

    Ok(())
}
fn create_relocations(
obj: &mut ObjInfo,
modules: &BTreeMap<u32, ObjInfo>,
dol_obj: &ObjInfo,
) -> Result<()> {
log::info!("Creating relocations for module {}", obj.module_id);
// Resolve all relocations in this module
for rel_reloc in take(&mut obj.unresolved_relocations) {
let target_obj = if rel_reloc.module_id == 0 {
dol_obj
} else if rel_reloc.module_id == obj.module_id {
&*obj
} else {
modules
.get(&rel_reloc.module_id)
.ok_or_else(|| anyhow!("Failed to locate module {}", rel_reloc.module_id))?
};
let (target_section_index, _target_section) = if rel_reloc.module_id == 0 {
target_obj.sections.at_address(rel_reloc.addend)?
} else {
target_obj.sections.get_elf_index(rel_reloc.target_section as usize).ok_or_else(
|| {
anyhow!(
"Failed to locate module {} section {}",
rel_reloc.module_id,
rel_reloc.target_section
)
},
)?
};
if let Some((symbol_index, symbol)) = target_obj
.symbols
.at_section_address(target_section_index, rel_reloc.addend)
.filter(|(_, s)| s.referenced_by(rel_reloc.kind))
.at_most_one()
.map_err(|e| {
for (_, symbol) in e {
log::warn!(
"Multiple symbols found for {:#010X}: {}",
rel_reloc.addend,
symbol.name
);
}
anyhow!("Multiple symbols found for {:#010X}", rel_reloc.addend)
})?
{
// log::info!("Would create relocation to symbol {}", symbol.name);
let reloc = ObjReloc {
kind: rel_reloc.kind,
address: rel_reloc.address as u64 & !3,
target_symbol: symbol_index,
addend: rel_reloc.addend as i64 - symbol.address as i64,
module: if rel_reloc.module_id == obj.module_id {
None
} else {
Some(rel_reloc.module_id)
},
};
let (_, source_section) = obj
.sections
.get_elf_index_mut(rel_reloc.section as usize)
.ok_or_else(|| anyhow!("Failed to locate REL section {}", rel_reloc.section))?;
source_section.relocations.push(reloc);
} else {
bail!(
"Couldn't find module {} symbol in section {} at {:#010X}",
rel_reloc.module_id,
rel_reloc.target_section,
rel_reloc.addend
);
}
}
Ok(())
}
/// Rewrites every relocation in `obj` that is tagged with a foreign module so that it
/// points at a symbol in `obj`'s own symbol table.
///
/// For each distinct (module ID, target symbol index) pair, one placeholder symbol is added
/// to `obj`: it copies the target symbol's name and demangled name, and has no section,
/// address 0 and unknown size. Every relocation referring to that pair is then retargeted
/// to the placeholder and its `module` tag is cleared.
///
/// `dol_obj` supplies the object for module ID 0; other IDs are looked up in `modules`.
///
/// # Errors
///
/// Fails if a relocation is tagged with `obj`'s own module ID, if it targets module 0 while
/// `dol_obj` is `None`, if the target module is missing from `modules`, or if adding the
/// placeholder symbol fails.
fn resolve_external_relocations(
    obj: &mut ObjInfo,
    modules: &BTreeMap<u32, ObjInfo>,
    dol_obj: Option<&ObjInfo>,
) -> Result<()> {
    log::info!("Resolving relocations for module {}", obj.module_id);

    #[derive(Debug, Clone, Copy, Hash, PartialEq, Eq)]
    struct RelocRef {
        module_id: u32,
        symbol_index: SymbolIndex,
    }
    // Maps an external (module, symbol) reference to the local placeholder symbol index.
    let mut reloc_to_symbol = HashMap::<RelocRef, usize>::new();

    // Copied up front so the closures below need not borrow `obj` while its sections
    // are mutably iterated.
    let own_module_id = obj.module_id;

    for (_, section) in obj.sections.iter_mut() {
        for reloc in section.relocations.iter_mut() {
            // Relocations without a module tag are already local.
            let Some(module_id) = reloc.module else { continue };

            let reloc_ref = RelocRef { module_id, symbol_index: reloc.target_symbol };
            let symbol_idx = match reloc_to_symbol.entry(reloc_ref) {
                hash_map::Entry::Occupied(e) => *e.get(),
                hash_map::Entry::Vacant(e) => {
                    let target_obj = if module_id == own_module_id {
                        bail!("Relocation to self in module {}", own_module_id)
                    } else if module_id == 0 {
                        // Report a missing DOL object as an error instead of panicking.
                        dol_obj.ok_or_else(|| {
                            anyhow!(
                                "Module {} has a relocation to module 0, but no DOL object was provided",
                                own_module_id
                            )
                        })?
                    } else {
                        modules
                            .get(&module_id)
                            .ok_or_else(|| anyhow!("Failed to locate module {}", module_id))?
                    };

                    let target_symbol = &target_obj.symbols[reloc.target_symbol];
                    let symbol_idx = obj.symbols.add_direct(ObjSymbol {
                        name: target_symbol.name.clone(),
                        demangled_name: target_symbol.demangled_name.clone(),
                        address: 0,
                        section: None,
                        size: 0,
                        size_known: false,
                        flags: Default::default(),
                        kind: Default::default(),
                        align: None,
                        data_kind: Default::default(),
                    })?;
                    e.insert(symbol_idx);
                    symbol_idx
                }
            };

            reloc.target_symbol = symbol_idx;
            reloc.module = None;
        }
    }

    Ok(())
}
fn split(args: SplitArgs) -> Result<()> { fn split(args: SplitArgs) -> Result<()> {
log::info!("Loading {}", args.config.display()); log::info!("Loading {}", args.config.display());
let mut config_file = File::open(&args.config) let mut config_file = File::open(&args.config)
@ -335,6 +558,7 @@ fn split(args: SplitArgs) -> Result<()> {
} }
let mut modules = BTreeMap::<u32, ObjInfo>::new(); let mut modules = BTreeMap::<u32, ObjInfo>::new();
let mut module_ids = Vec::with_capacity(config.modules.len());
for module_config in &config.modules { for module_config in &config.modules {
log::info!("Loading {}", module_config.object.display()); log::info!("Loading {}", module_config.object.display());
if let Some(hash_str) = &module_config.hash { if let Some(hash_str) = &module_config.hash {
@ -342,6 +566,7 @@ fn split(args: SplitArgs) -> Result<()> {
} }
let map = map_file(&module_config.object)?; let map = map_file(&module_config.object)?;
let rel_obj = process_rel(map_reader(&map))?; let rel_obj = process_rel(map_reader(&map))?;
module_ids.push(rel_obj.module_id);
match modules.entry(rel_obj.module_id) { match modules.entry(rel_obj.module_id) {
Entry::Vacant(e) => e.insert(rel_obj), Entry::Vacant(e) => e.insert(rel_obj),
Entry::Occupied(_) => bail!("Duplicate module ID {}", obj.module_id), Entry::Occupied(_) => bail!("Duplicate module ID {}", obj.module_id),
@ -370,52 +595,20 @@ fn split(args: SplitArgs) -> Result<()> {
if !modules.is_empty() { if !modules.is_empty() {
log::info!("Applying module relocations"); log::info!("Applying module relocations");
for (module_id, module_obj) in modules {
for rel_reloc in &module_obj.unresolved_relocations { // Step 1: For each module, create any missing symbols (referenced from other modules) and set FORCEACTIVE
// TODO also apply inter-module relocations update_symbols(&mut obj, &modules)?;
if rel_reloc.module_id != 0 { for &module_id in &module_ids {
continue; let mut module_obj = modules.remove(&module_id).unwrap();
} update_symbols(&mut module_obj, &modules)?;
let target = rel_reloc.addend; modules.insert(module_id, module_obj);
if let Some((symbol_index, symbol)) =
obj.symbols.for_relocation(target, rel_reloc.kind)?
{
if symbol.flags.is_local() {
bail!(
"Module {} relocation to {:#010X} found local symbol {}",
module_id,
symbol.address,
symbol.name
);
}
let addend = target as i64 - symbol.address as i64;
if addend != 0 {
bail!(
"Module {} relocation to {:#010X} for symbol {} has non-zero addend {:#010X}",
module_id,
symbol.address,
symbol.name,
addend
);
}
obj.symbols.flags(symbol_index).set_force_active(true);
} else {
// Add label
let target_section = obj.section_at(target)?;
obj.symbols.add_direct(ObjSymbol {
name: format!("lbl_{:08X}", target),
demangled_name: None,
address: target as u64,
section: Some(target_section.index),
size: 0,
size_known: false,
flags: ObjSymbolFlagSet(ObjSymbolFlags::ForceActive.into()),
kind: Default::default(),
align: None,
data_kind: ObjDataKind::Unknown,
})?;
}
} }
// Step 2: For each module, create relocations to symbols in other modules
for &module_id in &module_ids {
let mut module_obj = modules.remove(&module_id).unwrap();
create_relocations(&mut module_obj, &modules, &obj)?;
modules.insert(module_id, module_obj);
} }
} }
@ -467,6 +660,17 @@ fn split(args: SplitArgs) -> Result<()> {
} }
} }
if !modules.is_empty() {
log::info!("Resolving module relocations");
resolve_external_relocations(&mut obj, &modules, None)?;
for &module_id in &module_ids {
let mut module_obj = modules.remove(&module_id).unwrap();
resolve_external_relocations(&mut module_obj, &modules, Some(&obj))?;
modules.insert(module_id, module_obj);
}
}
log::info!("Splitting {} objects", obj.link_order.len()); log::info!("Splitting {} objects", obj.link_order.len());
let split_objs = split_obj(&obj)?; let split_objs = split_obj(&obj)?;
@ -479,20 +683,9 @@ fn split(args: SplitArgs) -> Result<()> {
fs::write(include_dir.join("macros.inc"), include_str!("../../assets/macros.inc"))?; fs::write(include_dir.join("macros.inc"), include_str!("../../assets/macros.inc"))?;
log::info!("Writing object files"); log::info!("Writing object files");
let mut file_map = HashMap::<String, Vec<u8>>::new(); let mut out_config = OutputConfig::default();
for (unit, split_obj) in obj.link_order.iter().zip(&split_objs) { for (unit, split_obj) in obj.link_order.iter().zip(&split_objs) {
let out_obj = write_elf(split_obj)?; let out_obj = write_elf(split_obj)?;
match file_map.entry(unit.name.clone()) {
hash_map::Entry::Vacant(e) => e.insert(out_obj),
hash_map::Entry::Occupied(_) => bail!("Duplicate file {}", unit.name),
};
}
let mut out_config = OutputConfig::default();
for unit in &obj.link_order {
let object = file_map
.get(&unit.name)
.ok_or_else(|| anyhow!("Failed to find object file for unit '{}'", unit.name))?;
let out_path = obj_dir.join(obj_path_for_unit(&unit.name)); let out_path = obj_dir.join(obj_path_for_unit(&unit.name));
out_config.units.push(OutputUnit { out_config.units.push(OutputUnit {
object: out_path.clone(), object: out_path.clone(),
@ -502,7 +695,7 @@ fn split(args: SplitArgs) -> Result<()> {
if let Some(parent) = out_path.parent() { if let Some(parent) = out_path.parent() {
DirBuilder::new().recursive(true).create(parent)?; DirBuilder::new().recursive(true).create(parent)?;
} }
fs::write(&out_path, object) fs::write(&out_path, out_obj)
.with_context(|| format!("Failed to write '{}'", out_path.display()))?; .with_context(|| format!("Failed to write '{}'", out_path.display()))?;
} }
{ {
@ -512,24 +705,46 @@ fn split(args: SplitArgs) -> Result<()> {
} }
// Generate ldscript.lcf // Generate ldscript.lcf
fs::write( let ldscript_path = args.out_dir.join("ldscript.lcf");
args.out_dir.join("ldscript.lcf"), fs::write(&ldscript_path, generate_ldscript(&obj, config.auto_force_files)?)?;
generate_ldscript(&obj, config.auto_force_files)?, out_config.ldscript = ldscript_path;
)?;
log::info!("Writing disassembly"); log::info!("Writing disassembly");
for (unit, split_obj) in obj.link_order.iter().zip(&split_objs) { for (unit, split_obj) in obj.link_order.iter().zip(&split_objs) {
let out_path = asm_dir.join(asm_path_for_unit(&unit.name)); let out_path = asm_dir.join(asm_path_for_unit(&unit.name));
if let Some(parent) = out_path.parent() {
DirBuilder::new().recursive(true).create(parent)?;
}
let mut w = buf_writer(&out_path)?; let mut w = buf_writer(&out_path)?;
write_asm(&mut w, split_obj) write_asm(&mut w, split_obj)
.with_context(|| format!("Failed to write {}", out_path.display()))?; .with_context(|| format!("Failed to write {}", out_path.display()))?;
w.flush()?; w.flush()?;
} }
// Split and write modules
for (config, &module_id) in config.modules.iter().zip(&module_ids) {
let obj = modules.get(&module_id).unwrap();
let out_dir = args.out_dir.join(format!("module_{}", module_id));
let asm_dir = out_dir.join("asm");
// let obj_dir = out_dir.join("obj");
if !args.no_update {
if let Some(symbols_path) = &config.symbols {
write_symbols_file(symbols_path, obj)?;
}
if let Some(splits_path) = &config.splits {
write_splits_file(splits_path, obj)?;
}
}
log::info!("Writing disassembly");
let filename = config.object.file_name().unwrap().to_str().unwrap();
let out_path = asm_dir.join(asm_path_for_unit(filename));
let mut w = buf_writer(&out_path)?;
write_asm(&mut w, obj)
.with_context(|| format!("Failed to write {}", out_path.display()))?;
w.flush()?;
}
// Write dep file // Write dep file
{ {
let dep_path = args.out_dir.join("dep"); let dep_path = args.out_dir.join("dep");
@ -549,15 +764,11 @@ fn split(args: SplitArgs) -> Result<()> {
#[allow(dead_code)] #[allow(dead_code)]
fn validate<P: AsRef<Path>>(obj: &ObjInfo, elf_file: P, state: &AnalyzerState) -> Result<()> { fn validate<P: AsRef<Path>>(obj: &ObjInfo, elf_file: P, state: &AnalyzerState) -> Result<()> {
let real_obj = process_elf(elf_file)?; let real_obj = process_elf(elf_file)?;
for real_section in &real_obj.sections { for (section_index, real_section) in real_obj.sections.iter() {
let obj_section = match obj.sections.get(real_section.index) { let obj_section = match obj.sections.get(section_index) {
Some(v) => v, Some(v) => v,
None => { None => {
log::error!( log::error!("Section {} {} doesn't exist in DOL", section_index, real_section.name);
"Section {} {} doesn't exist in DOL",
real_section.index,
real_section.name
);
continue; continue;
} }
}; };
@ -566,18 +777,15 @@ fn validate<P: AsRef<Path>>(obj: &ObjInfo, elf_file: P, state: &AnalyzerState) -
"Section mismatch: {} {:?} ({}) should be {} {:?}", "Section mismatch: {} {:?} ({}) should be {} {:?}",
obj_section.name, obj_section.name,
obj_section.kind, obj_section.kind,
obj_section.index, section_index,
real_section.name, real_section.name,
real_section.kind real_section.kind
); );
} }
} }
let mut real_functions = BTreeMap::<u32, String>::new(); let mut real_functions = BTreeMap::<u32, String>::new();
for section in &real_obj.sections { for (section_index, _section) in real_obj.sections.by_kind(ObjSectionKind::Code) {
if section.kind != ObjSectionKind::Code { for (_symbol_idx, symbol) in real_obj.symbols.for_section(section_index) {
continue;
}
for (_symbol_idx, symbol) in real_obj.symbols.for_section(section) {
real_functions.insert(symbol.address as u32, symbol.name.clone()); real_functions.insert(symbol.address as u32, symbol.name.clone());
match state.function_bounds.get(&(symbol.address as u32)) { match state.function_bounds.get(&(symbol.address as u32)) {
Some(&end) => { Some(&end) => {
@ -617,8 +825,8 @@ fn validate<P: AsRef<Path>>(obj: &ObjInfo, elf_file: P, state: &AnalyzerState) -
} }
// return Ok(()); // TODO // return Ok(()); // TODO
for real_section in &real_obj.sections { for (real_section_index, real_section) in real_obj.sections.iter() {
let obj_section = match obj.sections.get(real_section.index) { let obj_section = match obj.sections.get(real_section_index) {
Some(v) => v, Some(v) => v,
None => continue, None => continue,
}; };
@ -626,7 +834,7 @@ fn validate<P: AsRef<Path>>(obj: &ObjInfo, elf_file: P, state: &AnalyzerState) -
let obj_map = obj_section.build_relocation_map()?; let obj_map = obj_section.build_relocation_map()?;
for (&real_addr, &real_reloc_idx) in &real_map { for (&real_addr, &real_reloc_idx) in &real_map {
let real_reloc = &real_section.relocations[real_reloc_idx]; let real_reloc = &real_section.relocations[real_reloc_idx];
let real_symbol = real_obj.symbols.at(real_reloc.target_symbol); let real_symbol = &real_obj.symbols[real_reloc.target_symbol];
let obj_reloc = match obj_map.get(&real_addr) { let obj_reloc = match obj_map.get(&real_addr) {
Some(v) => &obj_section.relocations[*v], Some(v) => &obj_section.relocations[*v],
None => { None => {
@ -652,7 +860,7 @@ fn validate<P: AsRef<Path>>(obj: &ObjInfo, elf_file: P, state: &AnalyzerState) -
continue; continue;
} }
}; };
let obj_symbol = obj.symbols.at(obj_reloc.target_symbol); let obj_symbol = &obj.symbols[obj_reloc.target_symbol];
if real_reloc.kind != obj_reloc.kind { if real_reloc.kind != obj_reloc.kind {
log::warn!( log::warn!(
"Relocation type mismatch @ {:#010X}: {:?} != {:?}", "Relocation type mismatch @ {:#010X}: {:?} != {:?}",
@ -680,7 +888,7 @@ fn validate<P: AsRef<Path>>(obj: &ObjInfo, elf_file: P, state: &AnalyzerState) -
} }
for (&obj_addr, &obj_reloc_idx) in &obj_map { for (&obj_addr, &obj_reloc_idx) in &obj_map {
let obj_reloc = &obj_section.relocations[obj_reloc_idx]; let obj_reloc = &obj_section.relocations[obj_reloc_idx];
let obj_symbol = obj.symbols.at(obj_reloc.target_symbol); let obj_symbol = &obj.symbols[obj_reloc.target_symbol];
if !real_map.contains_key(&obj_addr) { if !real_map.contains_key(&obj_addr) {
log::warn!( log::warn!(
"Relocation not real @ {:#010X} {:?} to {:#010X}+{:X} ({})", "Relocation not real @ {:#010X} {:?} to {:#010X}+{:X} ({})",
@ -716,19 +924,20 @@ fn diff(args: DiffArgs) -> Result<()> {
log::info!("Loading {}", args.map_file.display()); log::info!("Loading {}", args.map_file.display());
apply_map_file(&args.map_file, &mut linked_obj)?; apply_map_file(&args.map_file, &mut linked_obj)?;
for orig_sym in obj.symbols.iter() { for orig_sym in obj.symbols.iter().filter(|s| s.kind != ObjSymbolKind::Section) {
if orig_sym.kind == ObjSymbolKind::Section || orig_sym.section.is_none() { let Some(orig_section_index) = orig_sym.section else { continue };
continue; let orig_section = &obj.sections[orig_section_index];
} let (linked_section_index, linked_section) =
linked_obj.sections.at_address(orig_sym.address as u32)?;
let linked_sym = linked_obj let linked_sym = linked_obj
.symbols .symbols
.at_address(orig_sym.address as u32) .at_section_address(linked_section_index, orig_sym.address as u32)
.find(|(_, sym)| sym.name == orig_sym.name) .find(|(_, sym)| sym.name == orig_sym.name)
.or_else(|| { .or_else(|| {
linked_obj linked_obj
.symbols .symbols
.at_address(orig_sym.address as u32) .at_section_address(linked_section_index, orig_sym.address as u32)
.find(|(_, sym)| sym.kind == orig_sym.kind) .find(|(_, sym)| sym.kind == orig_sym.kind)
}); });
let mut found = false; let mut found = false;
@ -746,18 +955,14 @@ fn diff(args: DiffArgs) -> Result<()> {
found = true; found = true;
} else if linked_sym.kind == orig_sym.kind && linked_sym.size == orig_sym.size { } else if linked_sym.kind == orig_sym.kind && linked_sym.size == orig_sym.size {
// Fuzzy match // Fuzzy match
let orig_data = obj let orig_data = orig_section.data_range(
.section_data(
orig_sym.address as u32, orig_sym.address as u32,
orig_sym.address as u32 + orig_sym.size as u32, orig_sym.address as u32 + orig_sym.size as u32,
)? )?;
.1; let linked_data = linked_section.data_range(
let linked_data = linked_obj
.section_data(
linked_sym.address as u32, linked_sym.address as u32,
linked_sym.address as u32 + linked_sym.size as u32, linked_sym.address as u32 + linked_sym.size as u32,
)? )?;
.1;
if orig_data == linked_data { if orig_data == linked_data {
found = true; found = true;
} }
@ -771,7 +976,9 @@ fn diff(args: DiffArgs) -> Result<()> {
orig_sym.size, orig_sym.size,
orig_sym.address orig_sym.address
); );
for (_, linked_sym) in linked_obj.symbols.at_address(orig_sym.address as u32) { for (_, linked_sym) in
linked_obj.symbols.at_section_address(linked_section_index, orig_sym.address as u32)
{
log::error!( log::error!(
"At {:#010X}, found: {} (type {:?}, size {:#X})", "At {:#010X}, found: {} (type {:?}, size {:#X})",
linked_sym.address, linked_sym.address,
@ -794,32 +1001,30 @@ fn diff(args: DiffArgs) -> Result<()> {
} }
// Data diff // Data diff
for orig_sym in obj.symbols.iter() { for orig_sym in obj.symbols.iter().filter(|s| s.kind != ObjSymbolKind::Section) {
if orig_sym.kind == ObjSymbolKind::Section || orig_sym.section.is_none() { let Some(orig_section_index) = orig_sym.section else { continue };
continue; let orig_section = &obj.sections[orig_section_index];
} let (linked_section_index, linked_section) =
linked_obj.sections.at_address(orig_sym.address as u32)?;
let (_, linked_sym) = linked_obj let (_, linked_sym) = linked_obj
.symbols .symbols
.at_address(orig_sym.address as u32) .at_section_address(linked_section_index, orig_sym.address as u32)
.find(|(_, sym)| sym.name == orig_sym.name) .find(|(_, sym)| sym.name == orig_sym.name)
.or_else(|| { .or_else(|| {
linked_obj linked_obj
.symbols .symbols
.at_address(orig_sym.address as u32) .at_section_address(linked_section_index, orig_sym.address as u32)
.find(|(_, sym)| sym.kind == orig_sym.kind) .find(|(_, sym)| sym.kind == orig_sym.kind)
}) })
.unwrap(); .unwrap();
let orig_data = obj let orig_data = orig_section
.section_data(orig_sym.address as u32, orig_sym.address as u32 + orig_sym.size as u32)? .data_range(orig_sym.address as u32, orig_sym.address as u32 + orig_sym.size as u32)?;
.1; let linked_data = linked_section.data_range(
let linked_data = linked_obj
.section_data(
linked_sym.address as u32, linked_sym.address as u32,
linked_sym.address as u32 + linked_sym.size as u32, linked_sym.address as u32 + linked_sym.size as u32,
)? )?;
.1;
if orig_data != linked_data { if orig_data != linked_data {
log::error!( log::error!(
"Data mismatch for {} (type {:?}, size {:#X}) at {:#010X}", "Data mismatch for {} (type {:?}, size {:#X}) at {:#010X}",
@ -861,14 +1066,21 @@ fn apply(args: ApplyArgs) -> Result<()> {
let mut replacements: Vec<(SymbolIndex, Option<ObjSymbol>)> = vec![]; let mut replacements: Vec<(SymbolIndex, Option<ObjSymbol>)> = vec![];
for (orig_idx, orig_sym) in obj.symbols.iter().enumerate() { for (orig_idx, orig_sym) in obj.symbols.iter().enumerate() {
// skip ABS for now
if orig_sym.section.is_none() {
continue;
}
let (linked_section_index, _linked_section) =
linked_obj.sections.at_address(orig_sym.address as u32)?;
let linked_sym = linked_obj let linked_sym = linked_obj
.symbols .symbols
.at_address(orig_sym.address as u32) .at_section_address(linked_section_index, orig_sym.address as u32)
.find(|(_, sym)| sym.name == orig_sym.name) .find(|(_, sym)| sym.name == orig_sym.name)
.or_else(|| { .or_else(|| {
linked_obj linked_obj
.symbols .symbols
.at_address(orig_sym.address as u32) .at_section_address(linked_section_index, orig_sym.address as u32)
.find(|(_, sym)| sym.kind == orig_sym.kind) .find(|(_, sym)| sym.kind == orig_sym.kind)
}); });
if let Some((_, linked_sym)) = linked_sym { if let Some((_, linked_sym)) = linked_sym {
@ -929,18 +1141,21 @@ fn apply(args: ApplyArgs) -> Result<()> {
for linked_sym in linked_obj.symbols.iter() { for linked_sym in linked_obj.symbols.iter() {
if matches!(linked_sym.kind, ObjSymbolKind::Section) if matches!(linked_sym.kind, ObjSymbolKind::Section)
|| is_linker_generated_object(&linked_sym.name) || is_linker_generated_object(&linked_sym.name)
// skip ABS for now
|| linked_sym.section.is_none()
{ {
continue; continue;
} }
let (orig_section_index, _orig_section) =
obj.sections.at_address(linked_sym.address as u32)?;
let orig_sym = obj let orig_sym = obj
.symbols .symbols
.at_address(linked_sym.address as u32) .at_section_address(orig_section_index, linked_sym.address as u32)
.find(|(_, sym)| sym.name == linked_sym.name) .find(|(_, sym)| sym.name == linked_sym.name)
.or_else(|| { .or_else(|| {
linked_obj obj.symbols
.symbols .at_section_address(orig_section_index, linked_sym.address as u32)
.at_address(linked_sym.address as u32)
.find(|(_, sym)| sym.kind == linked_sym.kind) .find(|(_, sym)| sym.kind == linked_sym.kind)
}); });
if orig_sym.is_none() { if orig_sym.is_none() {
@ -951,7 +1166,18 @@ fn apply(args: ApplyArgs) -> Result<()> {
linked_sym.size, linked_sym.size,
linked_sym.address linked_sym.address
); );
obj.symbols.add_direct(linked_sym.clone())?; obj.symbols.add_direct(ObjSymbol {
name: linked_sym.name.clone(),
demangled_name: linked_sym.demangled_name.clone(),
address: linked_sym.address,
section: Some(orig_section_index),
size: linked_sym.size,
size_known: linked_sym.size_known,
flags: linked_sym.flags,
kind: linked_sym.kind,
align: linked_sym.align,
data_kind: linked_sym.data_kind,
})?;
} }
} }

View File

@ -16,16 +16,14 @@ use object::{
}; };
use crate::{ use crate::{
obj::{ obj::ObjKind,
signatures::{compare_signature, generate_signature, FunctionSignature},
split::split_obj,
ObjKind,
},
util::{ util::{
asm::write_asm, asm::write_asm,
config::{write_splits_file, write_symbols_file}, config::{write_splits_file, write_symbols_file},
elf::{process_elf, write_elf}, elf::{process_elf, write_elf},
file::{buf_writer, process_rsp}, file::{buf_writer, process_rsp},
signatures::{compare_signature, generate_signature, FunctionSignature},
split::split_obj,
}, },
}; };
@ -148,9 +146,6 @@ fn disasm(args: DisasmArgs) -> Result<()> {
let out_path = asm_dir.join(file_name_from_unit(&unit.name, ".s")); let out_path = asm_dir.join(file_name_from_unit(&unit.name, ".s"));
log::info!("Writing {}", out_path.display()); log::info!("Writing {}", out_path.display());
if let Some(parent) = out_path.parent() {
DirBuilder::new().recursive(true).create(parent)?;
}
let mut w = buf_writer(out_path)?; let mut w = buf_writer(out_path)?;
write_asm(&mut w, split_obj)?; write_asm(&mut w, split_obj)?;
w.flush()?; w.flush()?;
@ -160,9 +155,6 @@ fn disasm(args: DisasmArgs) -> Result<()> {
files_out.flush()?; files_out.flush()?;
} }
ObjKind::Relocatable => { ObjKind::Relocatable => {
if let Some(parent) = args.out.parent() {
DirBuilder::new().recursive(true).create(parent)?;
}
let mut w = buf_writer(args.out)?; let mut w = buf_writer(args.out)?;
write_asm(&mut w, &obj)?; write_asm(&mut w, &obj)?;
w.flush()?; w.flush()?;

View File

@ -107,25 +107,24 @@ fn merge(args: MergeArgs) -> Result<()> {
let mut section_map: BTreeMap<u32, BTreeMap<u32, u32>> = BTreeMap::new(); let mut section_map: BTreeMap<u32, BTreeMap<u32, u32>> = BTreeMap::new();
let mut offset = align32(arena_lo + 0x2000); let mut offset = align32(arena_lo + 0x2000);
for module in module_map.values() { for module in module_map.values() {
for mod_section in &module.sections { for (mod_section_index, mod_section) in module.sections.iter() {
let section_idx = obj.sections.len();
ensure!(mod_section.relocations.is_empty(), "Unsupported relocations during merge"); ensure!(mod_section.relocations.is_empty(), "Unsupported relocations during merge");
obj.sections.push(ObjSection { let section_idx = obj.sections.push(ObjSection {
name: format!("{}:{}", mod_section.name, module.module_id), name: format!("{}:{}", mod_section.name, module.module_id),
kind: mod_section.kind, kind: mod_section.kind,
address: offset as u64, address: offset as u64,
size: mod_section.size, size: mod_section.size,
data: mod_section.data.clone(), data: mod_section.data.clone(),
align: mod_section.align, align: mod_section.align,
index: section_idx,
elf_index: mod_section.elf_index, elf_index: mod_section.elf_index,
relocations: vec![], relocations: vec![],
original_address: mod_section.original_address, original_address: mod_section.original_address,
file_offset: mod_section.file_offset, file_offset: mod_section.file_offset,
section_known: mod_section.section_known, section_known: mod_section.section_known,
splits: mod_section.splits.clone(),
}); });
section_map.nested_insert(module.module_id, mod_section.elf_index as u32, offset)?; section_map.nested_insert(module.module_id, mod_section.elf_index as u32, offset)?;
for (_, mod_symbol) in module.symbols.for_section(mod_section) { for (_, mod_symbol) in module.symbols.for_section(mod_section_index) {
obj.symbols.add_direct(ObjSymbol { obj.symbols.add_direct(ObjSymbol {
name: mod_symbol.name.clone(), name: mod_symbol.name.clone(),
demangled_name: mod_symbol.demangled_name.clone(), demangled_name: mod_symbol.demangled_name.clone(),
@ -157,8 +156,8 @@ fn merge(args: MergeArgs) -> Result<()> {
})?; })?;
section_map[&(rel_reloc.target_section as u32)] + rel_reloc.addend section_map[&(rel_reloc.target_section as u32)] + rel_reloc.addend
}; };
let source_section_index = obj.section_at(source_addr)?.index; let (source_section_index, _) = obj.sections.at_address(source_addr)?;
let target_section_index = obj.section_at(target_addr)?.index; let (target_section_index, _) = obj.sections.at_address(target_addr)?;
let (symbol_idx, addend) = if let Some((symbol_idx, symbol)) = let (symbol_idx, addend) = if let Some((symbol_idx, symbol)) =
obj.symbols.for_relocation(target_addr, rel_reloc.kind)? obj.symbols.for_relocation(target_addr, rel_reloc.kind)?
@ -185,6 +184,7 @@ fn merge(args: MergeArgs) -> Result<()> {
address: source_addr as u64, address: source_addr as u64,
target_symbol: symbol_idx, target_symbol: symbol_idx,
addend, addend,
module: None,
}); });
} }
} }
@ -217,11 +217,11 @@ fn merge(args: MergeArgs) -> Result<()> {
} }
fn link_relocations(obj: &mut ObjInfo) -> Result<()> { fn link_relocations(obj: &mut ObjInfo) -> Result<()> {
for section in &mut obj.sections { for (_, section) in obj.sections.iter_mut() {
for reloc in &section.relocations { for reloc in &section.relocations {
let source_address = reloc.address /*& !3*/; let source_address = reloc.address /*& !3*/;
let target_address = let target_address =
(obj.symbols.address_of(reloc.target_symbol) as i64 + reloc.addend) as u32; (obj.symbols[reloc.target_symbol].address as i64 + reloc.addend) as u32;
let ins_ref = let ins_ref =
array_ref_mut!(section.data, (source_address - section.address) as usize, 4); array_ref_mut!(section.data, (source_address - section.address) as usize, 4);
let mut ins = u32::from_be_bytes(*ins_ref); let mut ins = u32::from_be_bytes(*ins_ref);

View File

@ -1,180 +1,23 @@
pub mod signatures; mod sections;
pub mod split; mod splits;
mod symbols;
use std::{ use std::{
cmp::{max, min}, cmp::{max, min},
collections::{btree_map, BTreeMap, BTreeSet, HashMap}, collections::{BTreeMap, BTreeSet},
hash::{Hash, Hasher}, hash::Hash,
ops::{Range, RangeBounds},
}; };
use anyhow::{anyhow, bail, ensure, Result}; use anyhow::{anyhow, bail, ensure, Result};
use flagset::{flags, FlagSet}; pub use sections::{section_kind_for_section, ObjSection, ObjSectionKind, ObjSections};
use itertools::Itertools;
use serde::{Deserialize, Serialize}; use serde::{Deserialize, Serialize};
use serde_repr::{Deserialize_repr, Serialize_repr}; pub use splits::{ObjSplit, ObjSplits};
pub use symbols::{
use crate::{ ObjDataKind, ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags, ObjSymbolKind, ObjSymbolScope,
obj::split::is_linker_generated_label, ObjSymbols, SymbolIndex,
util::{comment::MWComment, nested::NestedVec, rel::RelReloc},
}; };
#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize, Default)] use crate::util::{comment::MWComment, rel::RelReloc};
/// Scope of a symbol, as produced by `ObjSymbolFlagSet::scope` and consumed by
/// `ObjSymbolFlagSet::set_scope`.
pub enum ObjSymbolScope {
/// None of the scope flags is set; this is the default value.
#[default]
Unknown,
/// Reported when the `Global` flag is set and neither `Local` nor `Weak` is.
Global,
/// Reported when the `Weak` flag is set and `Local` is not.
Weak,
/// Reported whenever the `Local` flag is set.
Local,
}
// Individual symbol flags. They are stored as a set inside `ObjSymbolFlagSet`,
// whose helper methods test and modify them.
flags! {
#[repr(u8)]
#[derive(Deserialize_repr, Serialize_repr)]
pub enum ObjSymbolFlags: u8 {
// Scope flags: read by `ObjSymbolFlagSet::scope`, written by `set_scope`.
Global,
Local,
Weak,
// Tested by `ObjSymbolFlagSet::is_common`.
Common,
// Tested by `ObjSymbolFlagSet::is_hidden`.
Hidden,
// Tested by `is_force_active`, toggled by `set_force_active`.
ForceActive,
}
}
/// Newtype wrapper around a `FlagSet` of `ObjSymbolFlags`.
///
/// The inner set is public; the wrapper's methods provide scope and flag helpers.
#[derive(Debug, Copy, Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
pub struct ObjSymbolFlagSet(pub FlagSet<ObjSymbolFlags>);
impl ObjSymbolFlagSet {
    /// Derives the symbol scope from the scope flags.
    ///
    /// `Local` wins over `Weak`, which wins over `Global`. When none of the
    /// three is set the scope is `Unknown`.
    #[inline]
    pub fn scope(&self) -> ObjSymbolScope {
        if self.is_local() {
            return ObjSymbolScope::Local;
        }
        if self.is_weak() {
            return ObjSymbolScope::Weak;
        }
        if self.0.contains(ObjSymbolFlags::Global) {
            return ObjSymbolScope::Global;
        }
        ObjSymbolScope::Unknown
    }

    /// Returns `true` when the `Local` flag is set.
    #[inline]
    pub fn is_local(&self) -> bool { self.0.contains(ObjSymbolFlags::Local) }

    /// Returns `true` when the `Local` flag is NOT set (the `Global` flag itself
    /// is not consulted).
    #[inline]
    pub fn is_global(&self) -> bool { !self.is_local() }

    /// Returns `true` when the `Common` flag is set.
    #[inline]
    pub fn is_common(&self) -> bool { self.0.contains(ObjSymbolFlags::Common) }

    /// Returns `true` when the `Weak` flag is set.
    #[inline]
    pub fn is_weak(&self) -> bool { self.0.contains(ObjSymbolFlags::Weak) }

    /// Returns `true` when the `Hidden` flag is set.
    #[inline]
    pub fn is_hidden(&self) -> bool { self.0.contains(ObjSymbolFlags::Hidden) }

    /// Returns `true` when the `ForceActive` flag is set.
    #[inline]
    pub fn is_force_active(&self) -> bool { self.0.contains(ObjSymbolFlags::ForceActive) }

    /// Replaces the scope flags so that exactly the flag matching `scope` is set
    /// (or none of them for `Unknown`). All other flags are left untouched.
    #[inline]
    pub fn set_scope(&mut self, scope: ObjSymbolScope) {
        // Clear every scope bit first, then raise the single requested one.
        self.0 &= !(ObjSymbolFlags::Local | ObjSymbolFlags::Global | ObjSymbolFlags::Weak);
        match scope {
            ObjSymbolScope::Unknown => {}
            ObjSymbolScope::Global => self.0 |= ObjSymbolFlags::Global,
            ObjSymbolScope::Weak => self.0 |= ObjSymbolFlags::Weak,
            ObjSymbolScope::Local => self.0 |= ObjSymbolFlags::Local,
        }
    }

    /// Sets or clears the `ForceActive` flag.
    #[inline]
    pub fn set_force_active(&mut self, value: bool) {
        if !value {
            self.0 &= !ObjSymbolFlags::ForceActive;
            return;
        }
        self.0 |= ObjSymbolFlags::ForceActive;
    }
}
// Manual `Hash` implementation alongside the derived `PartialEq`/`Eq`;
// the clippy lint about mixing derived and manual impls is silenced here.
#[allow(clippy::derived_hash_with_manual_eq)]
impl Hash for ObjSymbolFlagSet {
// Hashes the raw bit representation of the wrapped flag set.
fn hash<H: Hasher>(&self, state: &mut H) { self.0.bits().hash(state) }
}
/// Category of an object section.
#[derive(Debug, Copy, Clone, Eq, PartialEq, Hash)]
pub enum ObjSectionKind {
/// Executable code.
Code,
/// Data (presumably writable, in contrast to `ReadOnlyData` — confirm against users).
Data,
/// Read-only data.
ReadOnlyData,
/// BSS; `ObjInfo::section_data` returns an empty slice for sections of this kind.
Bss,
}
/// A single section of an object, together with its contents and relocations.
#[derive(Debug, Clone)]
pub struct ObjSection {
/// Section name.
pub name: String,
/// Section category.
pub kind: ObjSectionKind,
/// Start address; the section covers `address..address + size`.
pub address: u64,
/// Size of the section in address units.
pub size: u64,
/// Raw section contents, indexed relative to `address`.
pub data: Vec<u8>,
/// Section alignment.
pub align: u64,
/// Index of this section; compared against `ObjSymbol::section` when
/// selecting the symbols that belong to a section.
pub index: usize,
/// REL files reference the original ELF section indices
pub elf_index: usize,
/// Relocations located in this section.
pub relocations: Vec<ObjReloc>,
/// NOTE(review): presumably the address before any relocation/merge — confirm.
pub original_address: u64,
/// NOTE(review): presumably the offset of the section within its source file — confirm.
pub file_offset: u64,
/// Set to `true` by `rename`, i.e. once the section has been given a known name.
pub section_known: bool,
}
/// Kind of a symbol.
#[derive(Debug, Copy, Clone, Eq, PartialEq, Hash, Default, Serialize, Deserialize)]
pub enum ObjSymbolKind {
/// Default kind; relocation lookup treats symbols of this kind as labels.
#[default]
Unknown,
/// Function symbol.
Function,
/// Object symbol.
Object,
/// Section symbol.
Section,
}
/// Data representation hint attached to a symbol.
///
/// NOTE(review): the variant names suggest element widths and string encodings;
/// the exact interpretation is defined by the consumers, not visible here.
#[derive(Debug, Copy, Clone, Default, PartialEq, Eq)]
pub enum ObjDataKind {
/// No representation known; this is the default. When a symbol is replaced
/// with one of this kind, the existing symbol's data kind is kept.
#[default]
Unknown,
Byte,
Byte2,
Byte4,
Byte8,
Float,
Double,
String,
String16,
StringTable,
String16Table,
}
/// A symbol within an object.
#[derive(Debug, Clone, Default, Eq, PartialEq)]
pub struct ObjSymbol {
/// Symbol name; symbols with an empty name are not entered into the name index.
pub name: String,
/// Demangled form of `name`, if available.
pub demangled_name: Option<String>,
/// Symbol address; used (truncated to `u32`) as the key of the address index.
pub address: u64,
/// Index of the containing section; `None` is treated as an ABS symbol by
/// the lookup helpers.
pub section: Option<usize>,
/// Symbol size; `0` is treated as "unsized" by relocation lookup.
pub size: u64,
/// Whether `size` is known rather than a placeholder.
pub size_known: bool,
/// Scope and miscellaneous flags.
pub flags: ObjSymbolFlagSet,
/// Symbol kind.
pub kind: ObjSymbolKind,
/// Optional alignment.
pub align: Option<u32>,
/// Data representation hint.
pub data_kind: ObjDataKind,
}
#[derive(Debug, Copy, Clone, Eq, PartialEq, Hash)] #[derive(Debug, Copy, Clone, Eq, PartialEq, Hash)]
pub enum ObjKind { pub enum ObjKind {
@ -199,34 +42,13 @@ pub struct ObjUnit {
pub comment_version: Option<u8>, pub comment_version: Option<u8>,
} }
/// Marks a split point within a section.
///
/// The start address of a split is not stored here; it is the key under which
/// the split is registered.
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct ObjSplit {
/// Name of the unit this split belongs to.
pub unit: String,
/// End address of the split. Lookups treat `0` as "no end recorded" and
/// otherwise require the queried address to be below `end`.
pub end: u32,
/// Optional alignment of the split.
pub align: Option<u32>,
/// Whether this is a part of common BSS.
pub common: bool,
/// Generated, replaceable by user.
pub autogenerated: bool,
}
/// Index of a symbol within `ObjSymbols`.
pub type SymbolIndex = usize;
/// Symbol table with secondary indexes by address and by name.
#[derive(Debug, Clone)]
pub struct ObjSymbols {
// All symbols; a `SymbolIndex` is a position in this vector.
symbols: Vec<ObjSymbol>,
// Address (truncated to u32) -> indexes of the symbols at that address.
symbols_by_address: BTreeMap<u32, Vec<SymbolIndex>>,
// Non-empty name -> indexes of the symbols carrying that name.
symbols_by_name: HashMap<String, Vec<SymbolIndex>>,
}
#[derive(Debug, Clone)] #[derive(Debug, Clone)]
pub struct ObjInfo { pub struct ObjInfo {
pub kind: ObjKind, pub kind: ObjKind,
pub architecture: ObjArchitecture, pub architecture: ObjArchitecture,
pub name: String, pub name: String,
pub symbols: ObjSymbols, pub symbols: ObjSymbols,
pub sections: Vec<ObjSection>, pub sections: ObjSections,
pub entry: u64, pub entry: u64,
pub mw_comment: Option<MWComment>, pub mw_comment: Option<MWComment>,
@ -240,7 +62,6 @@ pub struct ObjInfo {
pub arena_hi: Option<u32>, pub arena_hi: Option<u32>,
// Extracted // Extracted
pub splits: BTreeMap<u32, Vec<ObjSplit>>,
pub named_sections: BTreeMap<u32, String>, pub named_sections: BTreeMap<u32, String>,
pub link_order: Vec<ObjUnit>, pub link_order: Vec<ObjUnit>,
pub blocked_ranges: BTreeMap<u32, u32>, // start -> end pub blocked_ranges: BTreeMap<u32, u32>, // start -> end
@ -271,312 +92,8 @@ pub struct ObjReloc {
pub address: u64, pub address: u64,
pub target_symbol: SymbolIndex, pub target_symbol: SymbolIndex,
pub addend: i64, pub addend: i64,
} /// If present, relocation against external module
pub module: Option<u32>,
impl ObjSymbols {
/// Builds the symbol table from `symbols`, indexing every symbol by address
/// and every symbol with a non-empty name by name.
pub fn new(symbols: Vec<ObjSymbol>) -> Self {
    let mut by_address: BTreeMap<u32, Vec<SymbolIndex>> = BTreeMap::new();
    let mut by_name: HashMap<String, Vec<SymbolIndex>> = HashMap::new();
    symbols.iter().enumerate().for_each(|(index, sym)| {
        by_address.nested_push(sym.address as u32, index);
        // Unnamed symbols are reachable by address only.
        if !sym.name.is_empty() {
            by_name.nested_push(sym.name.clone(), index);
        }
    });
    Self { symbols, symbols_by_address: by_address, symbols_by_name: by_name }
}
/// Adds `in_symbol`, merging it with a compatible symbol already present at
/// the same address.
///
/// An existing symbol is considered compatible when it has the same kind (or is
/// an `Unknown` symbol named `lbl_*`), lives in the same section as `in_symbol`,
/// and — for symbols without a section — also has the same name.
///
/// * With a compatible symbol and `replace == false`, the existing symbol is
///   kept; only its size is filled in when it was unknown and the incoming
///   size is known.
/// * With a compatible symbol and `replace == true`, the existing entry is
///   overwritten with the incoming data, falling back to the existing
///   alignment and data kind where the incoming symbol has none.
/// * Without a compatible symbol, `in_symbol` is appended.
///
/// Returns the index of the existing, replaced or newly added symbol.
pub fn add(&mut self, in_symbol: ObjSymbol, replace: bool) -> Result<SymbolIndex> {
let opt = self.at_address(in_symbol.address as u32).find(|(_, symbol)| {
(symbol.kind == in_symbol.kind ||
// Replace lbl_* with real symbols
(symbol.kind == ObjSymbolKind::Unknown && symbol.name.starts_with("lbl_")))
// Hack to avoid replacing different ABS symbols
&& (symbol.section.is_some() || symbol.name == in_symbol.name)
// Avoid replacing symbols with ABS symbols, and vice versa
&& (symbol.section == in_symbol.section)
});
let target_symbol_idx = if let Some((symbol_idx, existing)) = opt {
// Pick the size to keep: on a conflict between two known sizes, `replace`
// decides which side wins; otherwise a known incoming size is preferred.
let size =
if existing.size_known && in_symbol.size_known && existing.size != in_symbol.size {
log::warn!(
"Conflicting size for {}: was {:#X}, now {:#X}",
existing.name,
existing.size,
in_symbol.size
);
if replace {
in_symbol.size
} else {
existing.size
}
} else if in_symbol.size_known {
in_symbol.size
} else {
existing.size
};
if !replace {
// Not replacing existing symbol, but update size
if in_symbol.size_known && !existing.size_known {
self.replace(symbol_idx, ObjSymbol {
size: in_symbol.size,
size_known: true,
..existing.clone()
})?;
}
return Ok(symbol_idx);
}
let new_symbol = ObjSymbol {
name: in_symbol.name,
demangled_name: in_symbol.demangled_name,
address: in_symbol.address,
section: in_symbol.section,
size,
// A non-zero incoming size counts as known, regardless of in_symbol.size_known.
size_known: existing.size_known || in_symbol.size != 0,
flags: in_symbol.flags,
kind: in_symbol.kind,
align: in_symbol.align.or(existing.align),
data_kind: match in_symbol.data_kind {
ObjDataKind::Unknown => existing.data_kind,
kind => kind,
},
};
// Skip the write (and the debug log) when nothing would change.
if existing != &new_symbol {
log::debug!("Replacing {:?} with {:?}", existing, new_symbol);
self.replace(symbol_idx, new_symbol)?;
}
symbol_idx
} else {
// No compatible symbol at this address: append a new one.
let target_symbol_idx = self.symbols.len();
self.add_direct(ObjSymbol {
name: in_symbol.name,
demangled_name: in_symbol.demangled_name,
address: in_symbol.address,
section: in_symbol.section,
size: in_symbol.size,
size_known: in_symbol.size != 0,
flags: in_symbol.flags,
kind: in_symbol.kind,
align: in_symbol.align,
data_kind: in_symbol.data_kind,
})?;
target_symbol_idx
};
Ok(target_symbol_idx)
}
/// Appends `in_symbol` without looking for an existing symbol to merge with,
/// registers it in the address index (and the name index when it has a
/// non-empty name), and returns its index.
pub fn add_direct(&mut self, in_symbol: ObjSymbol) -> Result<SymbolIndex> {
    // The new symbol lands at the end of the vector.
    let new_index = self.symbols.len();
    let has_name = !in_symbol.name.is_empty();
    self.symbols_by_address.nested_push(in_symbol.address as u32, new_index);
    if has_name {
        self.symbols_by_name.nested_push(in_symbol.name.clone(), new_index);
    }
    self.symbols.push(in_symbol);
    Ok(new_index)
}
/// Returns the symbol stored at `symbol_idx`. Panics if the index is out of bounds.
pub fn at(&self, symbol_idx: SymbolIndex) -> &ObjSymbol { &self.symbols[symbol_idx] }
/// Returns the address of the symbol at `symbol_idx`. Panics if the index is out of bounds.
pub fn address_of(&self, symbol_idx: SymbolIndex) -> u64 { self.symbols[symbol_idx].address }
/// Iterates over all symbols in index (insertion) order.
pub fn iter(&self) -> impl DoubleEndedIterator<Item = &ObjSymbol> { self.symbols.iter() }
/// Returns the number of symbols in the table.
pub fn count(&self) -> usize { self.symbols.len() }
/// Iterates over every symbol registered at exactly `addr`, in the order they
/// were indexed. Yields nothing when no symbol lives at that address.
pub fn at_address(
    &self,
    addr: u32,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
    // A missing entry behaves like an empty list of indexes.
    let indexes: &[SymbolIndex] =
        self.symbols_by_address.get(&addr).map(Vec::as_slice).unwrap_or_default();
    indexes.iter().map(move |&index| (index, &self.symbols[index]))
}
/// Returns the single symbol of the given `kind` at `addr`, or `None` when
/// there is none.
///
/// # Errors
/// Fails when more than one symbol of that kind exists at the address.
pub fn kind_at_address(
    &self,
    addr: u32,
    kind: ObjSymbolKind,
) -> Result<Option<(SymbolIndex, &ObjSymbol)>> {
    let mut matching = self.at_address(addr).filter(|(_, sym)| sym.kind == kind);
    let first = matching.next();
    // A second match makes the lookup ambiguous.
    ensure!(
        matching.next().is_none(),
        "Multiple symbols of kind {:?} at address {:#010X}",
        kind,
        addr
    );
    Ok(first)
}
/// Iterates over all symbols in ascending address order, including ABS symbols.
/// Symbols sharing an address are yielded in the order they were indexed.
pub fn iter_ordered(&self) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
    self.symbols_by_address
        .values()
        .flatten()
        .map(move |&index| (index, &self.symbols[index]))
}
/// Iterates over the symbols whose address falls within `range`, in ascending
/// address order, excluding ABS symbols.
///
/// A symbol is kept when it belongs to a section or carries the `Common` flag.
pub fn for_range<R>(
    &self,
    range: R,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)>
where
    R: RangeBounds<u32>,
{
    self.symbols_by_address
        .range(range)
        .flat_map(|(_, indexes)| indexes.iter())
        .map(move |&index| (index, &self.symbols[index]))
        // Ignore ABS symbols
        .filter(|(_, sym)| sym.section.is_some() || sym.flags.is_common())
}
/// Iterates over the address index entries within `range`, yielding each
/// address together with the indexes of all symbols registered there.
/// No ABS filtering is applied.
pub fn indexes_for_range<R>(
    &self,
    range: R,
) -> impl DoubleEndedIterator<Item = (u32, &[SymbolIndex])>
where
    R: RangeBounds<u32>,
{
    self.symbols_by_address
        .range(range)
        .map(|(&address, indexes)| (address, indexes.as_slice()))
}
/// Iterates over the symbols that lie within `section`'s address range and
/// whose `section` field refers to `section.index`.
pub fn for_section(
    &self,
    section: &ObjSection,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
    let start = section.address as u32;
    let end = (section.address + section.size) as u32;
    // Copied out so the returned iterator does not borrow `section`.
    let wanted = Some(section.index);
    self.for_range(start..end).filter(move |(_, symbol)| symbol.section == wanted)
}
/// Iterates over every symbol registered under `name`. Yields nothing when
/// the name is unknown.
pub fn for_name(
    &self,
    name: &str,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
    self.symbols_by_name
        .get(name)
        .into_iter()
        .flatten()
        .map(move |&index| (index, &self.symbols[index]))
}
/// Looks up the unique symbol called `name`.
///
/// Returns `Ok(None)` when no symbol has that name.
///
/// # Errors
/// Fails when two or more symbols share the name; the message reports the
/// first two.
pub fn by_name(&self, name: &str) -> Result<Option<(SymbolIndex, &ObjSymbol)>> {
    let mut candidates = self.for_name(name);
    let Some((index, symbol)) = candidates.next() else {
        return Ok(None);
    };
    if let Some((other_index, other_symbol)) = candidates.next() {
        bail!(
            "Multiple symbols with name {}: {} {:?} {:#010X} and {} {:?} {:#010X}",
            name,
            index,
            symbol.kind,
            symbol.address,
            other_index,
            other_symbol.kind,
            other_symbol.address
        );
    }
    Ok(Some((index, symbol)))
}
/// Iterates over all symbols of the given `kind`, in index order, paired with
/// their indexes.
pub fn by_kind(
&self,
kind: ObjSymbolKind,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
self.symbols.iter().enumerate().filter(move |(_, sym)| sym.kind == kind)
}
/// Overwrites the symbol at `index` with `symbol`, keeping the name index in
/// sync when the name changes.
///
/// The address index is not touched, so the address must stay the same.
///
/// # Errors
/// Fails when `symbol.address` differs from the address of the stored symbol.
pub fn replace(&mut self, index: SymbolIndex, symbol: ObjSymbol) -> Result<()> {
    let current = &mut self.symbols[index];
    ensure!(current.address == symbol.address, "Can't modify address with replace_symbol");
    let renamed = current.name != symbol.name;
    // Drop the old name entry, if there was one.
    if renamed && !current.name.is_empty() {
        self.symbols_by_name.nested_remove(&current.name, &index);
    }
    // Register the new name, unless it is empty.
    if renamed && !symbol.name.is_empty() {
        self.symbols_by_name.nested_push(symbol.name.clone(), index);
    }
    *current = symbol;
    Ok(())
}
/// Finds the symbol a relocation to `target_addr` should refer to.
///
/// Tries to find a previous sized symbol that encompasses the target: the
/// address index is walked downwards starting at `target_addr`. At each
/// address the best candidate is chosen (see the ranking below), then:
///
/// * if the candidate sits exactly at `target_addr`, it is the result;
/// * otherwise, if it has a non-zero size, it is the result only when
///   `target_addr` lies inside it, and the search stops either way;
/// * otherwise (unsized, lower address) the search continues downwards.
///
/// Returns `Ok(None)` when no suitable symbol is found.
pub fn for_relocation(
&self,
target_addr: u32,
reloc_kind: ObjRelocKind,
) -> Result<Option<(SymbolIndex, &ObjSymbol)>> {
let mut result = None;
for (_addr, symbol_idxs) in self.indexes_for_range(..=target_addr).rev() {
let mut symbols = symbol_idxs
.iter()
.map(|&idx| (idx, self.at(idx)))
.filter(|(_, sym)| {
// Linker generated labels can only be used with @ha/@h/@l relocations
!is_linker_generated_label(&sym.name)
|| (matches!(
reloc_kind,
ObjRelocKind::PpcAddr16Ha
| ObjRelocKind::PpcAddr16Hi
| ObjRelocKind::PpcAddr16Lo
))
})
.collect_vec();
let (symbol_idx, symbol) = if symbols.len() == 1 {
symbols.pop().unwrap()
} else {
// Several (or zero) candidates: order them by descending rank and take
// the first. The key is the negated rank, so higher ranks sort first.
symbols.sort_by_key(|&(_, symbol)| {
let mut rank = match symbol.kind {
ObjSymbolKind::Function | ObjSymbolKind::Object => match reloc_kind {
ObjRelocKind::PpcAddr16Hi
| ObjRelocKind::PpcAddr16Ha
| ObjRelocKind::PpcAddr16Lo => 1,
ObjRelocKind::Absolute
| ObjRelocKind::PpcRel24
| ObjRelocKind::PpcRel14
| ObjRelocKind::PpcEmbSda21 => 2,
},
// Label
ObjSymbolKind::Unknown => match reloc_kind {
ObjRelocKind::PpcAddr16Hi
| ObjRelocKind::PpcAddr16Ha
| ObjRelocKind::PpcAddr16Lo
if !symbol.name.starts_with("..") =>
{
3
}
_ => 1,
},
ObjSymbolKind::Section => -1,
};
// Sized symbols are preferred over unsized ones of the same class.
if symbol.size > 0 {
rank += 1;
}
-rank
});
match symbols.first() {
Some(&v) => v,
// Every symbol at this address was filtered out; try the next lower one.
None => continue,
}
};
if symbol.address == target_addr as u64 {
result = Some((symbol_idx, symbol));
break;
}
if symbol.size > 0 {
if symbol.address + symbol.size > target_addr as u64 {
result = Some((symbol_idx, symbol));
}
break;
}
}
Ok(result)
}
/// Returns a mutable reference to the flags of the symbol at `idx`.
/// Panics if the index is out of bounds.
#[inline]
pub fn flags(&mut self, idx: SymbolIndex) -> &mut ObjSymbolFlagSet {
&mut self.symbols[idx].flags
}
} }
impl ObjInfo { impl ObjInfo {
@ -591,8 +108,8 @@ impl ObjInfo {
kind, kind,
architecture, architecture,
name, name,
symbols: ObjSymbols::new(symbols), symbols: ObjSymbols::new(kind, symbols),
sections, sections: ObjSections::new(kind, sections),
entry: 0, entry: 0,
mw_comment: Default::default(), mw_comment: Default::default(),
sda2_base: None, sda2_base: None,
@ -602,7 +119,7 @@ impl ObjInfo {
db_stack_addr: None, db_stack_addr: None,
arena_lo: None, arena_lo: None,
arena_hi: None, arena_hi: None,
splits: Default::default(), // splits: Default::default(),
named_sections: Default::default(), named_sections: Default::default(),
link_order: vec![], link_order: vec![],
blocked_ranges: Default::default(), blocked_ranges: Default::default(),
@ -626,86 +143,11 @@ impl ObjInfo {
self.symbols.add(in_symbol, replace) self.symbols.add(in_symbol, replace)
} }
pub fn section_at(&self, addr: u32) -> Result<&ObjSection> { pub fn add_split(&mut self, section_index: usize, address: u32, split: ObjSplit) -> Result<()> {
self.sections let section = self
.iter() .sections
.find(|s| s.contains(addr)) .get_mut(section_index)
.ok_or_else(|| anyhow!("Failed to locate section @ {:#010X}", addr)) .ok_or_else(|| anyhow!("Invalid section index {}", section_index))?;
}
/// Returns the first section that fully contains `range`.
///
/// # Errors
/// Fails when no section contains the whole range.
pub fn section_for(&self, range: Range<u32>) -> Result<&ObjSection> {
    for section in self.sections.iter() {
        if section.contains_range(range.clone()) {
            return Ok(section);
        }
    }
    Err(anyhow!("Failed to locate section @ {:#010X}-{:#010X}", range.start, range.end))
}
/// Returns the section containing `start` together with the bytes for
/// `start..end`.
///
/// * For BSS sections the returned slice is empty.
/// * `end == 0` selects everything from `start` to the end of the section data.
/// * Otherwise the slice end is clamped to the length of the section data.
///
/// # Errors
/// Fails when no section contains `start`, or when `start..end` is not fully
/// inside that section.
pub fn section_data(&self, start: u32, end: u32) -> Result<(&ObjSection, &[u8])> {
    let section = self.section_at(start)?;
    ensure!(
        section.contains_range(start..end),
        "Range {:#010X}-{:#010X} outside of section {}: {:#010X}-{:#010X}",
        start,
        end,
        section.name,
        section.address,
        section.address + section.size
    );
    if section.kind == ObjSectionKind::Bss {
        return Ok((section, &[]));
    }
    // Offsets are relative to the section's start address.
    let from = (start as u64 - section.address) as usize;
    let data = match end {
        0 => &section.data[from..],
        _ => {
            let to = min(section.data.len(), (end as u64 - section.address) as usize);
            &section.data[from..to]
        }
    };
    Ok((section, data))
}
/// Locate an existing split for the given address.
///
/// Considers only the last split starting at or before `address`; it matches
/// when its `end` is `0` or lies beyond `address`.
pub fn split_for(&self, address: u32) -> Option<(u32, &ObjSplit)> {
    self.splits_for_range(..=address)
        .next_back()
        .filter(|(_, split)| split.end == 0 || split.end > address)
}
/// Locate existing splits within the given address range.
///
/// Yields `(start address, split)` pairs in ascending address order.
pub fn splits_for_range<R>(
    &self,
    range: R,
) -> impl DoubleEndedIterator<Item = (u32, &ObjSplit)>
where
    R: RangeBounds<u32>,
{
    self.splits
        .range(range)
        .flat_map(|(&start, splits)| splits.iter().map(move |split| (start, split)))
}
pub fn split_for_unit(
&self,
unit: &str,
section: &ObjSection,
) -> Result<Option<(u32, &ObjSplit)>> {
let mut result = None::<(u32, &ObjSplit)>;
for (addr, split) in self
.splits_for_range(section.address as u32..(section.address + section.size) as u32)
.filter(|(_, split)| split.unit == unit)
{
ensure!(
result.is_none(),
"Multiple splits for unit {} in section {}: {:#010X}, {:#010X}",
unit,
section.name,
result.unwrap().0,
addr
);
result = Some((addr, split));
}
Ok(result)
}
pub fn add_split(&mut self, address: u32, split: ObjSplit) -> Result<()> {
let section = self.section_at(address)?;
let section_start = section.address as u32; let section_start = section.address as u32;
let section_end = (section.address + section.size) as u32; let section_end = (section.address + section.size) as u32;
ensure!( ensure!(
@ -719,7 +161,7 @@ impl ObjInfo {
section_end section_end
); );
if let Some((existing_addr, existing_split)) = self.split_for_unit(&split.unit, section)? { if let Some((existing_addr, existing_split)) = section.splits.for_unit(&split.unit)? {
let new_start = min(existing_addr, address); let new_start = min(existing_addr, address);
let new_end = max(existing_split.end, split.end); let new_end = max(existing_split.end, split.end);
@ -788,7 +230,7 @@ impl ObjInfo {
// Check if new split overlaps any existing splits // Check if new split overlaps any existing splits
let mut to_remove = BTreeSet::new(); let mut to_remove = BTreeSet::new();
let mut to_rename = BTreeSet::new(); let mut to_rename = BTreeSet::new();
for (existing_addr, existing_split) in self.splits_for_range(new_start..new_end) { for (existing_addr, existing_split) in section.splits.for_range(new_start..new_end) {
// TODO the logic in this method should be reworked, this is a hack // TODO the logic in this method should be reworked, this is a hack
if split.autogenerated && !existing_split.autogenerated { if split.autogenerated && !existing_split.autogenerated {
log::debug!( log::debug!(
@ -827,15 +269,15 @@ impl ObjInfo {
// Remove overlapping splits // Remove overlapping splits
for addr in to_remove { for addr in to_remove {
self.splits.remove(&addr); section.splits.remove(addr);
} }
// Rename any units that were overwritten // Rename any units that were overwritten
// TODO this should also merge with existing splits // TODO this should also merge with existing splits
for unit in to_rename { for unit in to_rename {
for (existing_addr, existing) in self for (existing_addr, existing) in self
.splits .sections
.iter_mut() .iter_mut()
.flat_map(|(addr, v)| v.iter_mut().map(move |u| (addr, u))) .flat_map(|(_, section)| section.splits.iter_mut())
.filter(|(_, split)| split.unit == unit) .filter(|(_, split)| split.unit == unit)
{ {
log::debug!( log::debug!(
@ -848,7 +290,7 @@ impl ObjInfo {
existing.unit = split.unit.clone(); existing.unit = split.unit.clone();
} }
} }
self.add_split(new_start, ObjSplit { self.add_split(section_index, new_start, ObjSplit {
unit: split.unit, unit: split.unit,
end: new_end, end: new_end,
align: new_align, align: new_align,
@ -859,72 +301,14 @@ impl ObjInfo {
} }
log::debug!("Adding split @ {} {:#010X}: {:?}", section.name, address, split); log::debug!("Adding split @ {} {:#010X}: {:?}", section.name, address, split);
self.splits.entry(address).or_default().push(split); section.splits.push(address, split);
Ok(()) Ok(())
} }
pub fn is_unit_autogenerated(&self, unit: &str) -> bool { pub fn is_unit_autogenerated(&self, unit: &str) -> bool {
self.splits_for_range(..) self.sections
.filter(|(_, split)| split.unit == unit) .all_splits()
.all(|(_, split)| split.autogenerated) .filter(|(_, _, _, split)| split.unit == unit)
.all(|(_, _, _, split)| split.autogenerated)
} }
} }
impl ObjSection {
    /// Indexes this section's relocations by address.
    ///
    /// Each key is a relocation address (truncated to `u32`); each value is the
    /// position of that relocation inside `self.relocations`.
    ///
    /// # Errors
    /// Fails when two relocations share the same address.
    pub fn build_relocation_map(&self) -> Result<BTreeMap<u32, usize>> {
        let mut by_address = BTreeMap::new();
        for (position, reloc) in self.relocations.iter().enumerate() {
            let address = reloc.address as u32;
            if let btree_map::Entry::Vacant(slot) = by_address.entry(address) {
                slot.insert(position);
            } else {
                bail!("Duplicate relocation @ {address:#010X}");
            }
        }
        Ok(by_address)
    }

    /// Same as [`Self::build_relocation_map`], but the map owns a clone of each
    /// relocation instead of an index into `self.relocations`.
    ///
    /// # Errors
    /// Fails when two relocations share the same address.
    pub fn build_relocation_map_cloned(&self) -> Result<BTreeMap<u32, ObjReloc>> {
        let mut by_address = BTreeMap::new();
        for reloc in &self.relocations {
            let address = reloc.address as u32;
            if let btree_map::Entry::Vacant(slot) = by_address.entry(address) {
                slot.insert(reloc.clone());
            } else {
                bail!("Duplicate relocation @ {address:#010X}");
            }
        }
        Ok(by_address)
    }

    /// Whether `addr` lies inside the half-open span `address..address + size`.
    #[inline]
    pub fn contains(&self, addr: u32) -> bool {
        let section_end = self.address + self.size;
        let addr = addr as u64;
        self.address <= addr && addr < section_end
    }

    /// Whether `range` starts at or after the section start and ends at or before
    /// the section end.
    #[inline]
    pub fn contains_range(&self, range: Range<u32>) -> bool {
        let Range { start, end } = range;
        self.address <= start as u64 && end as u64 <= self.address + self.size
    }

    /// Gives the section a new name, re-deriving its kind from that name and
    /// marking the section as known.
    ///
    /// # Errors
    /// Fails (leaving the section untouched) when the name has no known kind.
    pub fn rename(&mut self, name: String) -> Result<()> {
        let kind = section_kind_for_section(&name)?;
        self.kind = kind;
        self.name = name;
        self.section_known = true;
        Ok(())
    }
}
/// Maps a well-known section name to the kind of content it holds.
///
/// # Errors
/// Fails with `Unknown section <name>` for any name that is not listed here.
pub fn section_kind_for_section(section_name: &str) -> Result<ObjSectionKind> {
    let kind = match section_name {
        ".init" | ".text" | ".dbgtext" | ".vmtext" => ObjSectionKind::Code,
        ".data" | ".sdata" => ObjSectionKind::Data,
        ".ctors" | ".dtors" | ".rodata" | ".sdata2" | "extab" | "extabindex" => {
            ObjSectionKind::ReadOnlyData
        }
        ".bss" | ".sbss" | ".sbss2" => ObjSectionKind::Bss,
        name => bail!("Unknown section {name}"),
    };
    Ok(kind)
}

247
src/obj/sections.rs Normal file
View File

@ -0,0 +1,247 @@
use std::{
cmp::min,
collections::{btree_map, BTreeMap, Bound},
ops::{Index, IndexMut, Range, RangeBounds},
};
use anyhow::{anyhow, bail, ensure, Result};
use itertools::Itertools;
use crate::obj::{ObjKind, ObjReloc, ObjSplit, ObjSplits, ObjSymbol};
/// Broad classification of a section's contents.
///
/// `section_kind_for_section` derives this from well-known section names.
#[derive(Debug, Copy, Clone, Eq, PartialEq, Hash)]
pub enum ObjSectionKind {
/// Executable code (e.g. `.init`, `.text`).
Code,
/// Initialized, writable data (e.g. `.data`, `.sdata`).
Data,
/// Initialized, read-only data (e.g. `.rodata`, `.ctors`, `extab`).
ReadOnlyData,
/// Uninitialized data (e.g. `.bss`, `.sbss`); `ObjSection::data_range` returns no bytes for it.
Bss,
}
/// A single section of an object, together with its relocations and splits.
#[derive(Debug, Clone)]
pub struct ObjSection {
/// Section name; `section_kind_for_section` derives `kind` from it on `rename`.
pub name: String,
/// Classification of the section's contents.
pub kind: ObjSectionKind,
/// Start address of the section; `contains` treats `address..address + size` as its span.
pub address: u64,
/// Size of the section in bytes.
pub size: u64,
/// Raw section bytes, indexed by `data_range` relative to `address`.
pub data: Vec<u8>,
/// Section alignment. NOTE(review): presumably in bytes; confirm against the loaders.
pub align: u64,
/// REL files reference the original ELF section indices
pub elf_index: usize,
/// Relocations that apply to this section.
pub relocations: Vec<ObjReloc>,
/// NOTE(review): presumably the address before any rebasing; confirm against the loaders.
pub original_address: u64,
/// NOTE(review): presumably the offset of the section in the source file; confirm.
pub file_offset: u64,
/// Set to `true` by `rename` once the section name has been established.
pub section_known: bool,
/// Splits located inside this section.
pub splits: ObjSplits,
}
/// Ordered collection of an object's sections, addressed by section index.
#[derive(Debug, Clone)]
pub struct ObjSections {
// Kind of the owning object; address-based lookups are only allowed for `ObjKind::Executable`.
obj_kind: ObjKind,
// Sections in index order; a section's index is its position in this vector.
sections: Vec<ObjSection>,
}
impl ObjSections {
    /// Wraps `sections`; each section's index is its position in the vector.
    pub fn new(obj_kind: ObjKind, sections: Vec<ObjSection>) -> Self {
        Self { obj_kind, sections }
    }

    /// Walks every section paired with its index.
    pub fn iter(&self) -> impl DoubleEndedIterator<Item = (usize, &ObjSection)> {
        self.sections.iter().enumerate()
    }

    /// Mutable counterpart of [`Self::iter`].
    pub fn iter_mut(&mut self) -> impl DoubleEndedIterator<Item = (usize, &mut ObjSection)> {
        self.sections.iter_mut().enumerate()
    }

    /// Number of sections.
    pub fn count(&self) -> usize {
        self.sections.len()
    }

    /// Index that the next pushed section will receive.
    pub fn next_section_index(&self) -> usize {
        self.sections.len()
    }

    /// Section at `index`, if there is one.
    pub fn get(&self, index: usize) -> Option<&ObjSection> {
        self.sections.get(index)
    }

    /// Mutable section at `index`, if there is one.
    pub fn get_mut(&mut self, index: usize) -> Option<&mut ObjSection> {
        self.sections.get_mut(index)
    }

    /// First section whose `elf_index` equals `elf_index`, with its index.
    pub fn get_elf_index(&self, elf_index: usize) -> Option<(usize, &ObjSection)> {
        let index = self.sections.iter().position(|section| section.elf_index == elf_index)?;
        Some((index, &self.sections[index]))
    }

    /// Mutable counterpart of [`Self::get_elf_index`].
    pub fn get_elf_index_mut(&mut self, elf_index: usize) -> Option<(usize, &mut ObjSection)> {
        let index = self.sections.iter().position(|section| section.elf_index == elf_index)?;
        Some((index, &mut self.sections[index]))
    }

    /// First section containing `addr`.
    ///
    /// # Errors
    /// Fails for non-executable objects, or when no section contains `addr`.
    pub fn at_address(&self, addr: u32) -> Result<(usize, &ObjSection)> {
        ensure!(
            self.obj_kind == ObjKind::Executable,
            "Use of ObjSections::at_address in relocatable object"
        );
        match self.sections.iter().position(|section| section.contains(addr)) {
            Some(index) => Ok((index, &self.sections[index])),
            None => Err(anyhow!("Failed to locate section @ {:#010X}", addr)),
        }
    }

    /// Mutable counterpart of [`Self::at_address`].
    ///
    /// # Errors
    /// Fails for non-executable objects, or when no section contains `addr`.
    pub fn at_address_mut(&mut self, addr: u32) -> Result<(usize, &mut ObjSection)> {
        ensure!(
            self.obj_kind == ObjKind::Executable,
            "Use of ObjSections::at_address_mut in relocatable object"
        );
        match self.sections.iter().position(|section| section.contains(addr)) {
            Some(index) => Ok((index, &mut self.sections[index])),
            None => Err(anyhow!("Failed to locate section @ {:#010X}", addr)),
        }
    }

    /// First section that fully contains `range`.
    ///
    /// # Errors
    /// Fails for non-executable objects, or when no section contains the range.
    pub fn with_range(&self, range: Range<u32>) -> Result<(usize, &ObjSection)> {
        ensure!(
            self.obj_kind == ObjKind::Executable,
            "Use of ObjSections::with_range in relocatable object"
        );
        for (index, section) in self.iter() {
            if section.contains_range(range.clone()) {
                return Ok((index, section));
            }
        }
        Err(anyhow!("Failed to locate section @ {:#010X}-{:#010X}", range.start, range.end))
    }

    /// Walks the sections of the given kind, paired with their indices.
    pub fn by_kind(
        &self,
        kind: ObjSectionKind,
    ) -> impl DoubleEndedIterator<Item = (usize, &ObjSection)> {
        self.sections.iter().enumerate().filter(move |&(_, section)| section.kind == kind)
    }

    /// The section named `name`, or `None` when no section has that name.
    ///
    /// # Errors
    /// Fails when more than one section carries the name.
    pub fn by_name(&self, name: &str) -> Result<Option<(usize, &ObjSection)>> {
        let candidates = self.iter().filter(|(_, section)| section.name == name);
        candidates.at_most_one().map_err(|_| anyhow!("Multiple sections with name {}", name))
    }

    /// Appends `section` and returns the index it was stored at.
    pub fn push(&mut self, section: ObjSection) -> usize {
        self.sections.push(section);
        self.sections.len() - 1
    }

    /// Walks every split of every section as
    /// `(section index, section, split address, split)`.
    pub fn all_splits(
        &self,
    ) -> impl DoubleEndedIterator<Item = (usize, &ObjSection, u32, &ObjSplit)> {
        self.iter().flat_map(|(section_index, section)| {
            section.splits.iter().map(move |(addr, split)| (section_index, section, addr, split))
        })
    }
}
/// Direct access to a section by index; panics when `index` is out of bounds
/// (use `ObjSections::get` for a checked lookup).
impl Index<usize> for ObjSections {
type Output = ObjSection;
fn index(&self, index: usize) -> &Self::Output { &self.sections[index] }
}
/// Direct mutable access to a section by index; panics when `index` is out of
/// bounds (use `ObjSections::get_mut` for a checked lookup).
impl IndexMut<usize> for ObjSections {
fn index_mut(&mut self, index: usize) -> &mut Self::Output { &mut self.sections[index] }
}
impl ObjSection {
    /// Returns the section bytes for the address span `start..end`.
    ///
    /// An `end` of `0` means "from `start` to the end of the stored data".
    /// BSS sections always yield an empty slice. The end of the slice is
    /// clamped to the length of `self.data`.
    ///
    /// # Errors
    /// Fails when `start` (for `end == 0`) or `start..end` is not inside the
    /// section.
    ///
    /// # Panics
    /// Slicing panics if the offset of `start` lies beyond `self.data.len()`.
    pub fn data_range(&self, start: u32, end: u32) -> Result<&[u8]> {
        if end == 0 {
            ensure!(
                self.contains(start),
                "Address {:#010X} outside of section {}: {:#010X}-{:#010X}",
                start,
                self.name,
                self.address,
                self.address + self.size
            );
        } else {
            ensure!(
                self.contains_range(start..end),
                "Range {:#010X}-{:#010X} outside of section {}: {:#010X}-{:#010X}",
                start,
                end,
                self.name,
                self.address,
                self.address + self.size
            );
        }
        if self.kind == ObjSectionKind::Bss {
            return Ok(&[]);
        }
        // Translate the absolute address into an offset within `self.data`.
        let start = (start as u64 - self.address) as usize;
        Ok(if end == 0 {
            &self.data[start..]
        } else {
            &self.data[start..min(self.data.len(), (end as u64 - self.address) as usize)]
        })
    }

    /// Returns the bytes covered by `symbol` (`address..address + size`).
    ///
    /// # Errors
    /// Propagates the errors of [`Self::data_range`].
    #[inline]
    pub fn symbol_data(&self, symbol: &ObjSymbol) -> Result<&[u8]> {
        self.data_range(symbol.address as u32, symbol.address as u32 + symbol.size as u32)
    }

    /// Indexes this section's relocations by address; values are positions in
    /// `self.relocations`.
    ///
    /// # Errors
    /// Fails when two relocations share the same address.
    pub fn build_relocation_map(&self) -> Result<BTreeMap<u32, usize>> {
        let mut relocations = BTreeMap::new();
        for (idx, reloc) in self.relocations.iter().enumerate() {
            let address = reloc.address as u32;
            match relocations.entry(address) {
                btree_map::Entry::Vacant(e) => {
                    e.insert(idx);
                }
                btree_map::Entry::Occupied(_) => bail!("Duplicate relocation @ {address:#010X}"),
            }
        }
        Ok(relocations)
    }

    /// Same as [`Self::build_relocation_map`], but the map owns a clone of
    /// each relocation.
    ///
    /// # Errors
    /// Fails when two relocations share the same address.
    pub fn build_relocation_map_cloned(&self) -> Result<BTreeMap<u32, ObjReloc>> {
        let mut relocations = BTreeMap::new();
        for reloc in self.relocations.iter().cloned() {
            let address = reloc.address as u32;
            match relocations.entry(address) {
                btree_map::Entry::Vacant(e) => {
                    e.insert(reloc);
                }
                btree_map::Entry::Occupied(_) => bail!("Duplicate relocation @ {address:#010X}"),
            }
        }
        Ok(relocations)
    }

    /// Whether `addr` lies inside the half-open span `address..address + size`.
    #[inline]
    pub fn contains(&self, addr: u32) -> bool {
        (self.address..self.address + self.size).contains(&(addr as u64))
    }

    /// Whether every address covered by `range` lies inside this section.
    ///
    /// The first and last covered addresses must both fall inside
    /// `address..address + size`:
    ///
    /// * an included start `n` covers `n` first, an excluded start covers
    ///   `n + 1` first;
    /// * an included end `n` covers `n` last, an excluded end covers `n - 1`
    ///   last (so it may equal the section end, but not the section start).
    ///
    /// An unbounded side is not checked. An empty `a..a` range at the section
    /// start is reported as not contained, as before.
    #[inline]
    pub fn contains_range<R>(&self, range: R) -> bool
    where R: RangeBounds<u32> {
        // Work in u64, like `contains`, so `address + size` cannot wrap around u32.
        let bounds = self.address..self.address + self.size;
        let start_in_range = match range.start_bound() {
            Bound::Included(&n) => bounds.contains(&(n as u64)),
            Bound::Excluded(&n) => bounds.contains(&(n as u64 + 1)),
            Bound::Unbounded => true,
        };
        let end_in_range = match range.end_bound() {
            Bound::Included(&n) => bounds.contains(&(n as u64)),
            Bound::Excluded(&n) => (n as u64) > bounds.start && (n as u64) <= bounds.end,
            Bound::Unbounded => true,
        };
        start_in_range && end_in_range
    }

    /// Gives the section a new name, re-deriving its kind from that name and
    /// marking the section as known.
    ///
    /// # Errors
    /// Fails (leaving the section untouched) when the name has no known kind.
    pub fn rename(&mut self, name: String) -> Result<()> {
        self.kind = section_kind_for_section(&name)?;
        self.name = name;
        self.section_known = true;
        Ok(())
    }
}
/// Determines the [`ObjSectionKind`] implied by a well-known section name.
///
/// # Errors
/// Fails with `Unknown section <name>` when the name is not one of the names
/// matched below.
pub fn section_kind_for_section(section_name: &str) -> Result<ObjSectionKind> {
    let kind = match section_name {
        ".init" | ".text" | ".dbgtext" | ".vmtext" => ObjSectionKind::Code,
        ".data" | ".sdata" => ObjSectionKind::Data,
        ".bss" | ".sbss" | ".sbss2" => ObjSectionKind::Bss,
        ".ctors" | ".dtors" | ".rodata" | ".sdata2" | "extab" | "extabindex" => {
            ObjSectionKind::ReadOnlyData
        }
        name => bail!("Unknown section {name}"),
    };
    Ok(kind)
}

76
src/obj/splits.rs Normal file
View File

@ -0,0 +1,76 @@
use std::{collections::BTreeMap, ops::RangeBounds};
use anyhow::{anyhow, Result};
use itertools::Itertools;
use crate::util::nested::NestedVec;
/// Marks a split point within a section.
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct ObjSplit {
/// Name of the unit this split belongs to.
pub unit: String,
/// End address of the split; `0` is treated as "no explicit end" by `ObjSplits::for_address`.
pub end: u32,
/// Optional alignment for the split.
pub align: Option<u32>,
/// Whether this is a part of common BSS.
pub common: bool,
/// Generated, replaceable by user.
pub autogenerated: bool,
}
/// Splits within a section.
#[derive(Debug, Clone, Default)]
pub struct ObjSplits {
// Splits keyed by start address; several splits may share one address.
splits: BTreeMap<u32, Vec<ObjSplit>>,
}
impl ObjSplits {
    /// Walks every split in ascending address order as `(address, split)`.
    pub fn iter(&self) -> impl DoubleEndedIterator<Item = (u32, &ObjSplit)> {
        self.splits.iter().flat_map(|(&address, entries)| {
            entries.iter().map(move |split| (address, split))
        })
    }

    /// Mutable counterpart of [`Self::iter`].
    pub fn iter_mut(&mut self) -> impl DoubleEndedIterator<Item = (u32, &mut ObjSplit)> {
        self.splits.iter_mut().flat_map(|(&address, entries)| {
            entries.iter_mut().map(move |split| (address, split))
        })
    }

    /// Whether at least one split starts exactly at `address`.
    pub fn has_split_at(&self, address: u32) -> bool {
        self.splits.get(&address).is_some()
    }

    /// Locate an existing split for the given address.
    ///
    /// Takes the last split starting at or before `address` and accepts it
    /// when it has no explicit end (`end == 0`) or ends after `address`.
    pub fn for_address(&self, address: u32) -> Option<(u32, &ObjSplit)> {
        let (start, split) = self.for_range(..=address).next_back()?;
        if split.end == 0 || split.end > address {
            Some((start, split))
        } else {
            None
        }
    }

    /// Locate existing splits whose start address lies within the given range.
    pub fn for_range<R>(&self, range: R) -> impl DoubleEndedIterator<Item = (u32, &ObjSplit)>
    where R: RangeBounds<u32> {
        self.splits.range(range).flat_map(|(&address, entries)| {
            entries.iter().map(move |split| (address, split))
        })
    }

    /// Mutable counterpart of [`Self::for_range`].
    pub fn for_range_mut<R>(
        &mut self,
        range: R,
    ) -> impl DoubleEndedIterator<Item = (u32, &mut ObjSplit)>
    where
        R: RangeBounds<u32>,
    {
        self.splits.range_mut(range).flat_map(|(&address, entries)| {
            entries.iter_mut().map(move |split| (address, split))
        })
    }

    /// The split belonging to `unit`, or `None` when the unit has no split here.
    ///
    /// # Errors
    /// Fails when the unit owns more than one split in this section.
    pub fn for_unit(&self, unit: &str) -> Result<Option<(u32, &ObjSplit)>> {
        let owned = self.iter().filter(|&(_, split)| split.unit == unit);
        owned.at_most_one().map_err(|_| anyhow!("Multiple splits for unit {}", unit))
    }

    /// Records `split` as starting at `address`, alongside any existing splits there.
    pub fn push(&mut self, address: u32, split: ObjSplit) {
        self.splits.nested_push(address, split);
    }

    /// Removes and returns all splits starting at `address`.
    pub fn remove(&mut self, address: u32) -> Option<Vec<ObjSplit>> {
        self.splits.remove(&address)
    }
}

536
src/obj/symbols.rs Normal file
View File

@ -0,0 +1,536 @@
use std::{
collections::{BTreeMap, HashMap},
hash::{Hash, Hasher},
ops::{Index, RangeBounds},
};
use anyhow::{anyhow, bail, ensure, Result};
use flagset::{flags, FlagSet};
use itertools::Itertools;
use serde::{Deserialize, Serialize};
use serde_repr::{Deserialize_repr, Serialize_repr};
use crate::{
obj::{ObjKind, ObjRelocKind},
util::{config::is_auto_symbol, nested::NestedVec, split::is_linker_generated_label},
};
/// Linkage scope of a symbol, as reported by `ObjSymbolFlagSet::scope`.
#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize, Default)]
pub enum ObjSymbolScope {
/// None of the local, weak or global flags is set.
#[default]
Unknown,
/// The global flag is set (and neither local nor weak).
Global,
/// The weak flag is set (and not local).
Weak,
/// The local flag is set.
Local,
}
// Individual symbol flag bits, generated by the `flagset` crate and combined in
// `ObjSymbolFlagSet`. `Global`, `Local` and `Weak` encode the symbol scope (see
// `ObjSymbolFlagSet::scope` / `set_scope`); the others are independent markers.
flags! {
#[repr(u8)]
#[derive(Deserialize_repr, Serialize_repr)]
pub enum ObjSymbolFlags: u8 {
Global,
Local,
Weak,
Common,
Hidden,
ForceActive,
}
}
/// Newtype around a set of [`ObjSymbolFlags`] with scope-aware accessors.
#[derive(Debug, Copy, Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
pub struct ObjSymbolFlagSet(pub FlagSet<ObjSymbolFlags>);
impl ObjSymbolFlagSet {
    /// Derives the scope from the flags; local wins over weak, weak over global.
    #[inline]
    pub fn scope(&self) -> ObjSymbolScope {
        let has_global = self.0.contains(ObjSymbolFlags::Global);
        match (self.is_local(), self.is_weak(), has_global) {
            (true, _, _) => ObjSymbolScope::Local,
            (false, true, _) => ObjSymbolScope::Weak,
            (false, false, true) => ObjSymbolScope::Global,
            (false, false, false) => ObjSymbolScope::Unknown,
        }
    }

    /// Whether the local flag is set.
    #[inline]
    pub fn is_local(&self) -> bool {
        self.0.contains(ObjSymbolFlags::Local)
    }

    /// Whether the symbol is not local (the global flag itself is not consulted).
    #[inline]
    pub fn is_global(&self) -> bool {
        !self.is_local()
    }

    /// Whether the common flag is set.
    #[inline]
    pub fn is_common(&self) -> bool {
        self.0.contains(ObjSymbolFlags::Common)
    }

    /// Whether the weak flag is set.
    #[inline]
    pub fn is_weak(&self) -> bool {
        self.0.contains(ObjSymbolFlags::Weak)
    }

    /// Whether the hidden flag is set.
    #[inline]
    pub fn is_hidden(&self) -> bool {
        self.0.contains(ObjSymbolFlags::Hidden)
    }

    /// Whether the force-active flag is set.
    #[inline]
    pub fn is_force_active(&self) -> bool {
        self.0.contains(ObjSymbolFlags::ForceActive)
    }

    /// Replaces the scope flags so that exactly the flag for `scope` is set
    /// (none at all for `Unknown`); non-scope flags are left untouched.
    #[inline]
    pub fn set_scope(&mut self, scope: ObjSymbolScope) {
        // Clear all three scope bits first, then raise the requested one.
        self.0 &= !(ObjSymbolFlags::Local | ObjSymbolFlags::Global | ObjSymbolFlags::Weak);
        let flag = match scope {
            ObjSymbolScope::Unknown => return,
            ObjSymbolScope::Global => ObjSymbolFlags::Global,
            ObjSymbolScope::Weak => ObjSymbolFlags::Weak,
            ObjSymbolScope::Local => ObjSymbolFlags::Local,
        };
        self.0 |= flag;
    }

    /// Sets or clears the force-active flag.
    #[inline]
    pub fn set_force_active(&mut self, value: bool) {
        match value {
            true => self.0 |= ObjSymbolFlags::ForceActive,
            false => self.0 &= !ObjSymbolFlags::ForceActive,
        }
    }
}
// `PartialEq`/`Eq` are derived on the newtype while `Hash` is written by hand;
// hashing the raw flag bits keeps equal flag sets hashing equally.
#[allow(clippy::derived_hash_with_manual_eq)]
impl Hash for ObjSymbolFlagSet {
/// Feeds the raw flag bits into `state`.
fn hash<H: Hasher>(&self, state: &mut H) { self.0.bits().hash(state) }
}
/// What a symbol refers to.
#[derive(Debug, Copy, Clone, Eq, PartialEq, Hash, Default, Serialize, Deserialize)]
pub enum ObjSymbolKind {
/// Kind not known; `ObjSymbols::for_relocation` treats these as labels.
#[default]
Unknown,
/// A function.
Function,
/// A data object.
Object,
/// A section symbol.
Section,
}
/// How the data behind a symbol should be interpreted.
///
/// NOTE(review): the per-variant meanings below are inferred from the variant
/// names only; confirm against the code that consumes this enum.
#[derive(Debug, Copy, Clone, Default, PartialEq, Eq)]
pub enum ObjDataKind {
/// No interpretation known; `ObjSymbols::add` keeps the existing kind when the new one is `Unknown`.
#[default]
Unknown,
// Presumably 1-, 2-, 4- and 8-byte integer units.
Byte,
Byte2,
Byte4,
Byte8,
// Presumably 32-bit and 64-bit floating point values.
Float,
Double,
// Presumably single strings and tables of strings, in 8-bit and 16-bit encodings.
String,
String16,
StringTable,
String16Table,
}
/// A symbol of an object: a named (or anonymous) address, optionally sized.
#[derive(Debug, Clone, Default, Eq, PartialEq)]
pub struct ObjSymbol {
/// Symbol name; empty names are not entered into the by-name index.
pub name: String,
/// Demangled form of `name`, when available.
pub demangled_name: Option<String>,
/// Address of the symbol.
pub address: u64,
/// Index of the containing section, or `None` for section-less (ABS/common) symbols.
pub section: Option<usize>,
/// Size in bytes; see `size_known` for whether it is authoritative.
pub size: u64,
/// Whether `size` is known.
pub size_known: bool,
/// Scope and miscellaneous flags.
pub flags: ObjSymbolFlagSet,
/// What the symbol refers to.
pub kind: ObjSymbolKind,
/// Optional alignment.
pub align: Option<u32>,
/// How the symbol's data should be interpreted.
pub data_kind: ObjDataKind,
}
/// Position of a symbol inside `ObjSymbols`.
pub type SymbolIndex = usize;
/// All symbols of an object plus lookup indexes by address, name and section.
#[derive(Debug, Clone)]
pub struct ObjSymbols {
// Kind of the owning object; the global address index is only filled for executables.
obj_kind: ObjKind,
// Symbols in insertion order; a `SymbolIndex` is a position in this vector.
symbols: Vec<ObjSymbol>,
// Address -> symbol indexes; only populated when `obj_kind` is `ObjKind::Executable`.
symbols_by_address: BTreeMap<u32, Vec<SymbolIndex>>,
// Name -> symbol indexes; symbols with an empty name are not listed.
symbols_by_name: HashMap<String, Vec<SymbolIndex>>,
// Per section index: address -> symbol indexes; grown on demand.
symbols_by_section: Vec<BTreeMap<u32, Vec<SymbolIndex>>>,
}
impl ObjSymbols {
/// Builds the symbol table and all lookup indexes from `symbols`.
///
/// The global address index is only filled for executables; the per-section
/// index is filled for symbols that have a section; the name index skips
/// empty names. In debug builds, a section-less symbol in a non-executable
/// object must have address 0 or be common.
pub fn new(obj_kind: ObjKind, symbols: Vec<ObjSymbol>) -> Self {
let mut symbols_by_address = BTreeMap::<u32, Vec<SymbolIndex>>::new();
let mut symbols_by_section: Vec<BTreeMap<u32, Vec<SymbolIndex>>> = vec![];
let mut symbols_by_name = HashMap::<String, Vec<SymbolIndex>>::new();
for (idx, symbol) in symbols.iter().enumerate() {
if obj_kind == ObjKind::Executable {
symbols_by_address.nested_push(symbol.address as u32, idx);
}
if let Some(section_idx) = symbol.section {
// Grow the per-section index so `section_idx` is addressable.
if section_idx >= symbols_by_section.len() {
symbols_by_section.resize_with(section_idx + 1, BTreeMap::new);
}
symbols_by_section[section_idx].nested_push(symbol.address as u32, idx);
} else {
debug_assert!(
symbol.address == 0
|| symbol.flags.is_common()
|| obj_kind == ObjKind::Executable,
"ABS symbol in relocatable object"
);
}
if !symbol.name.is_empty() {
symbols_by_name.nested_push(symbol.name.clone(), idx);
}
}
Self { obj_kind, symbols, symbols_by_address, symbols_by_name, symbols_by_section }
}
/// Adds `in_symbol`, merging it with a matching existing symbol if there is one.
///
/// A match is, for symbols with a section, a symbol at the same section
/// address that has the same kind or is an auto-named symbol of unknown
/// kind; for section-less symbols, an ABS symbol with the same name.
///
/// * No match: the symbol is appended (its `size_known` is derived from
///   `size != 0`).
/// * Match and `replace == false`: the existing symbol is kept; only a
///   missing size is filled in from `in_symbol`.
/// * Match and `replace == true`: the existing symbol is overwritten with
///   the merged data (alignment and data kind fall back to the existing
///   values when `in_symbol` has none).
///
/// Returns the index of the symbol that now represents `in_symbol`.
///
/// # Errors
/// Propagates errors from `replace` and `add_direct`.
pub fn add(&mut self, in_symbol: ObjSymbol, replace: bool) -> Result<SymbolIndex> {
let opt = if let Some(section_index) = in_symbol.section {
self.at_section_address(section_index, in_symbol.address as u32).find(|(_, symbol)| {
symbol.kind == in_symbol.kind ||
// Replace auto symbols with real symbols
(symbol.kind == ObjSymbolKind::Unknown && is_auto_symbol(&symbol.name))
})
} else {
// TODO hmmm
// NOTE(review): `iter_abs` reads the address index, which is only filled for
// executables, and debug-asserts on that; confirm the relocatable-object case.
self.iter_abs().find(|(_, symbol)| symbol.name == in_symbol.name)
};
let target_symbol_idx = if let Some((symbol_idx, existing)) = opt {
// Pick the size to keep; a conflict between two known sizes is logged and
// resolved in favor of the incoming symbol only when replacing.
let size =
if existing.size_known && in_symbol.size_known && existing.size != in_symbol.size {
log::warn!(
"Conflicting size for {}: was {:#X}, now {:#X}",
existing.name,
existing.size,
in_symbol.size
);
if replace {
in_symbol.size
} else {
existing.size
}
} else if in_symbol.size_known {
in_symbol.size
} else {
existing.size
};
if !replace {
// Not replacing existing symbol, but update size
if in_symbol.size_known && !existing.size_known {
self.replace(symbol_idx, ObjSymbol {
size: in_symbol.size,
size_known: true,
..existing.clone()
})?;
}
return Ok(symbol_idx);
}
let new_symbol = ObjSymbol {
name: in_symbol.name,
demangled_name: in_symbol.demangled_name,
address: in_symbol.address,
section: in_symbol.section,
size,
size_known: existing.size_known || in_symbol.size != 0,
flags: in_symbol.flags,
kind: in_symbol.kind,
align: in_symbol.align.or(existing.align),
data_kind: match in_symbol.data_kind {
ObjDataKind::Unknown => existing.data_kind,
kind => kind,
},
};
// Skip the index update (and the log line) when nothing would change.
if existing != &new_symbol {
log::debug!("Replacing {:?} with {:?}", existing, new_symbol);
self.replace(symbol_idx, new_symbol)?;
}
symbol_idx
} else {
let target_symbol_idx = self.symbols.len();
self.add_direct(ObjSymbol {
name: in_symbol.name,
demangled_name: in_symbol.demangled_name,
address: in_symbol.address,
section: in_symbol.section,
size: in_symbol.size,
size_known: in_symbol.size != 0,
flags: in_symbol.flags,
kind: in_symbol.kind,
align: in_symbol.align,
data_kind: in_symbol.data_kind,
})?;
target_symbol_idx
};
Ok(target_symbol_idx)
}
/// Appends `in_symbol` without looking for an existing match and registers
/// it in the lookup indexes. Returns the new symbol's index.
///
/// # Errors
/// Fails for a section-less symbol in a non-executable object unless its
/// address is 0 or it is common. Note the address and section indexes may
/// already have been updated when the error is returned.
pub fn add_direct(&mut self, in_symbol: ObjSymbol) -> Result<SymbolIndex> {
let symbol_idx = self.symbols.len();
if self.obj_kind == ObjKind::Executable {
self.symbols_by_address.nested_push(in_symbol.address as u32, symbol_idx);
}
if let Some(section_idx) = in_symbol.section {
if section_idx >= self.symbols_by_section.len() {
self.symbols_by_section.resize_with(section_idx + 1, BTreeMap::new);
}
self.symbols_by_section[section_idx].nested_push(in_symbol.address as u32, symbol_idx);
} else {
ensure!(
in_symbol.address == 0
|| in_symbol.flags.is_common()
|| self.obj_kind == ObjKind::Executable,
"ABS symbol in relocatable object"
);
}
if !in_symbol.name.is_empty() {
self.symbols_by_name.nested_push(in_symbol.name.clone(), symbol_idx);
}
self.symbols.push(in_symbol);
Ok(symbol_idx)
}
/// Iterates over all symbols in insertion (index) order.
pub fn iter(&self) -> impl DoubleEndedIterator<Item = &ObjSymbol> { self.symbols.iter() }
/// Number of symbols.
pub fn count(&self) -> usize { self.symbols.len() }
/// Iterates over the symbols located exactly at `addr` within section
/// `section_idx`; empty when the section or address has no entry.
pub fn at_section_address(
&self,
section_idx: usize,
addr: u32,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
self.symbols_by_section
.get(section_idx)
.and_then(|v| v.get(&addr))
.into_iter()
.flatten()
.map(move |&idx| (idx, &self.symbols[idx]))
}
/// Returns the symbol of the given `kind` at `addr` within section
/// `section_idx`, or `None` when there is none.
///
/// # Errors
/// Fails when more than one symbol of that kind sits at the address.
pub fn kind_at_section_address(
&self,
section_idx: usize,
addr: u32,
kind: ObjSymbolKind,
) -> Result<Option<(SymbolIndex, &ObjSymbol)>> {
self.at_section_address(section_idx, addr)
.filter(|(_, sym)| sym.kind == kind)
.at_most_one()
.map_err(|_| anyhow!("Multiple symbols of kind {:?} at address {:#010X}", kind, addr))
}
// Iterate over all in address ascending order, excluding ABS symbols
// (sections are visited in index order; addresses ascend within each section)
pub fn iter_ordered(&self) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
self.symbols_by_section
.iter()
.flat_map(|v| v.iter().map(|(_, v)| v))
.flat_map(move |v| v.iter().map(move |u| (*u, &self.symbols[*u])))
}
// Iterate over all ABS symbols
// (symbols without a section, taken from the global address index)
pub fn iter_abs(&self) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
debug_assert!(self.obj_kind == ObjKind::Executable);
self.symbols_by_address
.iter()
.flat_map(|(_, v)| v.iter().map(|&u| (u, &self.symbols[u])))
.filter(|(_, s)| s.section.is_none())
}
// Iterate over range in address ascending order, excluding ABS symbols
// (restricted to section `section_index`; empty when the section has no entry)
pub fn for_section_range<R>(
&self,
section_index: usize,
range: R,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)>
where
R: RangeBounds<u32> + Clone,
{
self.symbols_by_section
.get(section_index)
.into_iter()
.flat_map(move |v| v.range(range.clone()))
.flat_map(move |(_, v)| v.iter().map(move |u| (*u, &self.symbols[*u])))
}
/// Iterates over `(address, symbol indexes)` entries of the global address
/// index within `range`. Debug-asserts that the object is an executable.
pub fn indexes_for_range<R>(
&self,
range: R,
) -> impl DoubleEndedIterator<Item = (u32, &[SymbolIndex])>
where
R: RangeBounds<u32>,
{
debug_assert!(self.obj_kind == ObjKind::Executable);
self.symbols_by_address.range(range).map(|(k, v)| (*k, v.as_ref()))
}
/// Iterates over all symbols of section `section_idx` in ascending address
/// order; empty when the section has no entry.
pub fn for_section(
&self,
section_idx: usize,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
self.symbols_by_section
.get(section_idx)
.into_iter()
.flat_map(|v| v.iter().map(|(_, v)| v))
.flat_map(move |v| v.iter().map(move |u| (*u, &self.symbols[*u])))
}
/// Iterates over all symbols registered under `name`.
pub fn for_name(
&self,
name: &str,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
self.symbols_by_name
.get(name)
.into_iter()
.flat_map(move |v| v.iter().map(move |u| (*u, &self.symbols[*u])))
}
/// Returns the single symbol named `name`, or `None` when there is none.
///
/// # Errors
/// Fails when more than one symbol has that name; the message names the
/// first two candidates.
pub fn by_name(&self, name: &str) -> Result<Option<(SymbolIndex, &ObjSymbol)>> {
let mut iter = self.for_name(name);
let result = iter.next();
if let Some((index, symbol)) = result {
if let Some((other_index, other_symbol)) = iter.next() {
bail!(
"Multiple symbols with name {}: {} {:?} {:#010X} and {} {:?} {:#010X}",
name,
index,
symbol.kind,
symbol.address,
other_index,
other_symbol.kind,
other_symbol.address
);
}
}
Ok(result)
}
/// Iterates over all symbols of the given kind, in index order.
pub fn by_kind(
&self,
kind: ObjSymbolKind,
) -> impl DoubleEndedIterator<Item = (SymbolIndex, &ObjSymbol)> {
self.symbols.iter().enumerate().filter(move |(_, sym)| sym.kind == kind)
}
/// Overwrites the symbol at `index` with `symbol`, keeping the name index
/// in sync when the name changes.
///
/// # Errors
/// Fails when `symbol` has a different address or section than the symbol
/// it replaces (the address and section indexes are not updated here).
///
/// # Panics
/// Panics when `index` is out of bounds.
pub fn replace(&mut self, index: SymbolIndex, symbol: ObjSymbol) -> Result<()> {
let symbol_ref = &mut self.symbols[index];
ensure!(symbol_ref.address == symbol.address, "Can't modify address with replace_symbol");
ensure!(symbol_ref.section == symbol.section, "Can't modify section with replace_symbol");
if symbol_ref.name != symbol.name {
if !symbol_ref.name.is_empty() {
self.symbols_by_name.nested_remove(&symbol_ref.name, &index);
}
if !symbol.name.is_empty() {
self.symbols_by_name.nested_push(symbol.name.clone(), index);
}
}
*symbol_ref = symbol;
Ok(())
}
// Try to find a previous sized symbol that encompasses the target
//
// Walks the global address index backwards from `target_addr`. At each address
// the best candidate that may be referenced by `reloc_kind` is chosen (ranked
// by symbol kind, relocation kind and whether it has a size). The search stops
// at the first candidate that sits exactly at the target, or at the first sized
// candidate, which is returned only if it extends past the target.
// Fails when the object is not an executable.
pub fn for_relocation(
&self,
target_addr: u32,
reloc_kind: ObjRelocKind,
) -> Result<Option<(SymbolIndex, &ObjSymbol)>> {
ensure!(self.obj_kind == ObjKind::Executable);
let mut result = None;
for (_addr, symbol_idxs) in self.indexes_for_range(..=target_addr).rev() {
let mut symbols = symbol_idxs
.iter()
.map(|&idx| (idx, &self.symbols[idx]))
.filter(|(_, sym)| sym.referenced_by(reloc_kind))
.collect_vec();
let (symbol_idx, symbol) = if symbols.len() == 1 {
symbols.pop().unwrap()
} else {
// Sort by descending rank (the key is negated) so the best candidate comes first.
symbols.sort_by_key(|&(_, symbol)| {
let mut rank = match symbol.kind {
ObjSymbolKind::Function | ObjSymbolKind::Object => match reloc_kind {
ObjRelocKind::PpcAddr16Hi
| ObjRelocKind::PpcAddr16Ha
| ObjRelocKind::PpcAddr16Lo => 1,
ObjRelocKind::Absolute
| ObjRelocKind::PpcRel24
| ObjRelocKind::PpcRel14
| ObjRelocKind::PpcEmbSda21 => 2,
},
// Label
ObjSymbolKind::Unknown => match reloc_kind {
ObjRelocKind::PpcAddr16Hi
| ObjRelocKind::PpcAddr16Ha
| ObjRelocKind::PpcAddr16Lo
if !symbol.name.starts_with("..") =>
{
3
}
_ => 1,
},
ObjSymbolKind::Section => -1,
};
if symbol.size > 0 {
rank += 1;
}
-rank
});
match symbols.first() {
Some(&v) => v,
// No referenceable symbol at this address; keep looking further back.
None => continue,
}
};
if symbol.address == target_addr as u64 {
result = Some((symbol_idx, symbol));
break;
}
if symbol.size > 0 {
if symbol.address + symbol.size > target_addr as u64 {
result = Some((symbol_idx, symbol));
}
break;
}
}
Ok(result)
}
/// Mutable access to the flags of the symbol at `idx`; panics when `idx`
/// is out of bounds.
#[inline]
pub fn flags(&mut self, idx: SymbolIndex) -> &mut ObjSymbolFlagSet {
&mut self.symbols[idx].flags
}
}
/// Direct access to a symbol by index; panics when `index` is out of bounds.
impl Index<SymbolIndex> for ObjSymbols {
type Output = ObjSymbol;
fn index(&self, index: usize) -> &Self::Output { &self.symbols[index] }
}
impl ObjSymbol {
    /// Whether this symbol can be referenced by the given relocation kind.
    ///
    /// * Linker generated labels and section symbols: only by @ha/@h/@l
    ///   relocations.
    /// * Symbols of unknown kind: by any relocation.
    /// * Functions: by anything except `PpcEmbSda21`.
    /// * Objects: by anything except the relative branch relocations
    ///   (`PpcRel14`, `PpcRel24`).
    pub fn referenced_by(&self, reloc_kind: ObjRelocKind) -> bool {
        let is_addr16 = matches!(
            reloc_kind,
            ObjRelocKind::PpcAddr16Ha | ObjRelocKind::PpcAddr16Hi | ObjRelocKind::PpcAddr16Lo
        );
        // Linker generated labels will only be referenced by @ha/@h/@l relocations
        if is_linker_generated_label(&self.name) {
            return is_addr16;
        }
        match self.kind {
            ObjSymbolKind::Section => is_addr16,
            ObjSymbolKind::Object => {
                !matches!(reloc_kind, ObjRelocKind::PpcRel14 | ObjRelocKind::PpcRel24)
            }
            ObjSymbolKind::Function => !matches!(reloc_kind, ObjRelocKind::PpcEmbSda21),
            ObjSymbolKind::Unknown => true,
        }
    }
}

View File

@ -46,10 +46,10 @@ pub fn write_asm<W: Write>(w: &mut W, obj: &ObjInfo) -> Result<()> {
let mut symbols: Vec<ObjSymbol> = obj.symbols.iter().cloned().collect(); let mut symbols: Vec<ObjSymbol> = obj.symbols.iter().cloned().collect();
let mut section_entries: Vec<BTreeMap<u32, Vec<SymbolEntry>>> = vec![]; let mut section_entries: Vec<BTreeMap<u32, Vec<SymbolEntry>>> = vec![];
let mut section_relocations: Vec<BTreeMap<u32, ObjReloc>> = vec![]; let mut section_relocations: Vec<BTreeMap<u32, ObjReloc>> = vec![];
for (section_idx, section) in obj.sections.iter().enumerate() { for (section_idx, section) in obj.sections.iter() {
// Build symbol start/end entries // Build symbol start/end entries
let mut entries = BTreeMap::<u32, Vec<SymbolEntry>>::new(); let mut entries = BTreeMap::<u32, Vec<SymbolEntry>>::new();
for (symbol_index, symbol) in obj.symbols.for_section(section) { for (symbol_index, symbol) in obj.symbols.for_section(section_idx) {
entries.nested_push(symbol.address as u32, SymbolEntry { entries.nested_push(symbol.address as u32, SymbolEntry {
index: symbol_index, index: symbol_index,
kind: SymbolEntryKind::Start, kind: SymbolEntryKind::Start,
@ -110,6 +110,7 @@ pub fn write_asm<W: Write>(w: &mut W, obj: &ObjInfo) -> Result<()> {
address: ins.addr as u64, address: ins.addr as u64,
target_symbol: symbol_idx, target_symbol: symbol_idx,
addend: 0, addend: 0,
module: None,
}); });
} }
} }
@ -121,11 +122,11 @@ pub fn write_asm<W: Write>(w: &mut W, obj: &ObjInfo) -> Result<()> {
} }
// Generate labels for jump tables & relative data relocations // Generate labels for jump tables & relative data relocations
for section in &obj.sections { for (_section_index, section) in obj
if !matches!(section.kind, ObjSectionKind::Data | ObjSectionKind::ReadOnlyData) { .sections
continue; .iter()
} .filter(|(_, s)| matches!(s.kind, ObjSectionKind::Data | ObjSectionKind::ReadOnlyData))
{
for reloc in &section.relocations { for reloc in &section.relocations {
if reloc.addend == 0 { if reloc.addend == 0 {
continue; continue;
@ -135,7 +136,9 @@ pub fn write_asm<W: Write>(w: &mut W, obj: &ObjInfo) -> Result<()> {
Some(v) => v, Some(v) => v,
None => continue, None => continue,
}; };
let target_section = &obj.sections[target_section_idx]; let target_section = obj.sections.get(target_section_idx).ok_or_else(|| {
anyhow!("Invalid relocation target section: {:#010X} {:?}", reloc.address, target)
})?;
let address = (target.address as i64 + reloc.addend) as u64; let address = (target.address as i64 + reloc.addend) as u64;
let vec = match section_entries[target_section_idx].entry(address as u32) { let vec = match section_entries[target_section_idx].entry(address as u32) {
btree_map::Entry::Occupied(e) => e.into_mut(), btree_map::Entry::Occupied(e) => e.into_mut(),
@ -177,14 +180,14 @@ pub fn write_asm<W: Write>(w: &mut W, obj: &ObjInfo) -> Result<()> {
} }
} }
for section in &obj.sections { for (section_index, section) in obj.sections.iter() {
let entries = &section_entries[section.index]; let entries = &section_entries[section_index];
let relocations = &section_relocations[section.index]; let relocations = &section_relocations[section_index];
let mut current_address = section.address as u32; let mut current_address = section.address as u32;
let section_end = (section.address + section.size) as u32; let section_end = (section.address + section.size) as u32;
let subsection = let subsection =
obj.sections.iter().take(section.index).filter(|s| s.name == section.name).count(); obj.sections.iter().take(section_index).filter(|(_, s)| s.name == section.name).count();
loop { loop {
if current_address >= section_end { if current_address >= section_end {

View File

@ -12,13 +12,10 @@ use regex::{Captures, Regex};
use crate::{ use crate::{
obj::{ obj::{
ObjDataKind, ObjInfo, ObjSplit, ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags, ObjSymbolKind, ObjDataKind, ObjInfo, ObjKind, ObjSplit, ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags,
ObjUnit, ObjSymbolKind, ObjUnit,
},
util::{
file::{buf_writer, map_file, map_reader},
nested::NestedVec,
}, },
util::file::{buf_writer, map_file, map_reader},
}; };
fn parse_hex(s: &str) -> Result<u32, ParseIntError> { fn parse_hex(s: &str) -> Result<u32, ParseIntError> {
@ -56,15 +53,18 @@ pub fn parse_symbol_line(line: &str, obj: &mut ObjInfo) -> Result<Option<ObjSymb
let name = captures["name"].to_string(); let name = captures["name"].to_string();
let addr = parse_hex(&captures["addr"])?; let addr = parse_hex(&captures["addr"])?;
let section_name = captures["section"].to_string(); let section_name = captures["section"].to_string();
let section = if let Some(section) = obj.sections.iter().find(|s| s.name == section_name) { let section = if section_name == "ABS" {
Some(section.index) None
} else if let Some(section) = obj.sections.iter_mut().find(|s| s.contains(addr)) { } else if let Some((section_index, _)) = obj.sections.by_name(&section_name)? {
Some(section_index)
} else if obj.kind == ObjKind::Executable {
let (section_index, section) = obj.sections.at_address_mut(addr)?;
if !section.section_known { if !section.section_known {
section.rename(section_name)?; section.rename(section_name)?;
} }
Some(section.index) Some(section_index)
} else { } else {
None bail!("Section {} not found", section_name)
}; };
let demangled_name = demangle(&name, &DemangleOptions::default()); let demangled_name = demangle(&name, &DemangleOptions::default());
let mut symbol = ObjSymbol { let mut symbol = ObjSymbol {
@ -132,7 +132,7 @@ pub fn parse_symbol_line(line: &str, obj: &mut ObjInfo) -> Result<Option<ObjSymb
} }
} }
fn is_skip_symbol(symbol: &ObjSymbol) -> bool { pub fn is_skip_symbol(symbol: &ObjSymbol) -> bool {
let _ = symbol; let _ = symbol;
// symbol.name.starts_with("lbl_") // symbol.name.starts_with("lbl_")
// || symbol.name.starts_with("func_") // || symbol.name.starts_with("func_")
@ -142,6 +142,8 @@ fn is_skip_symbol(symbol: &ObjSymbol) -> bool {
false false
} }
/// Whether `name` carries one of the prefixes used for automatically
/// generated symbol names (`lbl_` or `fn_`).
pub fn is_auto_symbol(name: &str) -> bool {
    const AUTO_PREFIXES: [&str; 2] = ["lbl_", "fn_"];
    AUTO_PREFIXES.iter().any(|&prefix| name.starts_with(prefix))
}
#[inline] #[inline]
pub fn write_symbols_file<P: AsRef<Path>>(path: P, obj: &ObjInfo) -> Result<()> { pub fn write_symbols_file<P: AsRef<Path>>(path: P, obj: &ObjInfo) -> Result<()> {
let mut w = buf_writer(path)?; let mut w = buf_writer(path)?;
@ -152,11 +154,7 @@ pub fn write_symbols_file<P: AsRef<Path>>(path: P, obj: &ObjInfo) -> Result<()>
pub fn write_symbols<W: Write>(w: &mut W, obj: &ObjInfo) -> Result<()> { pub fn write_symbols<W: Write>(w: &mut W, obj: &ObjInfo) -> Result<()> {
for (_, symbol) in obj.symbols.iter_ordered() { for (_, symbol) in obj.symbols.iter_ordered() {
if symbol.kind == ObjSymbolKind::Section if symbol.kind == ObjSymbolKind::Section || is_skip_symbol(symbol) {
// Ignore absolute symbols for now (usually linker-generated)
|| symbol.section.is_none()
|| is_skip_symbol(symbol)
{
continue; continue;
} }
write_symbol(w, obj, symbol)?; write_symbol(w, obj, symbol)?;
@ -311,17 +309,16 @@ pub fn write_splits<W: Write>(w: &mut W, obj: &ObjInfo) -> Result<()> {
write!(w, " comment:{}", comment_version)?; write!(w, " comment:{}", comment_version)?;
} }
writeln!(w)?; writeln!(w)?;
let mut split_iter = obj.splits_for_range(..).peekable(); let mut split_iter = obj.sections.all_splits().peekable();
while let Some((addr, split)) = split_iter.next() { while let Some((_section_index, section, addr, split)) = split_iter.next() {
if split.unit != unit.name { if split.unit != unit.name {
continue; continue;
} }
let end = if split.end > 0 { let end = if split.end > 0 {
split.end split.end
} else { } else {
split_iter.peek().map(|&(addr, _)| addr).unwrap_or(0) split_iter.peek().map(|&(_, _, addr, _)| addr).unwrap_or(0)
}; };
let section = obj.section_at(addr)?;
write!(w, "\t{:<11} start:{:#010X} end:{:#010X}", section.name, addr, end)?; write!(w, "\t{:<11} start:{:#010X} end:{:#010X}", section.name, addr, end)?;
// if let Some(align) = split.align { // if let Some(align) = split.align {
// write!(w, " align:{}", align)?; // write!(w, " align:{}", align)?;
@ -347,6 +344,7 @@ struct SplitSection {
align: Option<u32>, align: Option<u32>,
/// Whether this is a part of common BSS. /// Whether this is a part of common BSS.
common: bool, common: bool,
rename: Option<String>,
} }
struct SplitUnit { struct SplitUnit {
@ -403,6 +401,7 @@ fn parse_section_line(captures: Captures) -> Result<SplitLine> {
end: 0, end: 0,
align: None, align: None,
common: false, common: false,
rename: None,
}; };
for attr in captures["attrs"].split(' ').filter(|&s| !s.is_empty()) { for attr in captures["attrs"].split(' ').filter(|&s| !s.is_empty()) {
@ -411,7 +410,7 @@ fn parse_section_line(captures: Captures) -> Result<SplitLine> {
"start" => section.start = parse_hex(value)?, "start" => section.start = parse_hex(value)?,
"end" => section.end = parse_hex(value)?, "end" => section.end = parse_hex(value)?,
"align" => section.align = Some(u32::from_str(value)?), "align" => section.align = Some(u32::from_str(value)?),
"rename" => section.name = value.to_string(), "rename" => section.rename = Some(value.to_string()),
_ => bail!("Unknown split attribute '{attr}'"), _ => bail!("Unknown split attribute '{attr}'"),
} }
} else { } else {
@ -462,17 +461,39 @@ pub fn apply_splits<R: BufRead>(r: R, obj: &mut ObjInfo) -> Result<()> {
} }
( (
SplitState::Unit(unit), SplitState::Unit(unit),
SplitLine::Section(SplitSection { name, start, end, align, common }), SplitLine::Section(SplitSection { name, start, end, align, common, rename }),
) => { ) => {
obj.splits.nested_push(start, ObjSplit { let (section_index, _) = match obj.sections.by_name(&name)? {
Some(v) => Ok(v),
None => {
if obj.kind == ObjKind::Executable {
obj.sections.with_range(start..end)
} else {
Err(anyhow!("Section {} not found", name))
}
}
}?;
let section = obj.sections.get_mut(section_index).unwrap();
ensure!(
section.contains_range(start..end),
"Section {} ({:#010X}..{:#010X}) does not contain range {:#010X}..{:#010X}",
name,
section.address,
section.address + section.size,
start,
end
);
section.splits.push(start, ObjSplit {
unit: unit.clone(), unit: unit.clone(),
end, end,
align, align,
common, common,
autogenerated: false, autogenerated: false,
}); });
if let Some(name) = rename {
obj.named_sections.insert(start, name); obj.named_sections.insert(start, name);
} }
}
_ => {} _ => {}
} }
} }

View File

@ -33,8 +33,6 @@ pub fn process_dol<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
let mmap = map_file(path)?; let mmap = map_file(path)?;
Dol::read_from(map_reader(&mmap))? Dol::read_from(map_reader(&mmap))?
}; };
let mut obj = ObjInfo::new(ObjKind::Executable, ObjArchitecture::PowerPc, name, vec![], vec![]);
obj.entry = dol.header.entry_point as u64;
// Locate _rom_copy_info // Locate _rom_copy_info
let first_rom_section = dol let first_rom_section = dol
@ -227,6 +225,7 @@ pub fn process_dol<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
} }
// Add text and data sections // Add text and data sections
let mut sections = vec![];
for dol_section in for dol_section in
dol.header.sections.iter().filter(|section| section.kind != DolSectionType::Bss) dol.header.sections.iter().filter(|section| section.kind != DolSectionType::Bss)
{ {
@ -263,19 +262,19 @@ pub fn process_dol<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
} }
}; };
obj.sections.push(ObjSection { sections.push(ObjSection {
name, name,
kind, kind,
address: dol_section.target as u64, address: dol_section.target as u64,
size: size as u64, size: size as u64,
data: dol.virtual_data_at(dol_section.target, size)?.to_vec(), data: dol.virtual_data_at(dol_section.target, size)?.to_vec(),
align: 0, align: 0,
index: 0,
elf_index: 0, elf_index: 0,
relocations: vec![], relocations: vec![],
original_address: 0, original_address: 0,
file_offset: dol_section.offset as u64, file_offset: dol_section.offset as u64,
section_known: known, section_known: known,
splits: Default::default(),
}); });
} }
@ -292,28 +291,28 @@ pub fn process_dol<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
bss_section.target + bss_section.size bss_section.target + bss_section.size
); );
obj.sections.push(ObjSection { sections.push(ObjSection {
name: format!(".bss{}", idx), name: format!(".bss{}", idx),
kind: ObjSectionKind::Bss, kind: ObjSectionKind::Bss,
address: addr as u64, address: addr as u64,
size: size as u64, size: size as u64,
data: vec![], data: vec![],
align: 0, align: 0,
index: 0,
elf_index: 0, elf_index: 0,
relocations: vec![], relocations: vec![],
original_address: 0, original_address: 0,
file_offset: 0, file_offset: 0,
section_known: false, section_known: false,
splits: Default::default(),
}); });
} }
// Sort sections by address ascending // Sort sections by address ascending
obj.sections.sort_by_key(|s| s.address); sections.sort_by_key(|s| s.address);
// Apply section indices // Apply section indices
let mut init_section_index = None; let mut init_section_index = None;
for (idx, section) in obj.sections.iter_mut().enumerate() { for (idx, section) in sections.iter_mut().enumerate() {
match section.name.as_str() { match section.name.as_str() {
".init" => { ".init" => {
init_section_index = Some(idx); init_section_index = Some(idx);
@ -326,12 +325,16 @@ pub fn process_dol<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
} }
_ => {} _ => {}
} }
section.index = idx;
// Assume the original ELF section index is +1 // Assume the original ELF section index is +1
// ELF files start with a NULL section // ELF files start with a NULL section
section.elf_index = idx + 1; section.elf_index = idx + 1;
} }
// Create object
let mut obj =
ObjInfo::new(ObjKind::Executable, ObjArchitecture::PowerPc, name, vec![], sections);
obj.entry = dol.header.entry_point as u64;
// Generate _rom_copy_info symbol // Generate _rom_copy_info symbol
if let (Some(rom_copy_info_addr), Some(rom_copy_info_end)) = if let (Some(rom_copy_info_addr), Some(rom_copy_info_end)) =
(rom_copy_info_addr, rom_copy_info_end) (rom_copy_info_addr, rom_copy_info_end)
@ -394,13 +397,10 @@ pub fn process_dol<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
} }
// Generate symbols for extab & extabindex entries // Generate symbols for extab & extabindex entries
if let (Some(extabindex_section_idx), Some(extab_section_idx)) = if let (Some(extabindex_section_index), Some(extab_section_index)) =
(extabindex_section, extab_section) (extabindex_section, extab_section)
{ {
let extabindex_section = &obj.sections[extabindex_section_idx]; let extab_section = &obj.sections[extab_section_index];
let extabindex_section_index = extabindex_section.index;
let extab_section = &obj.sections[extab_section_idx];
let extab_section_index = extab_section.index;
let extab_section_address = extab_section.address; let extab_section_address = extab_section.address;
let extab_section_size = extab_section.size; let extab_section_size = extab_section.size;

View File

@ -1,5 +1,5 @@
use std::{ use std::{
collections::{hash_map, BTreeMap, HashMap}, collections::{hash_map, HashMap},
io::Cursor, io::Cursor,
path::Path, path::Path,
}; };
@ -27,7 +27,6 @@ use crate::{
util::{ util::{
comment::{read_comment_sym, write_comment_sym, CommentSym, MWComment}, comment::{read_comment_sym, write_comment_sym, CommentSym, MWComment},
file::map_file, file::map_file,
nested::NestedVec,
}, },
}; };
@ -90,12 +89,12 @@ pub fn process_elf<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
size: section.size(), size: section.size(),
data: section.uncompressed_data()?.to_vec(), data: section.uncompressed_data()?.to_vec(),
align: section.align(), align: section.align(),
index: sections.len(),
elf_index: section.index().0, elf_index: section.index().0,
relocations: vec![], relocations: vec![],
original_address: 0, // TODO load from abs symbol original_address: 0, // TODO load from abs symbol
file_offset: section.file_range().map(|(v, _)| v).unwrap_or_default(), file_offset: section.file_range().map(|(v, _)| v).unwrap_or_default(),
section_known: true, section_known: true,
splits: Default::default(),
}); });
} }
@ -273,7 +272,6 @@ pub fn process_elf<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
} }
let mut link_order = Vec::<ObjUnit>::new(); let mut link_order = Vec::<ObjUnit>::new();
let mut splits = BTreeMap::<u32, Vec<ObjSplit>>::new();
if kind == ObjKind::Executable { if kind == ObjKind::Executable {
// Link order is trivially deduced // Link order is trivially deduced
for file_name in section_starts.keys() { for file_name in section_starts.keys() {
@ -285,9 +283,17 @@ pub fn process_elf<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
} }
// Create a map of address -> file splits // Create a map of address -> file splits
for (file_name, sections) in section_starts { for (file_name, section_addrs) in section_starts {
for (address, _) in sections { for (address, _) in section_addrs {
splits.nested_push(address as u32, ObjSplit { let section =
sections.iter_mut().find(|s| s.contains(address as u32)).ok_or_else(|| {
anyhow!(
"Failed to find section containing address {:#010X} in file {}",
address,
file_name
)
})?;
section.splits.push(address as u32, ObjSplit {
unit: file_name.clone(), unit: file_name.clone(),
end: 0, // TODO end: 0, // TODO
align: None, align: None,
@ -326,7 +332,6 @@ pub fn process_elf<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
obj.db_stack_addr = db_stack_addr; obj.db_stack_addr = db_stack_addr;
obj.arena_lo = arena_lo; obj.arena_lo = arena_lo;
obj.arena_hi = arena_hi; obj.arena_hi = arena_hi;
obj.splits = splits;
obj.link_order = link_order; obj.link_order = link_order;
Ok(obj) Ok(obj)
} }
@ -350,8 +355,8 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
} }
writer.reserve_null_section_index(); writer.reserve_null_section_index();
let mut out_sections: Vec<OutSection> = Vec::with_capacity(obj.sections.len()); let mut out_sections: Vec<OutSection> = Vec::with_capacity(obj.sections.count());
for section in &obj.sections { for (_, section) in obj.sections.iter() {
let name = writer.add_section_name(section.name.as_bytes()); let name = writer.add_section_name(section.name.as_bytes());
let index = writer.reserve_section_index(); let index = writer.reserve_section_index();
out_sections.push(OutSection { out_sections.push(OutSection {
@ -364,8 +369,8 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
}); });
} }
let mut rela_names: Vec<String> = vec![Default::default(); obj.sections.len()]; let mut rela_names: Vec<String> = vec![Default::default(); obj.sections.count()];
for ((section, out_section), rela_name) in for (((_, section), out_section), rela_name) in
obj.sections.iter().zip(&mut out_sections).zip(&mut rela_names) obj.sections.iter().zip(&mut out_sections).zip(&mut rela_names)
{ {
if section.relocations.is_empty() { if section.relocations.is_empty() {
@ -449,12 +454,12 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
// Add section symbols for relocatable objects // Add section symbols for relocatable objects
if obj.kind == ObjKind::Relocatable { if obj.kind == ObjKind::Relocatable {
for section in &obj.sections { for (section_index, section) in obj.sections.iter() {
let section_index = out_sections.get(section.index).map(|s| s.index); let out_section_index = out_sections.get(section_index).map(|s| s.index);
let index = writer.reserve_symbol_index(section_index); let index = writer.reserve_symbol_index(out_section_index);
let sym = object::write::elf::Sym { let sym = object::write::elf::Sym {
name: None, name: None,
section: section_index, section: out_section_index,
st_info: (elf::STB_LOCAL << 4) + elf::STT_SECTION, st_info: (elf::STB_LOCAL << 4) + elf::STT_SECTION,
st_other: elf::STV_DEFAULT, st_other: elf::STV_DEFAULT,
st_shndx: 0, st_shndx: 0,
@ -535,10 +540,10 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
writer.reserve_file_header(); writer.reserve_file_header();
if obj.kind == ObjKind::Executable { if obj.kind == ObjKind::Executable {
writer.reserve_program_headers(obj.sections.len() as u32); writer.reserve_program_headers(obj.sections.count() as u32);
} }
for (section, out_section) in obj.sections.iter().zip(&mut out_sections) { for ((_, section), out_section) in obj.sections.iter().zip(&mut out_sections) {
if section.kind == ObjSectionKind::Bss { if section.kind == ObjSectionKind::Bss {
continue; continue;
} }
@ -553,7 +558,7 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
} }
} }
for (section, out_section) in obj.sections.iter().zip(&mut out_sections) { for ((_, section), out_section) in obj.sections.iter().zip(&mut out_sections) {
if section.relocations.is_empty() { if section.relocations.is_empty() {
continue; continue;
} }
@ -586,7 +591,7 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
if obj.kind == ObjKind::Executable { if obj.kind == ObjKind::Executable {
writer.write_align_program_headers(); writer.write_align_program_headers();
for (section, out_section) in obj.sections.iter().zip(&out_sections) { for ((_, section), out_section) in obj.sections.iter().zip(&out_sections) {
writer.write_program_header(&ProgramHeader { writer.write_program_header(&ProgramHeader {
p_type: elf::PT_LOAD, p_type: elf::PT_LOAD,
p_flags: match section.kind { p_flags: match section.kind {
@ -607,7 +612,7 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
} }
} }
for (section, out_section) in obj.sections.iter().zip(&out_sections) { for ((_, section), out_section) in obj.sections.iter().zip(&out_sections) {
if section.kind == ObjSectionKind::Bss { if section.kind == ObjSectionKind::Bss {
continue; continue;
} }
@ -616,7 +621,7 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
writer.write(&section.data); writer.write(&section.data);
} }
for (section, out_section) in obj.sections.iter().zip(&out_sections) { for ((_, section), out_section) in obj.sections.iter().zip(&out_sections) {
if section.relocations.is_empty() { if section.relocations.is_empty() {
continue; continue;
} }
@ -680,7 +685,7 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
} }
writer.write_null_section_header(); writer.write_null_section_header();
for (section, out_section) in obj.sections.iter().zip(&out_sections) { for ((_, section), out_section) in obj.sections.iter().zip(&out_sections) {
writer.write_section_header(&SectionHeader { writer.write_section_header(&SectionHeader {
name: Some(out_section.name), name: Some(out_section.name),
sh_type: match section.kind { sh_type: match section.kind {
@ -703,7 +708,7 @@ pub fn write_elf(obj: &ObjInfo) -> Result<Vec<u8>> {
sh_entsize: 0, // TODO? sh_entsize: 0, // TODO?
}); });
} }
for (section, out_section) in obj.sections.iter().zip(&out_sections) { for ((_, section), out_section) in obj.sections.iter().zip(&out_sections) {
let Some(rela_name) = out_section.rela_name else { let Some(rela_name) = out_section.rela_name else {
continue; continue;
}; };
@ -853,6 +858,6 @@ fn to_obj_reloc(
_ => Err(anyhow!("Unhandled relocation symbol type {:?}", symbol.kind())), _ => Err(anyhow!("Unhandled relocation symbol type {:?}", symbol.kind())),
}?; }?;
let address = address & !3; // TODO hack: round down for instruction let address = address & !3; // TODO hack: round down for instruction
let reloc_data = ObjReloc { kind: reloc_kind, address, target_symbol, addend }; let reloc_data = ObjReloc { kind: reloc_kind, address, target_symbol, addend, module: None };
Ok(Some(reloc_data)) Ok(Some(reloc_data))
} }

View File

@ -1,5 +1,5 @@
use std::{ use std::{
fs::{File, OpenOptions}, fs::{DirBuilder, File, OpenOptions},
io::{BufRead, BufReader, BufWriter, Cursor, Read}, io::{BufRead, BufReader, BufWriter, Cursor, Read},
path::{Path, PathBuf}, path::{Path, PathBuf},
}; };
@ -35,6 +35,9 @@ pub fn buf_reader<P: AsRef<Path>>(path: P) -> Result<BufReader<File>> {
/// Creates a buffered writer around a file (not memory mapped). /// Creates a buffered writer around a file (not memory mapped).
pub fn buf_writer<P: AsRef<Path>>(path: P) -> Result<BufWriter<File>> { pub fn buf_writer<P: AsRef<Path>>(path: P) -> Result<BufWriter<File>> {
if let Some(parent) = path.as_ref().parent() {
DirBuilder::new().recursive(true).create(parent)?;
}
let file = File::create(&path) let file = File::create(&path)
.with_context(|| format!("Failed to create file '{}'", path.as_ref().display()))?; .with_context(|| format!("Failed to create file '{}'", path.as_ref().display()))?;
Ok(BufWriter::new(file)) Ok(BufWriter::new(file))

View File

@ -9,16 +9,16 @@ use crate::obj::ObjInfo;
/// Rounds `value` up to a multiple of `align` using the add-then-mask idiom.
///
/// The `!(align - 1)` mask only yields a multiple of `align` when `align` is a
/// power of two. `align == 0` underflows in `align - 1`, and `value + (align - 1)`
/// can exceed `u32::MAX`; neither case is guarded here.
const fn align_up(value: u32, align: u32) -> u32 { (value + (align - 1)) & !(align - 1) } const fn align_up(value: u32, align: u32) -> u32 { (value + (align - 1)) & !(align - 1) }
pub fn generate_ldscript(obj: &ObjInfo, auto_force_files: bool) -> Result<String> { pub fn generate_ldscript(obj: &ObjInfo, auto_force_files: bool) -> Result<String> {
let origin = obj.sections.iter().map(|s| s.address).min().unwrap(); let origin = obj.sections.iter().map(|(_, s)| s.address).min().unwrap();
let stack_size = match (obj.stack_address, obj.stack_end) { let stack_size = match (obj.stack_address, obj.stack_end) {
(Some(stack_address), Some(stack_end)) => stack_address - stack_end, (Some(stack_address), Some(stack_end)) => stack_address - stack_end,
_ => 65535, // default _ => 65535, // default
}; };
// Guess section alignment // Guess section alignment
let mut alignments = Vec::with_capacity(obj.sections.len()); let mut alignments = Vec::with_capacity(obj.sections.count());
let mut last_section_end = origin as u32; let mut last_section_end = origin as u32;
for section in &obj.sections { for (_, section) in obj.sections.iter() {
let section_start = section.address as u32; let section_start = section.address as u32;
let mut align = 0x20; let mut align = 0x20;
while align_up(last_section_end, align) < section_start { while align_up(last_section_end, align) < section_start {
@ -40,7 +40,7 @@ pub fn generate_ldscript(obj: &ObjInfo, auto_force_files: bool) -> Result<String
.sections .sections
.iter() .iter()
.zip(alignments) .zip(alignments)
.map(|(s, align)| format!("{} ALIGN({:#X}):{{}}", s.name, align)) .map(|((_, s), align)| format!("{} ALIGN({:#X}):{{}}", s.name, align))
.join("\n "); .join("\n ");
let mut force_files = Vec::with_capacity(obj.link_order.len()); let mut force_files = Vec::with_capacity(obj.link_order.len());
@ -57,7 +57,7 @@ pub fn generate_ldscript(obj: &ObjInfo, auto_force_files: bool) -> Result<String
} }
// Hack to handle missing .sbss2 section... what's the proper way? // Hack to handle missing .sbss2 section... what's the proper way?
let last_section_name = obj.sections.last().unwrap().name.clone(); let last_section_name = obj.sections.iter().next_back().unwrap().1.name.clone();
let last_section_symbol = format!("_f_{}", last_section_name.trim_start_matches('.')); let last_section_symbol = format!("_f_{}", last_section_name.trim_start_matches('.'));
let mut out = include_str!("../../assets/ldscript.lcf") let mut out = include_str!("../../assets/ldscript.lcf")

View File

@ -16,13 +16,10 @@ use regex::{Captures, Regex};
use crate::{ use crate::{
obj::{ obj::{
section_kind_for_section, ObjInfo, ObjSplit, ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags, section_kind_for_section, ObjInfo, ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags,
ObjSymbolKind, ObjSymbolKind,
}, },
util::{ util::file::{map_file, map_reader},
file::{map_file, map_reader},
nested::NestedVec,
},
}; };
#[derive(Debug, Copy, Clone, Eq, PartialEq)] #[derive(Debug, Copy, Clone, Eq, PartialEq)]
@ -658,7 +655,7 @@ pub fn apply_map_file<P: AsRef<Path>>(path: P, obj: &mut ObjInfo) -> Result<()>
} }
pub fn apply_map(result: &MapInfo, obj: &mut ObjInfo) -> Result<()> { pub fn apply_map(result: &MapInfo, obj: &mut ObjInfo) -> Result<()> {
for section in &mut obj.sections { for (_section_index, section) in obj.sections.iter_mut() {
if let Some(info) = result.sections.get(&(section.address as u32)) { if let Some(info) = result.sections.get(&(section.address as u32)) {
let kind = section_kind_for_section(&info.name)?; let kind = section_kind_for_section(&info.name)?;
if section.section_known { if section.section_known {
@ -702,11 +699,9 @@ pub fn apply_map(result: &MapInfo, obj: &mut ObjInfo) -> Result<()> {
} }
// Add section symbols // Add section symbols
for (section_name, symbol_map) in &result.section_symbols { for (section_name, symbol_map) in &result.section_symbols {
let section_index = obj let (section_index, _) = obj
.sections .sections
.iter() .by_name(section_name)?
.find(|s| &s.name == section_name)
.map(|s| s.index)
.ok_or_else(|| anyhow!("Failed to locate section {section_name} from map"))?; .ok_or_else(|| anyhow!("Failed to locate section {section_name} from map"))?;
for symbol_entry in symbol_map.values().flatten() { for symbol_entry in symbol_map.values().flatten() {
add_symbol(obj, symbol_entry, Some(section_index))?; add_symbol(obj, symbol_entry, Some(section_index))?;
@ -721,19 +716,19 @@ pub fn apply_map(result: &MapInfo, obj: &mut ObjInfo) -> Result<()> {
for (section, unit_order) in &result.section_units { for (section, unit_order) in &result.section_units {
let mut units = Vec::new(); let mut units = Vec::new();
let mut existing = HashSet::new(); let mut existing = HashSet::new();
for (addr, unit) in unit_order { for (_addr, unit) in unit_order {
let unit = unit.clone(); let unit = unit.clone();
if !existing.contains(&unit) { if !existing.contains(&unit) {
units.push(unit.clone()); units.push(unit.clone());
existing.insert(unit.clone()); existing.insert(unit.clone());
} }
obj.splits.nested_push(*addr, ObjSplit { // obj.splits.nested_push(*addr, ObjSplit {
unit, // unit,
end: 0, // TODO? // end: 0, // TODO?
align: None, // align: None,
common: false, // TODO? // common: false, // TODO?
autogenerated: false, // autogenerated: false,
}); // });
} }
section_order.push((section.clone(), units)); section_order.push((section.clone(), units));
} }

View File

@ -12,6 +12,8 @@ pub mod nested;
pub mod rarc; pub mod rarc;
pub mod rel; pub mod rel;
pub mod rso; pub mod rso;
pub mod signatures;
pub mod split;
pub mod yaz0; pub mod yaz0;
/// Creates a fixed-size array reference from a slice. /// Creates a fixed-size array reference from a slice.

View File

@ -79,7 +79,6 @@ pub fn process_rel(mut reader: Reader) -> Result<ObjInfo> {
// println!("Section {} offset {:#X} size {:#X}", idx, offset, size); // println!("Section {} offset {:#X} size {:#X}", idx, offset, size);
let index = sections.len();
sections.push(ObjSection { sections.push(ObjSection {
name: format!(".section{}", idx), name: format!(".section{}", idx),
kind: if offset == 0 { kind: if offset == 0 {
@ -97,12 +96,12 @@ pub fn process_rel(mut reader: Reader) -> Result<ObjInfo> {
_ => align, _ => align,
} }
.unwrap_or_default() as u64, .unwrap_or_default() as u64,
index,
elf_index: idx as usize, elf_index: idx as usize,
relocations: vec![], relocations: vec![],
original_address: 0, original_address: 0,
file_offset: offset as u64, file_offset: offset as u64,
section_known: false, section_known: false,
splits: Default::default(),
}); });
if offset == 0 { if offset == 0 {
total_bss_size += size; total_bss_size += size;
@ -116,18 +115,19 @@ pub fn process_rel(mut reader: Reader) -> Result<ObjInfo> {
); );
let mut symbols = Vec::new(); let mut symbols = Vec::new();
let mut add_symbol = |section_idx: u8, offset: u32, name: &str| -> Result<()> { let mut add_symbol = |rel_section_idx: u8, offset: u32, name: &str| -> Result<()> {
if section_idx > 0 { if rel_section_idx > 0 {
let section = sections let (section_index, _) = sections
.iter() .iter()
.find(|section| section.elf_index == section_idx as usize) .enumerate()
.ok_or_else(|| anyhow!("Failed to locate {name} section {section_idx}"))?; .find(|&(_, section)| section.elf_index == rel_section_idx as usize)
log::debug!("Adding {name} section {section_idx} offset {offset:#X}"); .ok_or_else(|| anyhow!("Failed to locate {name} section {rel_section_idx}"))?;
log::debug!("Adding {name} section {rel_section_idx} offset {offset:#X}");
symbols.push(ObjSymbol { symbols.push(ObjSymbol {
name: name.to_string(), name: name.to_string(),
demangled_name: None, demangled_name: None,
address: offset as u64, address: offset as u64,
section: Some(section.index), section: Some(section_index),
size: 0, size: 0,
size_known: false, size_known: false,
flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()), flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()),

View File

@ -89,7 +89,6 @@ pub fn process_rso<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
// println!("Section {} offset {:#X} size {:#X}", idx, offset, size); // println!("Section {} offset {:#X} size {:#X}", idx, offset, size);
let index = sections.len();
sections.push(ObjSection { sections.push(ObjSection {
name: format!(".section{}", idx), name: format!(".section{}", idx),
kind: if offset == 0 { kind: if offset == 0 {
@ -103,12 +102,12 @@ pub fn process_rso<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
size: size as u64, size: size as u64,
data, data,
align: 0, align: 0,
index,
elf_index: idx as usize, elf_index: idx as usize,
relocations: vec![], relocations: vec![],
original_address: 0, original_address: 0,
file_offset: offset as u64, file_offset: offset as u64,
section_known: false, section_known: false,
splits: Default::default(),
}); });
if offset == 0 { if offset == 0 {
total_bss_size += size; total_bss_size += size;
@ -122,18 +121,19 @@ pub fn process_rso<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
); );
let mut symbols = Vec::new(); let mut symbols = Vec::new();
let mut add_symbol = |section_idx: u8, offset: u32, name: &str| -> Result<()> { let mut add_symbol = |rel_section_idx: u8, offset: u32, name: &str| -> Result<()> {
if section_idx > 0 { if rel_section_idx > 0 {
let section = sections let (section_index, _) = sections
.iter() .iter()
.find(|section| section.elf_index == section_idx as usize) .enumerate()
.ok_or_else(|| anyhow!("Failed to locate {name} section {section_idx}"))?; .find(|&(_, section)| section.elf_index == rel_section_idx as usize)
log::debug!("Adding {name} section {section_idx} offset {offset:#X}"); .ok_or_else(|| anyhow!("Failed to locate {name} section {rel_section_idx}"))?;
log::debug!("Adding {name} section {rel_section_idx} offset {offset:#X}");
symbols.push(ObjSymbol { symbols.push(ObjSymbol {
name: name.to_string(), name: name.to_string(),
demangled_name: None, demangled_name: None,
address: offset as u64, address: offset as u64,
section: Some(section.index), section: Some(section_index),
size: 0, size: 0,
size_known: false, size_known: false,
flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()), flags: ObjSymbolFlagSet(ObjSymbolFlags::Global.into()),
@ -182,8 +182,9 @@ pub fn process_rso<P: AsRef<Path>>(path: P) -> Result<ObjInfo> {
let demangled_name = demangle(&name, &DemangleOptions::default()); let demangled_name = demangle(&name, &DemangleOptions::default());
let section = sections let section = sections
.iter() .iter()
.find(|section| section.elf_index == section_idx as usize) .enumerate()
.map(|section| section.index) .find(|&(_, section)| section.elf_index == section_idx as usize)
.map(|(idx, _)| idx)
// HACK: selfiles won't have any sections // HACK: selfiles won't have any sections
.unwrap_or(section_idx as usize); .unwrap_or(section_idx as usize);
log::debug!( log::debug!(

View File

@ -12,7 +12,9 @@ use sha1::{Digest, Sha1};
use crate::{ use crate::{
analysis::tracker::{Relocation, Tracker}, analysis::tracker::{Relocation, Tracker},
array_ref, array_ref,
obj::{ObjInfo, ObjReloc, ObjRelocKind, ObjSymbol, ObjSymbolFlagSet, ObjSymbolKind}, obj::{
ObjInfo, ObjReloc, ObjRelocKind, ObjSection, ObjSymbol, ObjSymbolFlagSet, ObjSymbolKind,
},
util::elf::process_elf, util::elf::process_elf,
}; };
@ -69,19 +71,19 @@ pub fn parse_signatures(sig_str: &str) -> Result<Vec<FunctionSignature>> {
} }
/// Convenience wrapper around `check_signatures` that takes the signatures as text.
///
/// `sig_str` is parsed with `parse_signatures`; a parse failure is propagated by `?`.
/// The parsed list, `addr`, and the first argument (`obj: &ObjInfo` in the old column,
/// `section: &ObjSection` in the new column) are forwarded to `check_signatures`,
/// whose result is returned unchanged.
pub fn check_signatures_str( pub fn check_signatures_str(
obj: &ObjInfo, section: &ObjSection,
addr: u32, addr: u32,
sig_str: &str, sig_str: &str,
) -> Result<Option<FunctionSignature>> { ) -> Result<Option<FunctionSignature>> {
check_signatures(obj, addr, &parse_signatures(sig_str)?) check_signatures(section, addr, &parse_signatures(sig_str)?)
} }
pub fn check_signatures( pub fn check_signatures(
obj: &ObjInfo, section: &ObjSection,
addr: u32, addr: u32,
signatures: &Vec<FunctionSignature>, signatures: &Vec<FunctionSignature>,
) -> Result<Option<FunctionSignature>> { ) -> Result<Option<FunctionSignature>> {
let (_, data) = obj.section_data(addr, 0)?; let data = section.data_range(addr, 0)?;
let mut name = None; let mut name = None;
for signature in signatures { for signature in signatures {
if name.is_none() { if name.is_none() {
@ -104,7 +106,7 @@ pub fn check_signatures(
} }
pub fn apply_symbol(obj: &mut ObjInfo, target: u32, sig_symbol: &OutSymbol) -> Result<usize> { pub fn apply_symbol(obj: &mut ObjInfo, target: u32, sig_symbol: &OutSymbol) -> Result<usize> {
let mut target_section_index = obj.section_at(target).ok().map(|section| section.index); let mut target_section_index = obj.sections.at_address(target).ok().map(|(idx, _)| idx);
if let Some(target_section_index) = target_section_index { if let Some(target_section_index) = target_section_index {
let target_section = &mut obj.sections[target_section_index]; let target_section = &mut obj.sections[target_section_index];
if !target_section.section_known { if !target_section.section_known {
@ -138,15 +140,19 @@ pub fn apply_symbol(obj: &mut ObjInfo, target: u32, sig_symbol: &OutSymbol) -> R
Ok(target_symbol_idx) Ok(target_symbol_idx)
} }
pub fn apply_signature(obj: &mut ObjInfo, addr: u32, signature: &FunctionSignature) -> Result<()> { pub fn apply_signature(
let section_index = obj.section_at(addr)?.index; obj: &mut ObjInfo,
section_index: usize,
addr: u32,
signature: &FunctionSignature,
) -> Result<()> {
let in_symbol = &signature.symbols[signature.symbol]; let in_symbol = &signature.symbols[signature.symbol];
let symbol_idx = apply_symbol(obj, addr, in_symbol)?; let symbol_idx = apply_symbol(obj, addr, in_symbol)?;
let mut tracker = Tracker::new(obj); let mut tracker = Tracker::new(obj);
for reloc in &signature.relocations { for reloc in &signature.relocations {
tracker.known_relocations.insert(addr + reloc.offset); tracker.known_relocations.insert(addr + reloc.offset);
} }
tracker.process_function(obj, obj.symbols.at(symbol_idx))?; tracker.process_function(obj, &obj.symbols[symbol_idx])?;
for (&reloc_addr, reloc) in &tracker.relocations { for (&reloc_addr, reloc) in &tracker.relocations {
if reloc_addr < addr || reloc_addr >= addr + in_symbol.size { if reloc_addr < addr || reloc_addr >= addr + in_symbol.size {
continue; continue;
@ -175,6 +181,7 @@ pub fn apply_signature(obj: &mut ObjInfo, addr: u32, signature: &FunctionSignatu
address: reloc_addr as u64, address: reloc_addr as u64,
target_symbol: target_symbol_idx, target_symbol: target_symbol_idx,
addend: sig_reloc.addend as i64, addend: sig_reloc.addend as i64,
module: None,
}; };
// log::info!("Applying relocation {:#010X?}", obj_reloc); // log::info!("Applying relocation {:#010X?}", obj_reloc);
obj.sections[section_index].relocations.push(obj_reloc); obj.sections[section_index].relocations.push(obj_reloc);
@ -296,7 +303,7 @@ pub fn generate_signature<P: AsRef<Path>>(
let reloc = &section.relocations[reloc_idx]; let reloc = &section.relocations[reloc_idx];
let symbol_idx = match symbol_map.entry(reloc.target_symbol) { let symbol_idx = match symbol_map.entry(reloc.target_symbol) {
btree_map::Entry::Vacant(e) => { btree_map::Entry::Vacant(e) => {
let target = obj.symbols.at(reloc.target_symbol); let target = &obj.symbols[reloc.target_symbol];
let symbol_idx = out_symbols.len(); let symbol_idx = out_symbols.len();
e.insert(symbol_idx); e.insert(symbol_idx);
out_symbols.push(OutSymbol { out_symbols.push(OutSymbol {
@ -308,7 +315,10 @@ pub fn generate_signature<P: AsRef<Path>>(
target.size as u32 target.size as u32
}, },
flags: target.flags, flags: target.flags,
section: target.section.map(|idx| obj.sections[idx].name.clone()), section: target
.section
.and_then(|idx| obj.sections.get(idx))
.map(|section| section.name.clone()),
}); });
symbol_idx symbol_idx
} }

View File

@ -8,6 +8,7 @@ use itertools::Itertools;
use petgraph::{graph::NodeIndex, Graph}; use petgraph::{graph::NodeIndex, Graph};
use crate::{ use crate::{
array_ref,
obj::{ obj::{
ObjArchitecture, ObjInfo, ObjKind, ObjReloc, ObjSection, ObjSectionKind, ObjSplit, ObjArchitecture, ObjInfo, ObjKind, ObjReloc, ObjSection, ObjSectionKind, ObjSplit,
ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags, ObjSymbolKind, ObjSymbolScope, ObjUnit, ObjSymbol, ObjSymbolFlagSet, ObjSymbolFlags, ObjSymbolKind, ObjSymbolScope, ObjUnit,
@ -16,25 +17,35 @@ use crate::{
}; };
/// Create splits for function pointers in the given section. /// Create splits for function pointers in the given section.
fn split_ctors_dtors(obj: &mut ObjInfo, section_start: u32, section_end: u32) -> Result<()> { fn split_ctors_dtors(
let mut new_splits = BTreeMap::new(); obj: &mut ObjInfo,
let mut current_address = section_start; ctors_section_index: usize,
start: u32,
end: u32,
) -> Result<()> {
let ctors_section = &obj.sections[ctors_section_index];
let mut new_splits = BTreeMap::<u32, (usize, ObjSplit)>::new();
let mut current_address = start;
let mut referenced_symbols = vec![]; let mut referenced_symbols = vec![];
while current_address < section_end { while current_address < end {
let (section, chunk) = obj.section_data(current_address, current_address + 4)?; let chunk = ctors_section.data_range(current_address, current_address + 4)?;
let function_addr = u32::from_be_bytes(chunk[0..4].try_into().unwrap()); let function_addr = u32::from_be_bytes(*array_ref!(chunk, 0, 4));
log::debug!("Found {} entry: {:#010X}", section.name, function_addr); log::debug!("Found {} entry: {:#010X}", ctors_section.name, function_addr);
let Some((function_symbol_idx, function_symbol)) = let (text_section_index, text_section) = obj.sections.at_address(function_addr)?;
obj.symbols.kind_at_address(function_addr, ObjSymbolKind::Function)? let Some((function_symbol_idx, function_symbol)) = obj.symbols.kind_at_section_address(
text_section_index,
function_addr,
ObjSymbolKind::Function,
)?
else { else {
bail!("Failed to find function symbol @ {:#010X}", function_addr); bail!("Failed to find function symbol @ {:#010X}", function_addr);
}; };
referenced_symbols.push(function_symbol_idx); referenced_symbols.push(function_symbol_idx);
let ctors_split = obj.split_for(current_address); let ctors_split = ctors_section.splits.for_address(current_address);
let function_split = obj.split_for(function_addr); let function_split = text_section.splits.for_address(function_addr);
let mut expected_unit = None; let mut expected_unit = None;
if let Some((_, ctors_split)) = ctors_split { if let Some((_, ctors_split)) = ctors_split {
@ -45,7 +56,7 @@ fn split_ctors_dtors(obj: &mut ObjInfo, section_start: u32, section_end: u32) ->
ensure!( ensure!(
unit == &function_split.unit, unit == &function_split.unit,
"Mismatched splits for {} {:#010X} ({}) and function {:#010X} ({})", "Mismatched splits for {} {:#010X} ({}) and function {:#010X} ({})",
section.name, ctors_section.name,
current_address, current_address,
unit, unit,
function_addr, function_addr,
@ -67,32 +78,42 @@ fn split_ctors_dtors(obj: &mut ObjInfo, section_start: u32, section_end: u32) ->
log::debug!("Adding splits to unit {}", unit); log::debug!("Adding splits to unit {}", unit);
if ctors_split.is_none() { if ctors_split.is_none() {
log::debug!("Adding split for {} entry @ {:#010X}", section.name, current_address); log::debug!(
new_splits.insert(current_address, ObjSplit { "Adding split for {} entry @ {:#010X}",
ctors_section.name,
current_address
);
new_splits.insert(
current_address,
(ctors_section_index, ObjSplit {
unit: unit.clone(), unit: unit.clone(),
end: current_address + 4, end: current_address + 4,
align: None, align: None,
common: false, common: false,
autogenerated: true, autogenerated: true,
}); }),
);
} }
if function_split.is_none() { if function_split.is_none() {
log::debug!("Adding split for function @ {:#010X}", function_addr); log::debug!("Adding split for function @ {:#010X}", function_addr);
new_splits.insert(function_addr, ObjSplit { new_splits.insert(
function_addr,
(text_section_index, ObjSplit {
unit, unit,
end: function_addr + function_symbol.size as u32, end: function_addr + function_symbol.size as u32,
align: None, align: None,
common: false, common: false,
autogenerated: true, autogenerated: true,
}); }),
);
} }
} }
current_address += 4; current_address += 4;
} }
for (addr, split) in new_splits { for (addr, (section_index, split)) in new_splits {
obj.add_split(addr, split)?; obj.add_split(section_index, addr, split)?;
} }
// Hack to avoid deadstripping // Hack to avoid deadstripping
@ -104,8 +125,9 @@ fn split_ctors_dtors(obj: &mut ObjInfo, section_start: u32, section_end: u32) ->
} }
/// Create splits for extabindex + extab entries. /// Create splits for extabindex + extab entries.
fn split_extabindex(obj: &mut ObjInfo, section_index: usize, section_start: u32) -> Result<()> { fn split_extabindex(obj: &mut ObjInfo, section_index: usize, start: u32) -> Result<()> {
let mut new_splits = BTreeMap::new(); let section = &obj.sections[section_index];
let mut new_splits = BTreeMap::<u32, (usize, ObjSplit)>::new();
let (_, eti_init_info) = obj let (_, eti_init_info) = obj
.symbols .symbols
.by_name("_eti_init_info")? .by_name("_eti_init_info")?
@ -116,13 +138,17 @@ fn split_extabindex(obj: &mut ObjInfo, section_index: usize, section_start: u32)
eti_init_info.section, eti_init_info.section,
section_index section_index
); );
let mut current_address = section_start;
let (extab_section_index, extab_section) =
obj.sections.by_name("extab")?.ok_or_else(|| anyhow!("Failed to find extab section"))?;
let mut current_address = start;
let section_end = eti_init_info.address as u32; let section_end = eti_init_info.address as u32;
while current_address < section_end { while current_address < section_end {
let (_eti_section, chunk) = obj.section_data(current_address, current_address + 12)?; let chunk = section.data_range(current_address, current_address + 12)?;
let function_addr = u32::from_be_bytes(chunk[0..4].try_into().unwrap()); let function_addr = u32::from_be_bytes(*array_ref!(chunk, 0, 4));
let function_size = u32::from_be_bytes(chunk[4..8].try_into().unwrap()); let function_size = u32::from_be_bytes(*array_ref!(chunk, 4, 4));
let extab_addr = u32::from_be_bytes(chunk[8..12].try_into().unwrap()); let extab_addr = u32::from_be_bytes(*array_ref!(chunk, 8, 4));
log::debug!( log::debug!(
"Found extabindex entry: {:#010X} size {:#010X} extab {:#010X}", "Found extabindex entry: {:#010X} size {:#010X} extab {:#010X}",
function_addr, function_addr,
@ -130,8 +156,11 @@ fn split_extabindex(obj: &mut ObjInfo, section_index: usize, section_start: u32)
extab_addr extab_addr
); );
let Some((_, eti_symbol)) = let Some((_, eti_symbol)) = obj.symbols.kind_at_section_address(
obj.symbols.kind_at_address(current_address, ObjSymbolKind::Object)? section_index,
current_address,
ObjSymbolKind::Object,
)?
else { else {
bail!("Failed to find extabindex symbol @ {:#010X}", current_address); bail!("Failed to find extabindex symbol @ {:#010X}", current_address);
}; };
@ -143,8 +172,12 @@ fn split_extabindex(obj: &mut ObjInfo, section_index: usize, section_start: u32)
12 12
); );
let Some((_, function_symbol)) = let (text_section_index, text_section) = obj.sections.at_address(function_addr)?;
obj.symbols.kind_at_address(function_addr, ObjSymbolKind::Function)? let Some((_, function_symbol)) = obj.symbols.kind_at_section_address(
text_section_index,
function_addr,
ObjSymbolKind::Function,
)?
else { else {
bail!("Failed to find function symbol @ {:#010X}", function_addr); bail!("Failed to find function symbol @ {:#010X}", function_addr);
}; };
@ -156,8 +189,11 @@ fn split_extabindex(obj: &mut ObjInfo, section_index: usize, section_start: u32)
function_size function_size
); );
let Some((_, extab_symbol)) = let Some((_, extab_symbol)) = obj.symbols.kind_at_section_address(
obj.symbols.kind_at_address(extab_addr, ObjSymbolKind::Object)? extab_section_index,
extab_addr,
ObjSymbolKind::Object,
)?
else { else {
bail!("Failed to find extab symbol @ {:#010X}", extab_addr); bail!("Failed to find extab symbol @ {:#010X}", extab_addr);
}; };
@ -167,9 +203,9 @@ fn split_extabindex(obj: &mut ObjInfo, section_index: usize, section_start: u32)
extab_symbol.name extab_symbol.name
); );
let extabindex_split = obj.split_for(current_address); let extabindex_split = section.splits.for_address(current_address);
let extab_split = obj.split_for(extab_addr); let extab_split = extab_section.splits.for_address(extab_addr);
let function_split = obj.split_for(function_addr); let function_split = text_section.splits.for_address(function_addr);
let mut expected_unit = None; let mut expected_unit = None;
if let Some((_, extabindex_split)) = extabindex_split { if let Some((_, extabindex_split)) = extabindex_split {
@ -221,43 +257,52 @@ fn split_extabindex(obj: &mut ObjInfo, section_index: usize, section_start: u32)
current_address, current_address,
end end
); );
new_splits.insert(current_address, ObjSplit { new_splits.insert(
current_address,
(section_index, ObjSplit {
unit: unit.clone(), unit: unit.clone(),
end, end,
align: None, align: None,
common: false, common: false,
autogenerated: true, autogenerated: true,
}); }),
);
} }
if extab_split.is_none() { if extab_split.is_none() {
let end = extab_addr + extab_symbol.size as u32; let end = extab_addr + extab_symbol.size as u32;
log::debug!("Adding split for extab @ {:#010X}-{:#010X}", extab_addr, end); log::debug!("Adding split for extab @ {:#010X}-{:#010X}", extab_addr, end);
new_splits.insert(extab_addr, ObjSplit { new_splits.insert(
extab_addr,
(extab_section_index, ObjSplit {
unit: unit.clone(), unit: unit.clone(),
end, end,
align: None, align: None,
common: false, common: false,
autogenerated: true, autogenerated: true,
}); }),
);
} }
if function_split.is_none() { if function_split.is_none() {
let end = function_addr + function_symbol.size as u32; let end = function_addr + function_symbol.size as u32;
log::debug!("Adding split for function @ {:#010X}-{:#010X}", function_addr, end); log::debug!("Adding split for function @ {:#010X}-{:#010X}", function_addr, end);
new_splits.insert(function_addr, ObjSplit { new_splits.insert(
function_addr,
(text_section_index, ObjSplit {
unit, unit,
end, end,
align: None, align: None,
common: false, common: false,
autogenerated: true, autogenerated: true,
}); }),
);
} }
} }
current_address += 12; current_address += 12;
} }
for (addr, split) in new_splits { for (addr, (section_index, split)) in new_splits {
obj.add_split(addr, split)?; obj.add_split(section_index, addr, split)?;
} }
Ok(()) Ok(())
@ -265,12 +310,12 @@ fn split_extabindex(obj: &mut ObjInfo, section_index: usize, section_start: u32)
/// Create splits for gaps between existing splits. /// Create splits for gaps between existing splits.
fn create_gap_splits(obj: &mut ObjInfo) -> Result<()> { fn create_gap_splits(obj: &mut ObjInfo) -> Result<()> {
let mut new_splits = BTreeMap::new(); let mut new_splits = BTreeMap::<u32, (usize, ObjSplit)>::new();
for (section_idx, section) in obj.sections.iter().enumerate() { for (section_index, section) in obj.sections.iter() {
let mut current_address = section.address as u32; let mut current_address = section.address as u32;
let section_end = end_for_section(obj, section_idx)?; let section_end = end_for_section(obj, section_index)?;
let mut file_iter = obj.splits_for_range(current_address..section_end).peekable(); let mut file_iter = section.splits.for_range(..section_end).peekable();
log::debug!( log::debug!(
"Checking splits for section {} ({:#010X}..{:#010X})", "Checking splits for section {} ({:#010X}..{:#010X})",
@ -300,16 +345,12 @@ fn create_gap_splits(obj: &mut ObjInfo) -> Result<()> {
if split_start > current_address { if split_start > current_address {
// Find any duplicate symbols in this range // Find any duplicate symbols in this range
let mut new_split_end = split_start; let mut new_split_end = split_start;
let symbols = obj.symbols.for_range(current_address..split_start).collect_vec(); let symbols = obj
.symbols
.for_section_range(section_index, current_address..split_start)
.collect_vec();
let mut existing_symbols = HashSet::new(); let mut existing_symbols = HashSet::new();
for (_, symbol) in symbols { for (_, symbol) in symbols {
// Sanity check? Maybe not required?
ensure!(
symbol.section == Some(section_idx),
"Expected symbol {} to be in section {}",
symbol.name,
section_idx
);
if !existing_symbols.insert(symbol.name.clone()) { if !existing_symbols.insert(symbol.name.clone()) {
log::debug!( log::debug!(
"Found duplicate symbol {} at {:#010X}", "Found duplicate symbol {} at {:#010X}",
@ -328,13 +369,16 @@ fn create_gap_splits(obj: &mut ObjInfo) -> Result<()> {
); );
let unit = let unit =
format!("{:08X}_{}", current_address, section.name.trim_start_matches('.')); format!("{:08X}_{}", current_address, section.name.trim_start_matches('.'));
new_splits.insert(current_address, ObjSplit { new_splits.insert(
current_address,
(section_index, ObjSplit {
unit: unit.clone(), unit: unit.clone(),
end: new_split_end, end: new_split_end,
align: None, align: None,
common: false, common: false,
autogenerated: true, autogenerated: true,
}); }),
);
current_address = new_split_end; current_address = new_split_end;
continue; continue;
} }
@ -353,8 +397,8 @@ fn create_gap_splits(obj: &mut ObjInfo) -> Result<()> {
} }
// Add new splits // Add new splits
for (addr, split) in new_splits { for (addr, (section_index, split)) in new_splits {
obj.add_split(addr, split)?; obj.add_split(section_index, addr, split)?;
} }
Ok(()) Ok(())
@ -362,35 +406,29 @@ fn create_gap_splits(obj: &mut ObjInfo) -> Result<()> {
/// Ensures that all .bss splits following a common split are also marked as common. /// Ensures that all .bss splits following a common split are also marked as common.
fn update_common_splits(obj: &mut ObjInfo) -> Result<()> { fn update_common_splits(obj: &mut ObjInfo) -> Result<()> {
let Some(bss_section) = obj.sections.iter().find(|s| s.name == ".bss") else { let Some((bss_section_index, bss_section)) = obj.sections.by_name(".bss")? else {
return Ok(()); return Ok(());
}; };
let bss_section_start = bss_section.address as u32; let Some(common_bss_start) =
let bss_section_end = (bss_section.address + bss_section.size) as u32; bss_section.splits.iter().find(|(_, split)| split.common).map(|(addr, _)| addr)
let Some(common_bss_start) = obj
.splits_for_range(bss_section_start..bss_section_end)
.find(|(_, split)| split.common)
.map(|(addr, _)| addr)
else { else {
return Ok(()); return Ok(());
}; };
log::debug!("Found common BSS start at {:#010X}", common_bss_start); log::debug!("Found common BSS start at {:#010X}", common_bss_start);
for (addr, vec) in obj.splits.range_mut(common_bss_start..bss_section_end) { let bss_section = &mut obj.sections[bss_section_index];
for split in vec { for (addr, split) in bss_section.splits.for_range_mut(common_bss_start..) {
if !split.common { if !split.common {
split.common = true; split.common = true;
log::debug!("Added common flag to split {} at {:#010X}", split.unit, addr); log::debug!("Added common flag to split {} at {:#010X}", split.unit, addr);
} }
} }
}
Ok(()) Ok(())
} }
/// Final validation of splits. /// Final validation of splits.
fn validate_splits(obj: &ObjInfo) -> Result<()> { fn validate_splits(obj: &ObjInfo) -> Result<()> {
let mut last_split_end = 0; let mut last_split_end = 0;
for (addr, split) in obj.splits_for_range(..) { for (section_index, section, addr, split) in obj.sections.all_splits() {
let section = obj.section_at(addr)?;
ensure!( ensure!(
addr >= last_split_end, addr >= last_split_end,
"Split {} {} {:#010X}..{:#010X} overlaps with previous split", "Split {} {} {:#010X}..{:#010X} overlaps with previous split",
@ -409,8 +447,11 @@ fn validate_splits(obj: &ObjInfo) -> Result<()> {
); );
last_split_end = split.end; last_split_end = split.end;
if let Some((_, symbol)) = if let Some((_, symbol)) = obj
obj.symbols.for_range(..addr).filter(|&(_, s)| s.size_known && s.size > 0).next_back() .symbols
.for_section_range(section_index, ..addr)
.filter(|&(_, s)| s.size_known && s.size > 0)
.next_back()
{ {
ensure!( ensure!(
addr >= symbol.address as u32 + symbol.size as u32, addr >= symbol.address as u32 + symbol.size as u32,
@ -427,7 +468,7 @@ fn validate_splits(obj: &ObjInfo) -> Result<()> {
if let Some((_, symbol)) = obj if let Some((_, symbol)) = obj
.symbols .symbols
.for_range(..split.end) .for_section_range(section_index, ..split.end)
.filter(|&(_, s)| s.size_known && s.size > 0) .filter(|&(_, s)| s.size_known && s.size > 0)
.next_back() .next_back()
{ {
@ -455,22 +496,23 @@ fn validate_splits(obj: &ObjInfo) -> Result<()> {
/// - Resolving a new object link order /// - Resolving a new object link order
pub fn update_splits(obj: &mut ObjInfo) -> Result<()> { pub fn update_splits(obj: &mut ObjInfo) -> Result<()> {
// Create splits for extab and extabindex entries // Create splits for extab and extabindex entries
if let Some(section) = obj.sections.iter().find(|s| s.name == "extabindex") { if let Some((section_index, section)) = obj.sections.by_name("extabindex")? {
split_extabindex(obj, section.index, section.address as u32)?; let start = section.address as u32;
split_extabindex(obj, section_index, start)?;
} }
// Create splits for .ctors entries // Create splits for .ctors entries
if let Some(section) = obj.sections.iter().find(|s| s.name == ".ctors") { if let Some((section_index, section)) = obj.sections.by_name(".ctors")? {
let section_start = section.address as u32; let start = section.address as u32;
let section_end = section.address as u32 + section.size as u32 - 4; let end = section.address as u32 + section.size as u32 - 4;
split_ctors_dtors(obj, section_start, section_end)?; split_ctors_dtors(obj, section_index, start, end)?;
} }
// Create splits for .dtors entries // Create splits for .dtors entries
if let Some(section) = obj.sections.iter().find(|s| s.name == ".dtors") { if let Some((section_index, section)) = obj.sections.by_name(".dtors")? {
let section_start = section.address as u32 + 4; // skip __destroy_global_chain_reference let start = section.address as u32 + 4; // skip __destroy_global_chain_reference
let section_end = section.address as u32 + section.size as u32 - 4; let end = section.address as u32 + section.size as u32 - 4;
split_ctors_dtors(obj, section_start, section_end)?; split_ctors_dtors(obj, section_index, start, end)?;
} }
// Create gap splits // Create gap splits
@ -502,17 +544,15 @@ fn resolve_link_order(obj: &ObjInfo) -> Result<Vec<ObjUnit>> {
let mut graph = Graph::<String, SplitEdge>::new(); let mut graph = Graph::<String, SplitEdge>::new();
let mut unit_to_index_map = BTreeMap::<String, NodeIndex>::new(); let mut unit_to_index_map = BTreeMap::<String, NodeIndex>::new();
for (_, split) in obj.splits_for_range(..) { for (_, _, _, split) in obj.sections.all_splits() {
unit_to_index_map.insert(split.unit.clone(), NodeIndex::new(0)); unit_to_index_map.insert(split.unit.clone(), NodeIndex::new(0));
} }
for (unit, index) in unit_to_index_map.iter_mut() { for (unit, index) in unit_to_index_map.iter_mut() {
*index = graph.add_node(unit.clone()); *index = graph.add_node(unit.clone());
} }
for section in &obj.sections { for (_section_index, section) in obj.sections.iter() {
let mut iter = obj let mut iter = section.splits.iter().peekable();
.splits_for_range(section.address as u32..(section.address + section.size) as u32)
.peekable();
if section.name == ".ctors" || section.name == ".dtors" { if section.name == ".ctors" || section.name == ".dtors" {
// Skip __init_cpp_exceptions.o // Skip __init_cpp_exceptions.o
let skipped = iter.next(); let skipped = iter.next();
@ -604,10 +644,10 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
objects.push(split_obj); objects.push(split_obj);
} }
for (section_idx, section) in obj.sections.iter().enumerate() { for (section_idx, section) in obj.sections.iter() {
let mut current_address = section.address as u32; let mut current_address = section.address as u32;
let section_end = end_for_section(obj, section_idx)?; let section_end = end_for_section(obj, section_idx)?;
let mut file_iter = obj.splits_for_range(current_address..section_end).peekable(); let mut file_iter = section.splits.for_range(current_address..section_end).peekable();
// Build address to relocation / address to symbol maps // Build address to relocation / address to symbol maps
let relocations = section.build_relocation_map()?; let relocations = section.build_relocation_map()?;
@ -679,14 +719,19 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
address: o.address - current_address as u64, address: o.address - current_address as u64,
target_symbol: o.target_symbol, target_symbol: o.target_symbol,
addend: o.addend, addend: o.addend,
module: o.module,
} }
}) })
.collect(); .collect();
// Add section symbols // Add section symbols
let out_section_idx = file.sections.len(); let out_section_idx = file.sections.next_section_index();
let mut comm_addr = current_address; let mut comm_addr = current_address;
for (symbol_idx, symbol) in obj.symbols.for_range(current_address..file_end) { for (symbol_idx, symbol) in
obj.symbols.for_section_range(section_idx, current_address..file_end).filter(
|&(_, s)| s.section == Some(section_idx) && !is_linker_generated_label(&s.name),
)
{
if symbol_idxs[symbol_idx].is_some() { if symbol_idxs[symbol_idx].is_some() {
continue; // should never happen? continue; // should never happen?
} }
@ -708,8 +753,7 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
} }
comm_addr = (symbol.address + symbol.size) as u32; comm_addr = (symbol.address + symbol.size) as u32;
symbol_idxs[symbol_idx] = Some(file.symbols.count()); symbol_idxs[symbol_idx] = Some(file.symbols.add_direct(ObjSymbol {
file.symbols.add_direct(ObjSymbol {
name: symbol.name.clone(), name: symbol.name.clone(),
demangled_name: symbol.demangled_name.clone(), demangled_name: symbol.demangled_name.clone(),
address: if split.common { 4 } else { symbol.address - current_address as u64 }, address: if split.common { 4 } else { symbol.address - current_address as u64 },
@ -724,7 +768,7 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
kind: symbol.kind, kind: symbol.kind,
align: if split.common { Some(4) } else { symbol.align }, align: if split.common { Some(4) } else { symbol.align },
data_kind: symbol.data_kind, data_kind: symbol.data_kind,
})?; })?);
} }
// For mwldeppc 2.7 and above, a .comment section is required to link without error // For mwldeppc 2.7 and above, a .comment section is required to link without error
@ -752,12 +796,12 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
size: file_end as u64 - current_address as u64, size: file_end as u64 - current_address as u64,
data, data,
align, align,
index: out_section_idx,
elf_index: out_section_idx + 1, elf_index: out_section_idx + 1,
relocations: out_relocations, relocations: out_relocations,
original_address: current_address as u64, original_address: current_address as u64,
file_offset: section.file_offset + (current_address as u64 - section.address), file_offset: section.file_offset + (current_address as u64 - section.address),
section_known: true, section_known: true,
splits: Default::default(),
}); });
} }
@ -769,7 +813,7 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
let mut globalize_symbols = vec![]; let mut globalize_symbols = vec![];
for (obj_idx, out_obj) in objects.iter_mut().enumerate() { for (obj_idx, out_obj) in objects.iter_mut().enumerate() {
let symbol_idxs = &mut object_symbols[obj_idx]; let symbol_idxs = &mut object_symbols[obj_idx];
for section in &mut out_obj.sections { for (_section_index, section) in out_obj.sections.iter_mut() {
for reloc in &mut section.relocations { for reloc in &mut section.relocations {
match symbol_idxs[reloc.target_symbol] { match symbol_idxs[reloc.target_symbol] {
Some(out_sym_idx) => { Some(out_sym_idx) => {
@ -778,7 +822,7 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
None => { None => {
// Extern // Extern
let out_sym_idx = out_obj.symbols.count(); let out_sym_idx = out_obj.symbols.count();
let target_sym = obj.symbols.at(reloc.target_symbol); let target_sym = &obj.symbols[reloc.target_symbol];
// If the symbol is local, we'll upgrade the scope to global // If the symbol is local, we'll upgrade the scope to global
// and rename it to avoid conflicts // and rename it to avoid conflicts
@ -802,14 +846,14 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
if section.name.as_str() == "extabindex" { if section.name.as_str() == "extabindex" {
let Some((target_addr, target_split)) = let Some((target_addr, target_split)) =
obj.split_for(target_sym.address as u32) section.splits.for_address(target_sym.address as u32)
else { else {
bail!( bail!(
"Bad extabindex relocation @ {:#010X}", "Bad extabindex relocation @ {:#010X}",
reloc.address + section.original_address reloc.address + section.original_address
); );
}; };
let target_section = &obj.section_at(target_addr)?.name; let target_section = &obj.sections.at_address(target_addr)?.1.name;
log::error!( log::error!(
"Bad extabindex relocation @ {:#010X}\n\ "Bad extabindex relocation @ {:#010X}\n\
\tSource object: {}:{:#010X} ({})\n\ \tSource object: {}:{:#010X} ({})\n\
@ -837,7 +881,7 @@ pub fn split_obj(obj: &ObjInfo) -> Result<Vec<ObjInfo>> {
for (obj, symbol_map) in objects.iter_mut().zip(&object_symbols) { for (obj, symbol_map) in objects.iter_mut().zip(&object_symbols) {
for (globalize_idx, new_name) in &globalize_symbols { for (globalize_idx, new_name) in &globalize_symbols {
if let Some(symbol_idx) = symbol_map[*globalize_idx] { if let Some(symbol_idx) = symbol_map[*globalize_idx] {
let mut symbol = obj.symbols.at(symbol_idx).clone(); let mut symbol = obj.symbols[symbol_idx].clone();
symbol.name = new_name.clone(); symbol.name = new_name.clone();
if symbol.flags.is_local() { if symbol.flags.is_local() {
log::debug!("Globalizing {} in {}", symbol.name, obj.name); log::debug!("Globalizing {} in {}", symbol.name, obj.name);
@ -956,8 +1000,10 @@ pub fn is_linker_generated_object(name: &str) -> bool {
/// Locate the end address of a section when excluding linker generated objects /// Locate the end address of a section when excluding linker generated objects
pub fn end_for_section(obj: &ObjInfo, section_index: usize) -> Result<u32> { pub fn end_for_section(obj: &ObjInfo, section_index: usize) -> Result<u32> {
let section = &obj.sections[section_index]; let section = obj
let section_start = section.address as u32; .sections
.get(section_index)
.ok_or_else(|| anyhow!("Invalid section index: {}", section_index))?;
let mut section_end = (section.address + section.size) as u32; let mut section_end = (section.address + section.size) as u32;
// .ctors and .dtors end with a linker-generated null pointer, // .ctors and .dtors end with a linker-generated null pointer,
// adjust section size appropriately // adjust section size appropriately
@ -970,7 +1016,7 @@ pub fn end_for_section(obj: &ObjInfo, section_index: usize) -> Result<u32> {
loop { loop {
let last_symbol = obj let last_symbol = obj
.symbols .symbols
.for_range(section_start..section_end) .for_section_range(section_index, ..section_end)
.filter(|(_, s)| s.kind == ObjSymbolKind::Object && s.size_known && s.size > 0) .filter(|(_, s)| s.kind == ObjSymbolKind::Object && s.size_known && s.size > 0)
.next_back(); .next_back();
match last_symbol { match last_symbol {