2024-03-22 03:36:23 +00:00
|
|
|
use std::borrow::Cow;
|
2024-03-17 05:30:27 +00:00
|
|
|
|
|
|
|
use anyhow::{anyhow, bail, ensure, Result};
|
|
|
|
use iced_x86::{
|
|
|
|
Decoder, DecoderOptions, DecoratorKind, Formatter, FormatterOutput, FormatterTextKind,
|
|
|
|
GasFormatter, Instruction, IntelFormatter, MasmFormatter, NasmFormatter, NumberKind, OpKind,
|
2024-03-19 00:10:18 +00:00
|
|
|
PrefixKind, Register,
|
2024-03-17 05:30:27 +00:00
|
|
|
};
|
2024-03-17 18:06:18 +00:00
|
|
|
use object::{pe, Endian, Endianness, File, Object, Relocation, RelocationFlags};
|
2024-03-17 05:30:27 +00:00
|
|
|
|
|
|
|
use crate::{
|
2024-03-19 00:10:18 +00:00
|
|
|
arch::{ObjArch, ProcessCodeResult},
|
|
|
|
diff::{DiffObjConfig, X86Formatter},
|
2024-03-22 03:36:23 +00:00
|
|
|
obj::{ObjInfo, ObjIns, ObjInsArg, ObjInsArgValue, ObjSection, SymbolRef},
|
2024-03-17 05:30:27 +00:00
|
|
|
};
|
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
pub struct ObjArchX86 {
|
|
|
|
bits: u32,
|
|
|
|
endianness: Endianness,
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
impl ObjArchX86 {
|
|
|
|
pub fn new(object: &File) -> Result<Self> {
|
|
|
|
Ok(Self { bits: if object.is_64() { 64 } else { 32 }, endianness: object.endianness() })
|
|
|
|
}
|
|
|
|
}
|
2024-03-17 05:30:27 +00:00
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
impl ObjArch for ObjArchX86 {
|
|
|
|
fn process_code(
|
|
|
|
&self,
|
2024-03-22 03:36:23 +00:00
|
|
|
obj: &ObjInfo,
|
|
|
|
symbol_ref: SymbolRef,
|
2024-03-17 18:06:18 +00:00
|
|
|
config: &DiffObjConfig,
|
|
|
|
) -> Result<ProcessCodeResult> {
|
2024-03-22 03:36:23 +00:00
|
|
|
let (section, symbol) = obj.section_symbol(symbol_ref);
|
2024-05-21 05:52:59 +00:00
|
|
|
let section = section.ok_or_else(|| anyhow!("Code symbol section not found"))?;
|
2024-03-22 03:36:23 +00:00
|
|
|
let code = §ion.data
|
|
|
|
[symbol.section_address as usize..(symbol.section_address + symbol.size) as usize];
|
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
let mut result = ProcessCodeResult { ops: Vec::new(), insts: Vec::new() };
|
2024-03-22 03:36:23 +00:00
|
|
|
let mut decoder = Decoder::with_ip(self.bits, code, symbol.address, DecoderOptions::NONE);
|
2024-03-17 18:06:18 +00:00
|
|
|
let mut formatter: Box<dyn Formatter> = match config.x86_formatter {
|
|
|
|
X86Formatter::Intel => Box::new(IntelFormatter::new()),
|
|
|
|
X86Formatter::Gas => Box::new(GasFormatter::new()),
|
|
|
|
X86Formatter::Nasm => Box::new(NasmFormatter::new()),
|
|
|
|
X86Formatter::Masm => Box::new(MasmFormatter::new()),
|
|
|
|
};
|
|
|
|
formatter.options_mut().set_space_after_operand_separator(config.space_between_args);
|
2024-03-17 05:30:27 +00:00
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
let mut output = InstructionFormatterOutput {
|
|
|
|
formatted: String::new(),
|
|
|
|
ins: ObjIns {
|
|
|
|
address: 0,
|
|
|
|
size: 0,
|
|
|
|
op: 0,
|
|
|
|
mnemonic: String::new(),
|
|
|
|
args: vec![],
|
|
|
|
reloc: None,
|
|
|
|
branch_dest: None,
|
|
|
|
line: None,
|
2024-05-20 23:38:20 +00:00
|
|
|
formatted: String::new(),
|
2024-03-17 18:06:18 +00:00
|
|
|
orig: None,
|
|
|
|
},
|
|
|
|
error: None,
|
|
|
|
ins_operands: vec![],
|
2024-03-17 05:30:27 +00:00
|
|
|
};
|
2024-03-17 18:06:18 +00:00
|
|
|
let mut instruction = Instruction::default();
|
|
|
|
while decoder.can_decode() {
|
|
|
|
decoder.decode_out(&mut instruction);
|
2024-03-17 05:30:27 +00:00
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
let address = instruction.ip();
|
|
|
|
let op = instruction.mnemonic() as u16;
|
2024-03-22 03:36:23 +00:00
|
|
|
let reloc = section
|
|
|
|
.relocations
|
2024-03-17 18:06:18 +00:00
|
|
|
.iter()
|
|
|
|
.find(|r| r.address >= address && r.address < address + instruction.len() as u64);
|
|
|
|
output.ins = ObjIns {
|
|
|
|
address,
|
|
|
|
size: instruction.len() as u8,
|
|
|
|
op,
|
|
|
|
mnemonic: String::new(),
|
|
|
|
args: vec![],
|
|
|
|
reloc: reloc.cloned(),
|
|
|
|
branch_dest: None,
|
2024-03-22 03:36:23 +00:00
|
|
|
line: obj.line_info.as_ref().and_then(|m| m.get(&address).cloned()),
|
2024-05-20 23:38:20 +00:00
|
|
|
formatted: String::new(),
|
2024-03-17 18:06:18 +00:00
|
|
|
orig: None,
|
|
|
|
};
|
|
|
|
// Run the formatter, which will populate output.ins
|
|
|
|
formatter.format(&instruction, &mut output);
|
|
|
|
if let Some(error) = output.error.take() {
|
|
|
|
return Err(error);
|
|
|
|
}
|
|
|
|
ensure!(output.ins_operands.len() == output.ins.args.len());
|
2024-05-20 23:38:20 +00:00
|
|
|
output.ins.formatted.clone_from(&output.formatted);
|
2024-03-17 05:30:27 +00:00
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
// Make sure we've put the relocation somewhere in the instruction
|
|
|
|
if reloc.is_some() && !output.ins.args.iter().any(|a| matches!(a, ObjInsArg::Reloc)) {
|
|
|
|
let mut found = replace_arg(
|
|
|
|
OpKind::Memory,
|
2024-03-17 05:30:27 +00:00
|
|
|
ObjInsArg::Reloc,
|
|
|
|
&mut output.ins.args,
|
|
|
|
&instruction,
|
|
|
|
&output.ins_operands,
|
|
|
|
)?;
|
2024-03-17 18:06:18 +00:00
|
|
|
if !found {
|
|
|
|
found = replace_arg(
|
|
|
|
OpKind::Immediate32,
|
|
|
|
ObjInsArg::Reloc,
|
|
|
|
&mut output.ins.args,
|
|
|
|
&instruction,
|
|
|
|
&output.ins_operands,
|
|
|
|
)?;
|
|
|
|
}
|
|
|
|
ensure!(found, "x86: Failed to find operand for Absolute relocation");
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
2024-03-17 18:06:18 +00:00
|
|
|
if reloc.is_some() && !output.ins.args.iter().any(|a| matches!(a, ObjInsArg::Reloc)) {
|
|
|
|
bail!("Failed to find relocation in instruction");
|
|
|
|
}
|
|
|
|
|
|
|
|
result.ops.push(op);
|
|
|
|
result.insts.push(output.ins.clone());
|
|
|
|
|
|
|
|
// Clear for next iteration
|
|
|
|
output.formatted.clear();
|
|
|
|
output.ins_operands.clear();
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
2024-03-17 18:06:18 +00:00
|
|
|
Ok(result)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn implcit_addend(
|
|
|
|
&self,
|
|
|
|
section: &ObjSection,
|
|
|
|
address: u64,
|
|
|
|
reloc: &Relocation,
|
|
|
|
) -> Result<i64> {
|
|
|
|
match reloc.flags() {
|
|
|
|
RelocationFlags::Coff { typ: pe::IMAGE_REL_I386_DIR32 | pe::IMAGE_REL_I386_REL32 } => {
|
|
|
|
let data = section.data[address as usize..address as usize + 4].try_into()?;
|
|
|
|
Ok(self.endianness.read_i32_bytes(data) as i64)
|
|
|
|
}
|
|
|
|
flags => bail!("Unsupported x86 implicit relocation {flags:?}"),
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
2024-03-17 18:06:18 +00:00
|
|
|
}
|
2024-03-17 05:30:27 +00:00
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
fn demangle(&self, name: &str) -> Option<String> {
|
|
|
|
if name.starts_with('?') {
|
|
|
|
msvc_demangler::demangle(name, msvc_demangler::DemangleFlags::llvm()).ok()
|
|
|
|
} else {
|
2024-03-22 03:36:23 +00:00
|
|
|
cpp_demangle::Symbol::new(name)
|
|
|
|
.ok()
|
|
|
|
.and_then(|s| s.demangle(&cpp_demangle::DemangleOptions::default()).ok())
|
2024-03-17 18:06:18 +00:00
|
|
|
}
|
|
|
|
}
|
2024-03-17 05:30:27 +00:00
|
|
|
|
2024-03-17 18:06:18 +00:00
|
|
|
fn display_reloc(&self, flags: RelocationFlags) -> Cow<'static, str> {
|
|
|
|
match flags {
|
|
|
|
RelocationFlags::Coff { typ } => match typ {
|
|
|
|
pe::IMAGE_REL_I386_DIR32 => Cow::Borrowed("IMAGE_REL_I386_DIR32"),
|
|
|
|
pe::IMAGE_REL_I386_REL32 => Cow::Borrowed("IMAGE_REL_I386_REL32"),
|
2024-03-22 03:36:23 +00:00
|
|
|
_ => Cow::Owned(format!("<{flags:?}>")),
|
2024-03-17 18:06:18 +00:00
|
|
|
},
|
2024-03-22 03:36:23 +00:00
|
|
|
_ => Cow::Owned(format!("<{flags:?}>")),
|
2024-03-17 18:06:18 +00:00
|
|
|
}
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn replace_arg(
|
|
|
|
from: OpKind,
|
|
|
|
to: ObjInsArg,
|
|
|
|
args: &mut [ObjInsArg],
|
|
|
|
instruction: &Instruction,
|
|
|
|
ins_operands: &[Option<u32>],
|
|
|
|
) -> Result<bool> {
|
|
|
|
let mut replace = None;
|
|
|
|
for i in 0..instruction.op_count() {
|
|
|
|
let op_kind = instruction.op_kind(i);
|
|
|
|
if op_kind == from {
|
|
|
|
replace = Some(i);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if let Some(i) = replace {
|
|
|
|
for (j, arg) in args.iter_mut().enumerate() {
|
|
|
|
if ins_operands[j] == Some(i) {
|
|
|
|
*arg = to;
|
|
|
|
return Ok(true);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(false)
|
|
|
|
}
|
|
|
|
|
|
|
|
struct InstructionFormatterOutput {
|
|
|
|
formatted: String,
|
|
|
|
ins: ObjIns,
|
|
|
|
error: Option<anyhow::Error>,
|
|
|
|
ins_operands: Vec<Option<u32>>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl InstructionFormatterOutput {
|
|
|
|
fn push_signed(&mut self, value: i64) {
|
|
|
|
// The formatter writes the '-' operator and then gives us a negative value,
|
|
|
|
// so convert it to a positive value to avoid double negatives
|
|
|
|
if value < 0
|
|
|
|
&& matches!(self.ins.args.last(), Some(ObjInsArg::Arg(ObjInsArgValue::Opaque(v))) if v == "-")
|
|
|
|
{
|
|
|
|
self.ins.args.push(ObjInsArg::Arg(ObjInsArgValue::Signed(value.wrapping_abs())));
|
|
|
|
} else {
|
|
|
|
self.ins.args.push(ObjInsArg::Arg(ObjInsArgValue::Signed(value)));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl FormatterOutput for InstructionFormatterOutput {
|
|
|
|
fn write(&mut self, text: &str, kind: FormatterTextKind) {
|
|
|
|
self.formatted.push_str(text);
|
|
|
|
// Skip whitespace after the mnemonic
|
|
|
|
if self.ins.args.is_empty() && kind == FormatterTextKind::Text {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
self.ins_operands.push(None);
|
|
|
|
match kind {
|
|
|
|
FormatterTextKind::Text | FormatterTextKind::Punctuation => {
|
2024-03-22 03:36:23 +00:00
|
|
|
self.ins.args.push(ObjInsArg::PlainText(text.to_string().into()));
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
|
|
|
FormatterTextKind::Keyword | FormatterTextKind::Operator => {
|
2024-03-22 03:36:23 +00:00
|
|
|
self.ins.args.push(ObjInsArg::Arg(ObjInsArgValue::Opaque(text.to_string().into())));
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
|
|
|
_ => {
|
|
|
|
if self.error.is_none() {
|
|
|
|
self.error = Some(anyhow!("x86: Unsupported FormatterTextKind {:?}", kind));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn write_prefix(&mut self, _instruction: &Instruction, text: &str, _prefix: PrefixKind) {
|
|
|
|
self.formatted.push_str(text);
|
|
|
|
self.ins_operands.push(None);
|
2024-03-22 03:36:23 +00:00
|
|
|
self.ins.args.push(ObjInsArg::Arg(ObjInsArgValue::Opaque(text.to_string().into())));
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fn write_mnemonic(&mut self, _instruction: &Instruction, text: &str) {
|
|
|
|
self.formatted.push_str(text);
|
|
|
|
self.ins.mnemonic = text.to_string();
|
|
|
|
}
|
|
|
|
|
|
|
|
fn write_number(
|
|
|
|
&mut self,
|
|
|
|
_instruction: &Instruction,
|
|
|
|
_operand: u32,
|
|
|
|
instruction_operand: Option<u32>,
|
|
|
|
text: &str,
|
|
|
|
value: u64,
|
|
|
|
number_kind: NumberKind,
|
|
|
|
kind: FormatterTextKind,
|
|
|
|
) {
|
|
|
|
self.formatted.push_str(text);
|
|
|
|
self.ins_operands.push(instruction_operand);
|
|
|
|
|
|
|
|
// Handle relocations
|
|
|
|
match kind {
|
|
|
|
FormatterTextKind::LabelAddress => {
|
|
|
|
if let Some(reloc) = self.ins.reloc.as_ref() {
|
2024-03-17 18:06:18 +00:00
|
|
|
if matches!(reloc.flags, RelocationFlags::Coff {
|
|
|
|
typ: pe::IMAGE_REL_I386_DIR32
|
|
|
|
}) {
|
2024-03-17 05:30:27 +00:00
|
|
|
self.ins.args.push(ObjInsArg::Reloc);
|
|
|
|
return;
|
|
|
|
} else if self.error.is_none() {
|
|
|
|
self.error = Some(anyhow!(
|
2024-03-17 18:06:18 +00:00
|
|
|
"x86: Unsupported LabelAddress relocation flags {:?}",
|
|
|
|
reloc.flags
|
2024-03-17 05:30:27 +00:00
|
|
|
));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
self.ins.args.push(ObjInsArg::BranchDest(value));
|
|
|
|
self.ins.branch_dest = Some(value);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
FormatterTextKind::FunctionAddress => {
|
|
|
|
if let Some(reloc) = self.ins.reloc.as_ref() {
|
2024-03-17 18:06:18 +00:00
|
|
|
if matches!(reloc.flags, RelocationFlags::Coff {
|
|
|
|
typ: pe::IMAGE_REL_I386_REL32
|
|
|
|
}) {
|
2024-03-17 05:30:27 +00:00
|
|
|
self.ins.args.push(ObjInsArg::Reloc);
|
|
|
|
return;
|
|
|
|
} else if self.error.is_none() {
|
|
|
|
self.error = Some(anyhow!(
|
2024-03-17 18:06:18 +00:00
|
|
|
"x86: Unsupported FunctionAddress relocation flags {:?}",
|
|
|
|
reloc.flags
|
2024-03-17 05:30:27 +00:00
|
|
|
));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
_ => {}
|
|
|
|
}
|
|
|
|
|
|
|
|
match number_kind {
|
|
|
|
NumberKind::Int8 => {
|
|
|
|
self.push_signed(value as i8 as i64);
|
|
|
|
}
|
|
|
|
NumberKind::Int16 => {
|
|
|
|
self.push_signed(value as i16 as i64);
|
|
|
|
}
|
|
|
|
NumberKind::Int32 => {
|
|
|
|
self.push_signed(value as i32 as i64);
|
|
|
|
}
|
|
|
|
NumberKind::Int64 => {
|
|
|
|
self.push_signed(value as i64);
|
|
|
|
}
|
|
|
|
NumberKind::UInt8 | NumberKind::UInt16 | NumberKind::UInt32 | NumberKind::UInt64 => {
|
|
|
|
self.ins.args.push(ObjInsArg::Arg(ObjInsArgValue::Unsigned(value)));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn write_decorator(
|
|
|
|
&mut self,
|
|
|
|
_instruction: &Instruction,
|
|
|
|
_operand: u32,
|
|
|
|
instruction_operand: Option<u32>,
|
|
|
|
text: &str,
|
|
|
|
_decorator: DecoratorKind,
|
|
|
|
) {
|
|
|
|
self.formatted.push_str(text);
|
|
|
|
self.ins_operands.push(instruction_operand);
|
2024-03-22 03:36:23 +00:00
|
|
|
self.ins.args.push(ObjInsArg::PlainText(text.to_string().into()));
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fn write_register(
|
|
|
|
&mut self,
|
|
|
|
_instruction: &Instruction,
|
|
|
|
_operand: u32,
|
|
|
|
instruction_operand: Option<u32>,
|
|
|
|
text: &str,
|
|
|
|
_register: Register,
|
|
|
|
) {
|
|
|
|
self.formatted.push_str(text);
|
|
|
|
self.ins_operands.push(instruction_operand);
|
2024-03-22 03:36:23 +00:00
|
|
|
self.ins.args.push(ObjInsArg::Arg(ObjInsArgValue::Opaque(text.to_string().into())));
|
2024-03-17 05:30:27 +00:00
|
|
|
}
|
|
|
|
}
|