From 0dda790639e999eb914d21754acb72bf0b33551d Mon Sep 17 00:00:00 2001 From: rbran Date: Mon, 30 Dec 2024 14:17:22 -0300 Subject: [PATCH 01/53] fix tilib cc print format --- src/tools/tilib.rs | 49 +++++++++++++++++++++++++--------------------- 1 file changed, 27 insertions(+), 22 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index b6f932b..22a4e06 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -41,7 +41,9 @@ fn print_til_section(mut fmt: impl Write, section: &TILSection) -> Result<()> { let dep = core::str::from_utf8(dependency).unwrap(); // TODO open those files? What todo with then? // TODO some files still missing this warning - writeln!(fmt, "Warning: {dep}: No such file or directory")?; + if !dep.is_empty() { + writeln!(fmt, "Warning: {dep}: No such file or directory")?; + } } writeln!(fmt)?; @@ -123,9 +125,9 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b860 if let Some(cc) = section.cc { if section.cm.is_some() || section.cn.is_some() { - write!(fmt, ",")?; + write!(fmt, ", ")?; } - writeln!(fmt, "{}", calling_convention_to_str(cc))?; + write!(fmt, "{}", calling_convention_to_str(cc))?; } writeln!(fmt)?; @@ -466,10 +468,13 @@ fn print_til_type_function( print_til_type(fmt, section, None, &til_type.ret, false, true)?; let cc = match (section.cc, til_type.calling_convention) { - // don't print if using the default cc, or if elipsis just print the '...' as last param - (_, None | Some(CallingConvention::Ellipsis)) => None, - // if uses the default cc, don't print anything - (Some(scc), Some(tcc)) if scc == tcc => None, + // don't print if using the til section default cc + | (_, None) + // if elipsis just print the '...' as last param + | (_, Some(CallingConvention::Ellipsis)) + // if void arg, just don't print the args (there will be none) + | (_, Some(CallingConvention::Voidarg)) => None, + (_, Some(cc)) => Some(calling_convention_to_str(cc)), }; @@ -478,8 +483,8 @@ fn print_til_type_function( match (is_pointer, cc) { (true, None) => write!(fmt, " (*{name})")?, (false, None) => write!(fmt, " {name}")?, - (true, Some(cc)) => write!(fmt, " ({cc} *{name})")?, - (false, Some(cc)) => write!(fmt, " {cc} {name}")?, + (true, Some(cc)) => write!(fmt, " (__{cc} *{name})")?, + (false, Some(cc)) => write!(fmt, " __{cc} {name}")?, } write!(fmt, "(")?; @@ -765,19 +770,19 @@ fn print_til_type_len( fn calling_convention_to_str(cc: CallingConvention) -> &'static str { use idb_rs::til::function::CallingConvention::*; match cc { - Voidarg => "__voidarg", - Cdecl => "__cdecl", - Ellipsis => "__ellipsis", - Stdcall => "__stdcall", - Pascal => "__pascal", - Fastcall => "__fastcall", - Thiscall => "__thiscall", - Swift => "__swift", - Golang => "__golang", - Userpurge => "__userpurge", - Uservars => "__uservars", - Usercall => "__usercall", - Reserved3 => "__ccreserved3", + Voidarg => "voidarg", + Cdecl => "cdecl", + Ellipsis => "ellipsis", + Stdcall => "stdcall", + Pascal => "pascal", + Fastcall => "fastcall", + Thiscall => "thiscall", + Swift => "swift", + Golang => "golang", + Userpurge => "userpurge", + Uservars => "uservars", + Usercall => "usercall", + Reserved3 => "ccreserved3", } } From 5ef02d698a9496408b6827a9163c80c1c320e153 Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 31 Dec 2024 09:40:26 -0300 Subject: [PATCH 02/53] fix tilib invalid utf8 names --- src/tools/tilib.rs | 184 +++++++++++++++++++++++---------------------- 1 file changed, 93 insertions(+), 91 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 22a4e06..00e81a3 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -9,7 +9,6 @@ use idb_rs::til::union::Union; use idb_rs::til::{Basic, TILTypeInfo, Type, TypeVariant, Typedef}; use idb_rs::IDBParser; -use std::borrow::Borrow; use std::fs::File; use std::io::{BufReader, Result, Write}; use std::num::NonZeroU8; @@ -46,15 +45,18 @@ fn print_til_section(mut fmt: impl Write, section: &TILSection) -> Result<()> { } } + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b6d0 writeln!(fmt)?; writeln!(fmt, "TYPE INFORMATION LIBRARY CONTENTS")?; print_header(&mut fmt, section)?; writeln!(fmt)?; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b926 writeln!(fmt, "SYMBOLS")?; print_symbols(&mut fmt, section)?; writeln!(fmt)?; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b94d writeln!(fmt, "TYPES")?; print_types(&mut fmt, section)?; writeln!(fmt)?; @@ -202,14 +204,18 @@ fn print_symbols(fmt: &mut impl Write, section: &TILSection) -> Result<()> { for symbol in §ion.symbols { print_til_type_len(fmt, section, None, &symbol.tinfo)?; let len = section.type_size_bytes(None, &symbol.tinfo).ok(); - match len { - // TODO What is that???? Find it in InnerRef... + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a80 + match len.and_then(|b| u32::try_from(b).ok()) { Some(8) => write!(fmt, " {:016X} ", symbol.ordinal)?, - // TODO is limited to 32bits in InnerRef? - _ => write!(fmt, " {:08X} ", symbol.ordinal & 0xFFFF_FFFF)?, + Some(bytes @ 0..=7) => write!( + fmt, + " {:08X} ", + symbol.ordinal & !(u64::MAX << (bytes * 8)) + )?, + _ => write!(fmt, " {:08X} ", symbol.ordinal)?, } - let name = std::str::from_utf8(&symbol.name).unwrap(); - print_til_type(fmt, section, Some(name), &symbol.tinfo, true, false)?; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a3a + print_til_type(fmt, section, Some(&symbol.name), &symbol.tinfo, true, false)?; writeln!(fmt, ";")?; } Ok(()) @@ -267,8 +273,7 @@ fn print_types_by_ordinals(fmt: &mut impl Write, section: &TILSection) -> Result if let OrdType::Alias((_alias_ord, type_ord)) = ord_type { write!(fmt, "(aliased to {type_ord}) ")?; } - let name = std::str::from_utf8(&final_type.name).unwrap(); - print_til_type_root(fmt, section, Some(name), &final_type.tinfo)?; + print_til_type_root(fmt, section, Some(&final_type.name), &final_type.tinfo)?; writeln!(fmt, ";")?; } Ok(()) @@ -281,8 +286,7 @@ fn print_types_by_name(fmt: &mut impl Write, section: &TILSection) -> Result<()> } print_til_type_len(fmt, section, Some(idx), &symbol.tinfo).unwrap(); write!(fmt, " ")?; - let name = std::str::from_utf8(&symbol.name).unwrap(); - print_til_type_root(fmt, section, Some(name), &symbol.tinfo)?; + print_til_type_root(fmt, section, Some(&symbol.name), &symbol.tinfo)?; writeln!(fmt, ";")?; } Ok(()) @@ -291,7 +295,7 @@ fn print_types_by_name(fmt: &mut impl Write, section: &TILSection) -> Result<()> fn print_til_type_root( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, til_type: &Type, ) -> Result<()> { match &til_type.type_variant { @@ -304,7 +308,7 @@ fn print_til_type_root( fn print_til_type( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, til_type: &Type, print_pointer_space: bool, print_type_prefix: bool, @@ -366,7 +370,7 @@ fn print_til_type( fn print_til_type_basic( fmt: &mut impl Write, _section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, til_basic: &Basic, ) -> Result<()> { const fn signed_name(is_signed: Option) -> &'static str { @@ -377,41 +381,37 @@ fn print_til_type_basic( } let name_space = if name.is_some() { " " } else { "" }; - let name = name.unwrap_or(""); match til_basic { - Basic::Bool => write!(fmt, "bool{name_space}{name}",)?, - Basic::Char => write!(fmt, "char{name_space}{name}",)?, - Basic::Short { is_signed } => { - write!(fmt, "{}short{name_space}{name}", signed_name(*is_signed))? - } - Basic::Void => write!(fmt, "void{name_space}{name}",)?, - Basic::SegReg => write!(fmt, "SegReg{name_space}{name}")?, - Basic::Unknown { bytes: 1 } => write!(fmt, "_BYTE")?, - Basic::Unknown { bytes: 2 } => write!(fmt, "_WORD")?, - Basic::Unknown { bytes: 4 } => write!(fmt, "_DWORD")?, - Basic::Unknown { bytes: 8 } => write!(fmt, "_QWORD")?, - Basic::Unknown { bytes } => write!(fmt, "unknown{bytes}{name_space}{name}")?, - Basic::Int { is_signed } => { - write!(fmt, "{}int{name_space}{name}", signed_name(*is_signed))? - } - Basic::Long { is_signed } => { - write!(fmt, "{}long{name_space}{name}", signed_name(*is_signed))? - } + Basic::Bool => write!(fmt, "bool{name_space}",)?, + Basic::Char => write!(fmt, "char{name_space}",)?, + Basic::Short { is_signed } => write!(fmt, "{}short{name_space}", signed_name(*is_signed))?, + Basic::Void => write!(fmt, "void{name_space}",)?, + Basic::SegReg => write!(fmt, "SegReg{name_space}")?, + Basic::Unknown { bytes: 1 } => write!(fmt, "_BYTE{name_space}")?, + Basic::Unknown { bytes: 2 } => write!(fmt, "_WORD{name_space}")?, + Basic::Unknown { bytes: 4 } => write!(fmt, "_DWORD{name_space}")?, + Basic::Unknown { bytes: 8 } => write!(fmt, "_QWORD{name_space}")?, + Basic::Unknown { bytes } => write!(fmt, "unknown{bytes}{name_space}")?, + Basic::Int { is_signed } => write!(fmt, "{}int{name_space}", signed_name(*is_signed))?, + Basic::Long { is_signed } => write!(fmt, "{}long{name_space}", signed_name(*is_signed))?, Basic::LongLong { is_signed } => { - write!(fmt, "{}longlong{name_space}{name}", signed_name(*is_signed))? + write!(fmt, "{}longlong{name_space}", signed_name(*is_signed))? } Basic::IntSized { bytes, is_signed } => { if let Some(false) = is_signed { write!(fmt, "unsigned ")?; } - write!(fmt, "__int{}{name_space}{name}", bytes.get() * 8)? + write!(fmt, "__int{}{name_space}", bytes.get() * 8)? } - Basic::LongDouble => write!(fmt, "longfloat{name_space}{name}")?, - Basic::Float { bytes } if bytes.get() == 4 => write!(fmt, "float{name_space}{name}")?, - Basic::Float { bytes } if bytes.get() == 8 => write!(fmt, "double{name_space}{name}")?, - Basic::Float { bytes } => write!(fmt, "float{bytes}{name_space}{name}")?, - Basic::BoolSized { bytes } if bytes.get() == 1 => write!(fmt, "bool{name_space}{name}")?, - Basic::BoolSized { bytes } => write!(fmt, "bool{bytes}{name_space}{name}")?, + Basic::LongDouble => write!(fmt, "longfloat{name_space}")?, + Basic::Float { bytes } if bytes.get() == 4 => write!(fmt, "float{name_space}")?, + Basic::Float { bytes } if bytes.get() == 8 => write!(fmt, "double{name_space}")?, + Basic::Float { bytes } => write!(fmt, "float{bytes}{name_space}")?, + Basic::BoolSized { bytes } if bytes.get() == 1 => write!(fmt, "bool{name_space}")?, + Basic::BoolSized { bytes } => write!(fmt, "bool{bytes}{name_space}")?, + } + if let Some(name) = name { + fmt.write_all(name)?; } Ok(()) } @@ -419,7 +419,7 @@ fn print_til_type_basic( fn print_til_type_pointer( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, pointer: &Pointer, print_pointer_space: bool, print_type_prefix: bool, @@ -452,7 +452,9 @@ fn print_til_type_pointer( print_til_type_only(fmt, section, ty)?; write!(fmt, ",{value:#X}) ")?; } - write!(fmt, "{}", name.unwrap_or(""))?; + if let Some(name) = name { + fmt.write_all(name)?; + } } Ok(()) } @@ -460,7 +462,7 @@ fn print_til_type_pointer( fn print_til_type_function( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, til_type: &Function, is_pointer: bool, ) -> Result<()> { @@ -479,12 +481,18 @@ fn print_til_type_function( }; // print name and calling convention - let name = name.unwrap_or(""); match (is_pointer, cc) { - (true, None) => write!(fmt, " (*{name})")?, - (false, None) => write!(fmt, " {name}")?, - (true, Some(cc)) => write!(fmt, " (__{cc} *{name})")?, - (false, Some(cc)) => write!(fmt, " __{cc} {name}")?, + (true, None) => write!(fmt, " (*")?, + (false, None) => write!(fmt, " ")?, + (true, Some(cc)) => write!(fmt, " (__{cc} *")?, + (false, Some(cc)) => write!(fmt, " __{cc} ")?, + } + if let Some(name) = name { + fmt.write_all(name)?; + } + match (is_pointer, cc) { + (true, Some(_)) | (true, None) => write!(fmt, ")")?, + (false, Some(_)) | (false, None) => {} } write!(fmt, "(")?; @@ -492,17 +500,8 @@ fn print_til_type_function( if i != 0 { write!(fmt, ", ")?; } - let param_name = param_name - .as_ref() - .map(|name| String::from_utf8_lossy(&name[..])); - print_til_type( - fmt, - section, - param_name.as_ref().map(|name| name.borrow()), - param, - true, - false, - )?; + let param_name = param_name.as_ref().map(Vec::as_slice); + print_til_type(fmt, section, param_name, param, true, false)?; } if til_type.calling_convention == Some(CallingConvention::Ellipsis) { if !til_type.args.is_empty() { @@ -516,7 +515,7 @@ fn print_til_type_function( fn print_til_type_array( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, til_array: &Array, print_pointer_space: bool, print_type_prefix: bool, @@ -529,9 +528,10 @@ fn print_til_type_array( print_pointer_space, print_type_prefix, )?; - let name_space = if name.is_some() { " " } else { "" }; - let name = name.unwrap_or(""); - write!(fmt, "{name_space}{name}")?; + if let Some(name) = name { + write!(fmt, " ")?; + fmt.write_all(name)?; + } if til_array.nelem != 0 { write!(fmt, "[{}]", til_array.nelem)?; } else { @@ -543,7 +543,7 @@ fn print_til_type_array( fn print_til_type_typedef( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, typedef: &Typedef, ) -> Result<()> { // only print prefix, if is root @@ -563,18 +563,19 @@ fn print_til_type_typedef( } } } - let name_space = if name.is_some() { " " } else { "" }; - let name = name.unwrap_or(""); - write!(fmt, "{name_space}{name}") + if let Some(name) = name { + write!(fmt, " ")?; + fmt.write_all(name)?; + } + Ok(()) } fn print_til_type_struct( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, til_struct: &Struct, ) -> Result<()> { - let name = name.unwrap_or(""); write!(fmt, "struct ")?; if til_struct.is_unaligned { write!(fmt, "__unaligned ")?; @@ -594,12 +595,12 @@ fn print_til_type_struct( if let Some(others) = til_struct.others { write!(fmt, "__other({others:04x}) ")?; } - write!(fmt, "{name} {{")?; + if let Some(name) = name { + fmt.write_all(name)?; + } + write!(fmt, " {{")?; for member in &til_struct.members { - let name = member - .name - .as_ref() - .map(|x| core::str::from_utf8(x).unwrap()); + let name = member.name.as_ref().map(Vec::as_slice); print_til_type(fmt, section, name, &member.member_type, true, false)?; if let Some(att) = &member.att { print_til_struct_member_att(fmt, &member.member_type, att)?; @@ -612,19 +613,19 @@ fn print_til_type_struct( fn print_til_type_union( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, til_union: &Union, ) -> Result<()> { - let name = name.unwrap_or(""); write!(fmt, "union ")?; if let Some(align) = til_union.alignment { write!(fmt, "__attribute__((aligned({align}))) ")?; } - write!(fmt, "{name} {{")?; + if let Some(name) = name { + fmt.write_all(name)?; + } + write!(fmt, " {{")?; for (member_name, member) in &til_union.members { - let member_name = member_name - .as_ref() - .map(|x| core::str::from_utf8(x).unwrap()); + let member_name = member_name.as_ref().map(Vec::as_slice); print_til_type(fmt, section, member_name, member, true, false)?; write!(fmt, ";")?; } @@ -634,19 +635,21 @@ fn print_til_type_union( fn print_til_type_enum( fmt: &mut impl Write, section: &TILSection, - name: Option<&str>, + name: Option<&[u8]>, til_enum: &Enum, ) -> Result<()> { use idb_rs::til::r#enum::EnumFormat::*; - let name = name.unwrap_or(""); let output_fmt_name = match til_enum.output_format { Char => "__char ", Hex => "", SignedDecimal => "__dec ", UnsignedDecimal => "__udec ", }; - write!(fmt, "enum {output_fmt_name}{name} ")?; + write!(fmt, "enum {output_fmt_name}")?; + if let Some(name) = name { + fmt.write_all(name)?; + } match (til_enum.storage_size, section.size_enum) { (None, None) => {} (Some(storage_size), Some(size_enum)) => { @@ -659,20 +662,19 @@ fn print_til_type_enum( .map(|x| x.max(1)) //can't have a value being represented in 0bits .unwrap_or(8); if bits_required / 8 < storage_size.get().into() { - write!(fmt, ": __int{} ", storage_size.get() as usize * 8)?; + write!(fmt, ": __int{}", storage_size.get() as usize * 8)?; } } } (None, Some(_)) => {} (Some(_), None) => {} } - write!(fmt, "{{")?; + write!(fmt, " {{")?; for (member_name, value) in &til_enum.members { - let name = member_name - .as_ref() - .map(|x| core::str::from_utf8(x).unwrap()) - .unwrap_or("_"); - write!(fmt, "{name} = ")?; + if let Some(member_name) = member_name { + fmt.write_all(member_name)?; + } + write!(fmt, " = ")?; match til_enum.output_format { Char if *value <= 0xFF => write!(fmt, "'{}'", (*value) as u8 as char)?, Char => write!(fmt, "'\\xu{value:X}'")?, From fa6f8f81a3db05c41b4d77b3f394620b35253438 Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 31 Dec 2024 15:56:16 -0300 Subject: [PATCH 03/53] add todos for tilib prints --- src/tools/tilib.rs | 31 ++++++++++++++++++++++++------- 1 file changed, 24 insertions(+), 7 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 00e81a3..e5efd54 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -206,14 +206,28 @@ fn print_symbols(fmt: &mut impl Write, section: &TILSection) -> Result<()> { let len = section.type_size_bytes(None, &symbol.tinfo).ok(); // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a80 match len.and_then(|b| u32::try_from(b).ok()) { - Some(8) => write!(fmt, " {:016X} ", symbol.ordinal)?, - Some(bytes @ 0..=7) => write!( - fmt, - " {:08X} ", - symbol.ordinal & !(u64::MAX << (bytes * 8)) - )?, - _ => write!(fmt, " {:08X} ", symbol.ordinal)?, + Some(8) => write!(fmt, " {:016X}", symbol.ordinal)?, + Some(bytes @ 0..=7) => { + write!(fmt, " {:08X}", symbol.ordinal & !(u64::MAX << (bytes * 8)))? + } + _ => write!(fmt, " {:08X}", symbol.ordinal)?, } + + // TODO find this in InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a49 + //let sym_kind = match arg8 { + // 0 => " ", + // 1 => "typedef ", + // 2 => "extern ", + // 3 => "static ", + // 4 => "register", + // 5 => "auto ", + // 6 => "friend ", + // 7 => "virtual ", + // _ => "?!", + //}; + let sym_kind = " "; + write!(fmt, "{}", sym_kind)?; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a3a print_til_type(fmt, section, Some(&symbol.name), &symbol.tinfo, true, false)?; writeln!(fmt, ";")?; @@ -298,8 +312,11 @@ fn print_til_type_root( name: Option<&[u8]>, til_type: &Type, ) -> Result<()> { + // TODO: InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4438d1 + // TODO: if a is a typedef and ComplexRef or something like it, also print typedef match &til_type.type_variant { TypeVariant::Struct(_) | TypeVariant::Union(_) | TypeVariant::Enum(_) => {} + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x443906 _ => write!(fmt, "typedef ")?, } print_til_type(fmt, section, name, til_type, true, true) From 04485202a04ab62f98de9798fca9e9082f764984 Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 31 Dec 2024 16:55:58 -0300 Subject: [PATCH 04/53] restrict til complex ref to typedefs --- src/til.rs | 25 ++--- src/til/enum.rs | 5 +- src/til/section.rs | 236 ++++++++++++++++++++++++++------------------- src/til/struct.rs | 5 +- src/til/union.rs | 7 +- src/tools/tilib.rs | 72 +++++++------- 6 files changed, 198 insertions(+), 152 deletions(-) diff --git a/src/til.rs b/src/til.rs index 6d10644..4464061 100644 --- a/src/til.rs +++ b/src/til.rs @@ -114,10 +114,9 @@ pub enum TypeVariant { Struct(Struct), Union(Union), Enum(Enum), - // TODO narrow what kinds of Type can be inside the Ref - StructRef(Box), - UnionRef(Box), - EnumRef(Box), + StructRef(Typedef), + UnionRef(Typedef), + EnumRef(Typedef), Bitfield(Bitfield), } @@ -139,15 +138,9 @@ impl Type { TypeVariantRaw::Struct(x) => Struct::new(til, x, fields).map(TypeVariant::Struct)?, TypeVariantRaw::Union(x) => Union::new(til, x, fields).map(TypeVariant::Union)?, TypeVariantRaw::Enum(x) => Enum::new(til, x, fields).map(TypeVariant::Enum)?, - TypeVariantRaw::StructRef(type_raw) => { - TypeVariant::StructRef(Box::new(Type::new(til, *type_raw, fields)?)) - } - TypeVariantRaw::UnionRef(type_raw) => { - TypeVariant::UnionRef(Box::new(Type::new(til, *type_raw, fields)?)) - } - TypeVariantRaw::EnumRef(type_raw) => { - TypeVariant::EnumRef(Box::new(Type::new(til, *type_raw, fields)?)) - } + TypeVariantRaw::StructRef(typedef) => TypeVariant::StructRef(typedef), + TypeVariantRaw::UnionRef(typedef) => TypeVariant::UnionRef(typedef), + TypeVariantRaw::EnumRef(typedef) => TypeVariant::EnumRef(typedef), }; Ok(Self { is_const: tinfo_raw.is_const, @@ -215,9 +208,9 @@ pub(crate) enum TypeVariantRaw { Struct(StructRaw), Union(UnionRaw), Enum(EnumRaw), - StructRef(Box), - UnionRef(Box), - EnumRef(Box), + StructRef(Typedef), + UnionRef(Typedef), + EnumRef(Typedef), Bitfield(Bitfield), } diff --git a/src/til/enum.rs b/src/til/enum.rs index df07f4f..ee21207 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -56,7 +56,10 @@ impl EnumRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4803b4 let ref_type = TypeRaw::read_ref(&mut *input, header)?; let _taenum_bits = SDACL::read(&mut *input)?.0; - return Ok(TypeVariantRaw::EnumRef(Box::new(ref_type))); + let TypeVariantRaw::Typedef(ref_type) = ref_type.variant else { + return Err(anyhow!("EnumRef Non Typedef")); + }; + return Ok(TypeVariantRaw::EnumRef(ref_type)); }; let taenum_bits = TAH::read(&mut *input)?.0; diff --git a/src/til/section.rs b/src/til/section.rs index 0cb5f48..7c0d5d1 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -4,7 +4,8 @@ use crate::til::{flag, Basic, TILMacro, TILTypeInfo, TypeVariant}; use crate::IDBSectionCompression; use anyhow::{anyhow, ensure, Result}; use serde::{Deserialize, Serialize}; -use std::collections::HashSet; + +use std::collections::{HashMap, HashSet}; use std::fmt::Debug; use std::io::{BufReader, Read, Write}; use std::num::NonZeroU8; @@ -454,104 +455,6 @@ impl TILSection { .map(CCPtrSize::near_bytes) .unwrap_or(NonZeroU8::new(4).unwrap()) } - - // TODO stub implementation - pub fn type_size_bytes(&self, type_idx: Option, ty: &Type) -> Result { - let mut map = type_idx.into_iter().collect(); - self.inner_type_size_bytes(ty, &mut map) - } - - // map is used to avoid loops - fn inner_type_size_bytes(&self, ty: &Type, map: &mut HashSet) -> Result { - Ok(match &ty.type_variant { - TypeVariant::Basic(Basic::Char) => 1, - // TODO what is the SegReg size? - TypeVariant::Basic(Basic::SegReg) => 1, - TypeVariant::Basic(Basic::Void) => 0, - TypeVariant::Basic(Basic::Unknown { bytes }) => (*bytes).into(), - TypeVariant::Basic(Basic::Bool) => self.size_bool.get().into(), - TypeVariant::Basic(Basic::Short { .. }) => self.sizeof_short().get().into(), - TypeVariant::Basic(Basic::Int { .. }) => self.size_int.get().into(), - TypeVariant::Basic(Basic::Long { .. }) => self.sizeof_long().get().into(), - TypeVariant::Basic(Basic::LongLong { .. }) => self.sizeof_long_long().get().into(), - TypeVariant::Basic(Basic::IntSized { bytes, .. }) => bytes.get().into(), - TypeVariant::Basic(Basic::BoolSized { bytes }) => bytes.get().into(), - // TODO what's the long double default size if it's not defined? - TypeVariant::Basic(Basic::LongDouble) => { - self.size_long_double.map(|x| x.get()).unwrap_or(8).into() - } - TypeVariant::Basic(Basic::Float { bytes }) => bytes.get().into(), - // TODO is pointer always near? Do pointer size default to 4? - TypeVariant::Pointer(_) => self.addr_size().get().into(), - TypeVariant::Function(_) => 0, // function type dont have a size, only a pointer to it - TypeVariant::Array(array) => { - let element_len = self.inner_type_size_bytes(&array.elem_type, map)?; - element_len * array.nelem as u64 - } - TypeVariant::Typedef(Typedef::Name(name)) => { - let inner_type_idx = self.get_name_idx(name).ok_or_else(|| { - anyhow!( - "Unable to find typedef by name: {}", - String::from_utf8_lossy(name) - ) - })?; - if !map.insert(inner_type_idx) { - return Err(anyhow!( - "Loop detected, type inside itself using named typedef " - )); - } - let inner_type = self.get_type_by_idx(inner_type_idx); - let result = self.inner_type_size_bytes(&inner_type.tinfo, map)?; - map.remove(&inner_type_idx); - result - } - TypeVariant::Typedef(Typedef::Ordinal(ord)) => { - let inner_type_idx = self - .get_ord_idx(crate::id0::Id0TilOrd { ord: (*ord).into() }) - .ok_or_else(|| anyhow!("Unable to find typedef by ord: {ord}",))?; - if !map.insert(inner_type_idx) { - return Err(anyhow!( - "Loop detected, type inside itself using ordinal typedef" - )); - } - let inner_type = self.get_type_by_idx(inner_type_idx); - let result = self.inner_type_size_bytes(&inner_type.tinfo, map)?; - map.remove(&inner_type_idx); - result - } - TypeVariant::StructRef(ref_type) - | TypeVariant::UnionRef(ref_type) - | TypeVariant::EnumRef(ref_type) => self.inner_type_size_bytes(ref_type, map)?, - TypeVariant::Struct(Struct { members, .. }) => { - let mut sum = 0u64; - // TODO default alignment, seems like default alignemnt is the field size - let align: u64 = 1; - for member in members { - let field_size = self.inner_type_size_bytes(&member.member_type, map)?; - let align_diff = sum % align; - if align_diff != 0 { - sum += align - align_diff; - } - sum += field_size; - } - sum - } - TypeVariant::Union(Union { members, .. }) => { - let mut max = 0; - for (_, member) in members { - let size = self.inner_type_size_bytes(member, map)?; - max = max.max(size); - } - max - } - TypeVariant::Enum(Enum { storage_size, .. }) => storage_size - .or(self.size_enum) - .map(|x| x.get()) - .unwrap_or(4) - .into(), - TypeVariant::Bitfield(bitfield) => bitfield.width.into(), - }) - } } // TODO remove deserialize and implement a verification if the value is correct @@ -780,3 +683,138 @@ impl TILSection { Ok(()) } } + +pub struct TILTypeSizeSolver<'a> { + section: &'a TILSection, + solved: HashMap, + // HACK used to avoid infinte lopping during recursive solving + solving: HashSet, +} + +impl<'a> TILTypeSizeSolver<'a> { + pub fn new(section: &'a TILSection) -> Self { + Self { + section, + solved: Default::default(), + solving: Default::default(), + } + } + + // TODO make a type for type_idx and symbol_idx, accept both here + /// NOTE that type_idx need to be specified if not a symbol + pub fn type_size_bytes(&mut self, type_idx: Option, ty: &Type) -> Option { + assert!(self.solving.is_empty()); + if let Some(idx) = type_idx { + // if cached return it + if let Some(solved) = self.cached(idx) { + return Some(solved); + } + self.solving.insert(idx); + } + let result = self.inner_type_size_bytes(ty); + if let Some(idx) = type_idx { + assert!(self.solving.remove(&idx)); + } + assert!(self.solving.is_empty()); + if let (Some(idx), Some(result)) = (type_idx, result) { + assert!(self.solved.insert(idx, result).is_none()); + } + result + } + + fn cached(&self, idx: usize) -> Option { + self.solved.get(&idx).copied() + } + + fn inner_type_size_bytes(&mut self, ty: &Type) -> Option { + Some(match &ty.type_variant { + TypeVariant::Basic(Basic::Char) => 1, + // TODO what is the SegReg size? + TypeVariant::Basic(Basic::SegReg) => 1, + TypeVariant::Basic(Basic::Void) => 0, + TypeVariant::Basic(Basic::Unknown { bytes }) => (*bytes).into(), + TypeVariant::Basic(Basic::Bool) => self.section.size_bool.get().into(), + TypeVariant::Basic(Basic::Short { .. }) => self.section.sizeof_short().get().into(), + TypeVariant::Basic(Basic::Int { .. }) => self.section.size_int.get().into(), + TypeVariant::Basic(Basic::Long { .. }) => self.section.sizeof_long().get().into(), + TypeVariant::Basic(Basic::LongLong { .. }) => { + self.section.sizeof_long_long().get().into() + } + TypeVariant::Basic(Basic::IntSized { bytes, .. }) => bytes.get().into(), + TypeVariant::Basic(Basic::BoolSized { bytes }) => bytes.get().into(), + // TODO what's the long double default size if it's not defined? + TypeVariant::Basic(Basic::LongDouble) => self + .section + .size_long_double + .map(|x| x.get()) + .unwrap_or(8) + .into(), + TypeVariant::Basic(Basic::Float { bytes }) => bytes.get().into(), + // TODO is pointer always near? Do pointer size default to 4? + TypeVariant::Pointer(_) => self.section.addr_size().get().into(), + TypeVariant::Function(_) => 0, // function type dont have a size, only a pointer to it + TypeVariant::Array(array) => { + let element_len = self.inner_type_size_bytes(&array.elem_type)?; + element_len * array.nelem as u64 + } + TypeVariant::StructRef(ref_type) + | TypeVariant::UnionRef(ref_type) + | TypeVariant::EnumRef(ref_type) + | TypeVariant::Typedef(ref_type) => self.solve_typedef(ref_type)?, + TypeVariant::Struct(Struct { members, .. }) => { + let mut sum = 0u64; + // TODO default alignment, seems like default alignemnt is the field size + let align: u64 = 1; + for member in members { + let field_size = self.inner_type_size_bytes(&member.member_type)?; + let align_diff = sum % align; + if align_diff != 0 { + sum += align - align_diff; + } + sum += field_size; + } + sum + } + TypeVariant::Union(Union { members, .. }) => { + let mut max = 0; + for (_, member) in members { + let size = self.inner_type_size_bytes(member)?; + max = max.max(size); + } + max + } + TypeVariant::Enum(Enum { storage_size, .. }) => storage_size + .or(self.section.size_enum) + .map(|x| x.get()) + .unwrap_or(4) + .into(), + TypeVariant::Bitfield(bitfield) => bitfield.width.into(), + }) + } + + fn solve_typedef(&mut self, typedef: &Typedef) -> Option { + let idx = match typedef { + Typedef::Name(name) => { + // NOTE missing names may indicate a external type, just return no size + self.section.get_name_idx(name)? + } + Typedef::Ordinal(ord) => self + .section + .get_ord_idx(crate::id0::Id0TilOrd { ord: (*ord).into() })?, + }; + // if cached return it + if let Some(solved) = self.cached(idx) { + return Some(solved); + } + if !self.solving.insert(idx) { + return None; + } + let inner_type = self.section.get_type_by_idx(idx); + let result = self.inner_type_size_bytes(&inner_type.tinfo); + self.solving.remove(&idx); + if let Some(result) = result { + assert!(self.solved.insert(idx, result).is_none()); + } + result + } +} diff --git a/src/til/struct.rs b/src/til/struct.rs index 618508f..ce4d441 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -68,7 +68,10 @@ impl StructRaw { // simple reference let ref_type = TypeRaw::read_ref(&mut *input, header)?; let _taudt_bits = SDACL::read(&mut *input)?; - return Ok(TypeVariantRaw::StructRef(Box::new(ref_type))); + let TypeVariantRaw::Typedef(ref_type) = ref_type.variant else { + return Err(anyhow!("StructRef Non Typedef")); + }; + return Ok(TypeVariantRaw::StructRef(ref_type)); }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4808f9 diff --git a/src/til/union.rs b/src/til/union.rs index c5e6026..bae359d 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -1,3 +1,5 @@ +use anyhow::anyhow; + use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; @@ -56,7 +58,10 @@ impl UnionRaw { // is ref let ref_type = TypeRaw::read_ref(&mut *input, header)?; let _taudt_bits = SDACL::read(&mut *input)?; - return Ok(TypeVariantRaw::UnionRef(Box::new(ref_type))); + let TypeVariantRaw::Typedef(ref_type) = ref_type.variant else { + return Err(anyhow!("UnionRef Non Typedef")); + }; + return Ok(TypeVariantRaw::UnionRef(ref_type)); }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4808f9 diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index e5efd54..24a0941 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -4,7 +4,7 @@ use idb_rs::til::function::{CallingConvention, Function}; use idb_rs::til::pointer::Pointer; use idb_rs::til::r#enum::Enum; use idb_rs::til::r#struct::{Struct, StructMemberAtt}; -use idb_rs::til::section::TILSection; +use idb_rs::til::section::{TILSection, TILTypeSizeSolver}; use idb_rs::til::union::Union; use idb_rs::til::{Basic, TILTypeInfo, Type, TypeVariant, Typedef}; use idb_rs::IDBParser; @@ -51,14 +51,16 @@ fn print_til_section(mut fmt: impl Write, section: &TILSection) -> Result<()> { print_header(&mut fmt, section)?; writeln!(fmt)?; + let mut size_solver = TILTypeSizeSolver::new(section); + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b926 writeln!(fmt, "SYMBOLS")?; - print_symbols(&mut fmt, section)?; + print_symbols(&mut fmt, section, &mut size_solver)?; writeln!(fmt)?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b94d writeln!(fmt, "TYPES")?; - print_types(&mut fmt, section)?; + print_types(&mut fmt, section, &mut size_solver)?; writeln!(fmt)?; // TODO streams @@ -200,10 +202,14 @@ fn compiler_id_to_str(compiler: Compiler) -> &'static str { } } -fn print_symbols(fmt: &mut impl Write, section: &TILSection) -> Result<()> { +fn print_symbols( + fmt: &mut impl Write, + section: &TILSection, + solver: &mut TILTypeSizeSolver<'_>, +) -> Result<()> { for symbol in §ion.symbols { - print_til_type_len(fmt, section, None, &symbol.tinfo)?; - let len = section.type_size_bytes(None, &symbol.tinfo).ok(); + print_til_type_len(fmt, None, &symbol.tinfo, solver)?; + let len = solver.type_size_bytes(None, &symbol.tinfo); // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a80 match len.and_then(|b| u32::try_from(b).ok()) { Some(8) => write!(fmt, " {:016X}", symbol.ordinal)?, @@ -235,15 +241,23 @@ fn print_symbols(fmt: &mut impl Write, section: &TILSection) -> Result<()> { Ok(()) } -fn print_types(fmt: &mut impl Write, section: &TILSection) -> Result<()> { +fn print_types( + fmt: &mut impl Write, + section: &TILSection, + solver: &mut TILTypeSizeSolver<'_>, +) -> Result<()> { writeln!(fmt, "(enumerated by ordinals)")?; - print_types_by_ordinals(fmt, section)?; + print_types_by_ordinals(fmt, section, solver)?; writeln!(fmt, "(enumerated by names)")?; - print_types_by_name(fmt, section)?; + print_types_by_name(fmt, section, solver)?; Ok(()) } -fn print_types_by_ordinals(fmt: &mut impl Write, section: &TILSection) -> Result<()> { +fn print_types_by_ordinals( + fmt: &mut impl Write, + section: &TILSection, + solver: &mut TILTypeSizeSolver<'_>, +) -> Result<()> { enum OrdType<'a> { Alias(&'a (u32, u32)), Type { idx: usize, ty: &'a TILTypeInfo }, @@ -282,7 +296,7 @@ fn print_types_by_ordinals(fmt: &mut impl Write, section: &TILSection) -> Result } OrdType::Type { idx, ty } => (idx, ty), }; - print_til_type_len(fmt, section, Some(idx), &final_type.tinfo).unwrap(); + print_til_type_len(fmt, Some(idx), &final_type.tinfo, solver).unwrap(); write!(fmt, "{:5}. ", ord_num)?; if let OrdType::Alias((_alias_ord, type_ord)) = ord_type { write!(fmt, "(aliased to {type_ord}) ")?; @@ -293,12 +307,16 @@ fn print_types_by_ordinals(fmt: &mut impl Write, section: &TILSection) -> Result Ok(()) } -fn print_types_by_name(fmt: &mut impl Write, section: &TILSection) -> Result<()> { +fn print_types_by_name( + fmt: &mut impl Write, + section: &TILSection, + solver: &mut TILTypeSizeSolver<'_>, +) -> Result<()> { for (idx, symbol) in section.types.iter().enumerate() { if symbol.name.is_empty() { continue; } - print_til_type_len(fmt, section, Some(idx), &symbol.tinfo).unwrap(); + print_til_type_len(fmt, Some(idx), &symbol.tinfo, solver).unwrap(); write!(fmt, " ")?; print_til_type_root(fmt, section, Some(&symbol.name), &symbol.tinfo)?; writeln!(fmt, ";")?; @@ -358,27 +376,11 @@ fn print_til_type( print_type_prefix, ), TypeVariant::Typedef(typedef) => print_til_type_typedef(fmt, section, name, typedef), - TypeVariant::StructRef(ref_type) => print_til_type( - fmt, - section, - name, - ref_type, - print_pointer_space, - print_type_prefix, - ), + TypeVariant::UnionRef(ref_type) + | TypeVariant::EnumRef(ref_type) + | TypeVariant::StructRef(ref_type) => print_til_type_typedef(fmt, section, name, ref_type), TypeVariant::Struct(til_struct) => print_til_type_struct(fmt, section, name, til_struct), - TypeVariant::UnionRef(ref_type) => { - print_til_type(fmt, section, name, ref_type, true, print_type_prefix) - } TypeVariant::Union(til_union) => print_til_type_union(fmt, section, name, til_union), - TypeVariant::EnumRef(ref_type) => print_til_type( - fmt, - section, - name, - ref_type, - print_pointer_space, - print_type_prefix, - ), TypeVariant::Enum(til_enum) => print_til_type_enum(fmt, section, name, til_enum), TypeVariant::Bitfield(_bitfield) => write!(fmt, "todo!(\"Bitfield\")"), } @@ -772,15 +774,17 @@ fn print_til_type_only(fmt: &mut impl Write, section: &TILSection, tinfo: &Type) fn print_til_type_len( fmt: &mut impl Write, - section: &TILSection, idx: Option, tinfo: &Type, + size_solver: &mut TILTypeSizeSolver<'_>, ) -> Result<()> { if let TypeVariant::Function(_function) = &tinfo.type_variant { write!(fmt, "FFFFFFFF")?; } else { // if the type is unknown it just prints "FFFFFFF" - let len = section.type_size_bytes(idx, tinfo).unwrap_or(0xFFFF_FFFF); + let len = size_solver + .type_size_bytes(idx, tinfo) + .unwrap_or(0xFFFF_FFFF); write!(fmt, "{len:08X}")?; } Ok(()) From 8122efcd3012eedec379fb90c2dbf0778fbda585 Mon Sep 17 00:00:00 2001 From: rbran Date: Thu, 2 Jan 2025 10:04:25 -0300 Subject: [PATCH 05/53] fix tilib enum/struct embed types --- src/til.rs | 20 +++--- src/til/array.rs | 2 +- src/til/enum.rs | 4 +- src/til/function.rs | 4 +- src/til/pointer.rs | 2 +- src/til/struct.rs | 6 +- src/til/union.rs | 4 +- src/tools/tilib.rs | 158 +++++++++++++++++++++++++++++++++++++++----- 8 files changed, 161 insertions(+), 39 deletions(-) diff --git a/src/til.rs b/src/til.rs index 4464061..b03e7ea 100644 --- a/src/til.rs +++ b/src/til.rs @@ -78,12 +78,11 @@ impl TILTypeInfo { let fieldcmts = cursor.read_c_string_raw()?; let sclass: u8 = cursor.read_u8()?; - let mut fields_iter = fields.into_iter(); + let mut fields_iter = fields + .into_iter() + .map(|field| field.is_empty().then_some(None).unwrap_or(Some(field))); let tinfo = Type::new(til, tinfo_raw, &mut fields_iter)?; - ensure!( - fields_iter.as_slice().is_empty(), - "Extra fields found for til" - ); + ensure!(fields_iter.next() == None, "Extra fields found for til"); Ok(Self { _flags: flags, @@ -124,7 +123,7 @@ impl Type { pub(crate) fn new( til: &TILSectionHeader, tinfo_raw: TypeRaw, - fields: &mut impl Iterator>, + fields: &mut impl Iterator>>, ) -> Result { let type_variant = match tinfo_raw.variant { TypeVariantRaw::Basic(x) => TypeVariant::Basic(x), @@ -181,12 +180,11 @@ impl Type { )); } } - let mut fields_iter = fields.into_iter(); + let mut fields_iter = fields + .into_iter() + .map(|field| field.is_empty().then_some(None).unwrap_or(Some(field))); let result = Self::new(&header, type_raw, &mut fields_iter)?; - ensure!( - fields_iter.as_slice().is_empty(), - "Extra fields found for id0 til" - ); + ensure!(fields_iter.next() == None, "Extra fields found for id0 til"); Ok(result) } } diff --git a/src/til/array.rs b/src/til/array.rs index 499a5b6..14120ff 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -14,7 +14,7 @@ impl Array { pub(crate) fn new( til: &TILSectionHeader, value: ArrayRaw, - fields: &mut impl Iterator>, + fields: &mut impl Iterator>>, ) -> anyhow::Result { Ok(Self { base: value.base, diff --git a/src/til/enum.rs b/src/til/enum.rs index ee21207..65d95bf 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -18,12 +18,12 @@ impl Enum { pub(crate) fn new( _til: &TILSectionHeader, value: EnumRaw, - fields: &mut impl Iterator>, + fields: &mut impl Iterator>>, ) -> anyhow::Result { let members = value .members .into_iter() - .map(|member| (fields.next(), member)) + .map(|member| (fields.next().flatten(), member)) .collect(); Ok(Self { output_format: value.output_format, diff --git a/src/til/function.rs b/src/til/function.rs index 7063d24..0362890 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -29,12 +29,12 @@ impl Function { pub(crate) fn new( til: &TILSectionHeader, value: FunctionRaw, - fields: &mut impl Iterator>, + fields: &mut impl Iterator>>, ) -> Result { let ret = Type::new(til, *value.ret, &mut *fields)?; let mut args = Vec::with_capacity(value.args.len()); for (arg_type, arg_loc) in value.args { - let field_name = fields.next(); + let field_name = fields.next().flatten(); let new_member = Type::new(til, arg_type, &mut *fields)?; args.push((field_name, new_member, arg_loc)); } diff --git a/src/til/pointer.rs b/src/til/pointer.rs index 79fc92b..e1870b9 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -16,7 +16,7 @@ impl Pointer { pub(crate) fn new( til: &TILSectionHeader, raw: PointerRaw, - fields: &mut impl Iterator>, + fields: &mut impl Iterator>>, ) -> Result { let shifted = raw .shifted diff --git a/src/til/struct.rs b/src/til/struct.rs index ce4d441..b06d3c9 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -30,12 +30,12 @@ impl Struct { pub(crate) fn new( til: &TILSectionHeader, value: StructRaw, - fields: &mut impl Iterator>, + fields: &mut impl Iterator>>, ) -> Result { let members = value .members .into_iter() - .map(|member| StructMember::new(til, fields.next(), member, &mut *fields)) + .map(|member| StructMember::new(til, fields.next().flatten(), member, &mut *fields)) .collect::>()?; Ok(Struct { effective_alignment: value.effective_alignment, @@ -108,7 +108,7 @@ impl StructMember { til: &TILSectionHeader, name: Option>, m: StructMemberRaw, - fields: &mut impl Iterator>, + fields: &mut impl Iterator>>, ) -> Result { Ok(Self { name, diff --git a/src/til/union.rs b/src/til/union.rs index bae359d..3ee6977 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -20,13 +20,13 @@ impl Union { pub(crate) fn new( til: &TILSectionHeader, value: UnionRaw, - fields: &mut impl Iterator>, + fields: &mut impl Iterator>>, ) -> anyhow::Result { let members = value .members .into_iter() .map(|member| { - let field_name = fields.next(); + let field_name = fields.next().flatten(); let new_member = Type::new(til, member, &mut *fields)?; Ok((field_name, new_member)) }) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 24a0941..432c357 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -235,7 +235,15 @@ fn print_symbols( write!(fmt, "{}", sym_kind)?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a3a - print_til_type(fmt, section, Some(&symbol.name), &symbol.tinfo, true, false)?; + print_til_type( + fmt, + section, + Some(&symbol.name), + &symbol.tinfo, + true, + false, + true, + )?; writeln!(fmt, ";")?; } Ok(()) @@ -337,7 +345,7 @@ fn print_til_type_root( // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x443906 _ => write!(fmt, "typedef ")?, } - print_til_type(fmt, section, name, til_type, true, true) + print_til_type(fmt, section, name, til_type, true, true, true) } fn print_til_type( @@ -347,6 +355,7 @@ fn print_til_type( til_type: &Type, print_pointer_space: bool, print_type_prefix: bool, + print_name: bool, ) -> Result<()> { if til_type.is_volatile { write!(fmt, "volatile ")?; @@ -375,12 +384,20 @@ fn print_til_type( print_pointer_space, print_type_prefix, ), - TypeVariant::Typedef(typedef) => print_til_type_typedef(fmt, section, name, typedef), + TypeVariant::Typedef(ref_type) => { + print_til_type_typedef(fmt, section, name, ref_type, false) + } TypeVariant::UnionRef(ref_type) | TypeVariant::EnumRef(ref_type) - | TypeVariant::StructRef(ref_type) => print_til_type_typedef(fmt, section, name, ref_type), - TypeVariant::Struct(til_struct) => print_til_type_struct(fmt, section, name, til_struct), - TypeVariant::Union(til_union) => print_til_type_union(fmt, section, name, til_union), + | TypeVariant::StructRef(ref_type) => { + print_til_type_typedef(fmt, section, name, ref_type, true) + } + TypeVariant::Struct(til_struct) => { + print_til_type_struct(fmt, section, name, til_struct, print_name) + } + TypeVariant::Union(til_union) => { + print_til_type_union(fmt, section, name, til_union, print_name) + } TypeVariant::Enum(til_enum) => print_til_type_enum(fmt, section, name, til_enum), TypeVariant::Bitfield(_bitfield) => write!(fmt, "todo!(\"Bitfield\")"), } @@ -455,6 +472,7 @@ fn print_til_type_pointer( &pointer.typ, print_pointer_space, print_type_prefix, + true, )?; if print_pointer_space { write!(fmt, " ")?; @@ -486,7 +504,7 @@ fn print_til_type_function( is_pointer: bool, ) -> Result<()> { // return type - print_til_type(fmt, section, None, &til_type.ret, false, true)?; + print_til_type(fmt, section, None, &til_type.ret, false, true, true)?; let cc = match (section.cc, til_type.calling_convention) { // don't print if using the til section default cc @@ -520,7 +538,7 @@ fn print_til_type_function( write!(fmt, ", ")?; } let param_name = param_name.as_ref().map(Vec::as_slice); - print_til_type(fmt, section, param_name, param, true, false)?; + print_til_type(fmt, section, param_name, param, true, false, true)?; } if til_type.calling_convention == Some(CallingConvention::Ellipsis) { if !til_type.args.is_empty() { @@ -546,6 +564,7 @@ fn print_til_type_array( &til_array.elem_type, print_pointer_space, print_type_prefix, + true, )?; if let Some(name) = name { write!(fmt, " ")?; @@ -564,6 +583,7 @@ fn print_til_type_typedef( section: &TILSection, name: Option<&[u8]>, typedef: &Typedef, + print_prefix: bool, ) -> Result<()> { // only print prefix, if is root match typedef { @@ -571,12 +591,12 @@ fn print_til_type_typedef( let ty = section .get_ord(idb_rs::id0::Id0TilOrd { ord: (*ord).into() }) .unwrap(); - print_til_type_name(fmt, &ty.name, &ty.tinfo, false)?; + print_til_type_name(fmt, &ty.name, &ty.tinfo, print_prefix)?; } idb_rs::til::Typedef::Name(name) => { let ty = section.get_name(name); match ty { - Some(ty) => print_til_type_name(fmt, &ty.name, &ty.tinfo, false)?, + Some(ty) => print_til_type_name(fmt, &ty.name, &ty.tinfo, print_prefix)?, // if we can't find the type, just print the name None => write!(fmt, "{}", core::str::from_utf8(name).unwrap())?, } @@ -594,6 +614,7 @@ fn print_til_type_struct( section: &TILSection, name: Option<&[u8]>, til_struct: &Struct, + print_name: bool, ) -> Result<()> { write!(fmt, "struct ")?; if til_struct.is_unaligned { @@ -615,12 +636,23 @@ fn print_til_type_struct( write!(fmt, "__other({others:04x}) ")?; } if let Some(name) = name { - fmt.write_all(name)?; + if print_name { + fmt.write_all(name)?; + write!(fmt, " ")?; + } } - write!(fmt, " {{")?; + write!(fmt, "{{")?; for member in &til_struct.members { - let name = member.name.as_ref().map(Vec::as_slice); - print_til_type(fmt, section, name, &member.member_type, true, false)?; + let member_name = member.name.as_ref().map(Vec::as_slice); + print_til_type_complex_member( + fmt, + section, + name, + member_name, + &member.member_type, + true, + true, + )?; if let Some(att) = &member.att { print_til_struct_member_att(fmt, &member.member_type, att)?; } @@ -634,23 +666,115 @@ fn print_til_type_union( section: &TILSection, name: Option<&[u8]>, til_union: &Union, + print_name: bool, ) -> Result<()> { write!(fmt, "union ")?; if let Some(align) = til_union.alignment { write!(fmt, "__attribute__((aligned({align}))) ")?; } if let Some(name) = name { - fmt.write_all(name)?; + if print_name { + fmt.write_all(name)?; + write!(fmt, " ")?; + } } - write!(fmt, " {{")?; + write!(fmt, "{{")?; for (member_name, member) in &til_union.members { let member_name = member_name.as_ref().map(Vec::as_slice); - print_til_type(fmt, section, member_name, member, true, false)?; + print_til_type_complex_member(fmt, section, name, member_name, member, true, true)?; write!(fmt, ";")?; } write!(fmt, "}}") } +// just print the type, unless we want to embed it +fn print_til_type_complex_member( + fmt: &mut impl Write, + section: &TILSection, + parent_name: Option<&[u8]>, + name: Option<&[u8]>, + til: &Type, + print_pointer_space: bool, + print_name: bool, +) -> Result<()> { + // if parent is not named, don't embeded it, because we can verify if it's part + // of the parent + let Some(parent_name) = parent_name else { + return print_til_type( + fmt, + section, + name, + til, + print_pointer_space, + false, + print_name, + ); + }; + let qualified_parent_name: Vec<_> = parent_name.iter().chain(b"::").copied().collect(); + + // TODO if the field is named, don't embeded it? + if name.is_some() { + return print_til_type( + fmt, + section, + name, + til, + print_pointer_space, + false, + print_name, + ); + } + + // if typedef of complex ref, we may want to embed the definition inside the type + // otherwise just print the type regularly + let typedef = match &til.type_variant { + TypeVariant::EnumRef(typedef) + | TypeVariant::StructRef(typedef) + | TypeVariant::UnionRef(typedef) + | TypeVariant::Typedef(typedef) => typedef, + _ => { + return print_til_type( + fmt, + section, + name, + til, + print_pointer_space, + false, + print_name, + ); + } + }; + + let inner_type = match typedef { + Typedef::Ordinal(ord) => section.get_ord(Id0TilOrd { ord: (*ord).into() }).unwrap(), + Typedef::Name(name) => section.get_name(name).unwrap(), + }; + + // if the inner_type name is in the format `parent_name::something_else` then + // we embed it + if !inner_type.name.starts_with(&qualified_parent_name) { + return print_til_type( + fmt, + section, + name, + til, + print_pointer_space, + false, + print_name, + ); + } + + print_til_type( + fmt, + section, + Some(&inner_type.name), + &inner_type.tinfo, + print_pointer_space, + true, + false, + ) +} + fn print_til_type_enum( fmt: &mut impl Write, section: &TILSection, From f8ec1b882f7330f04d99553e1da981e968f118cd Mon Sep 17 00:00:00 2001 From: rbran Date: Thu, 2 Jan 2025 10:32:33 -0300 Subject: [PATCH 06/53] fix tilib unamed complex ref types definitions --- src/til.rs | 6 ++-- src/til/section.rs | 2 +- src/tools/tilib.rs | 79 +++++++++++++++++++++++++++++++++++----------- 3 files changed, 66 insertions(+), 21 deletions(-) diff --git a/src/til.rs b/src/til.rs index b03e7ea..b441cf9 100644 --- a/src/til.rs +++ b/src/til.rs @@ -447,7 +447,7 @@ impl Basic { pub enum Typedef { // TODO make this a `Id0TilOrd` Ordinal(u32), - Name(Vec), + Name(Option>), } impl Typedef { @@ -462,7 +462,9 @@ impl Typedef { } Ok(Typedef::Ordinal(de)) } - _ => Ok(Typedef::Name(buf)), + _ => Ok(Typedef::Name( + buf.is_empty().then_some(None).unwrap_or(Some(buf)), + )), } } } diff --git a/src/til/section.rs b/src/til/section.rs index 7c0d5d1..553a02e 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -796,7 +796,7 @@ impl<'a> TILTypeSizeSolver<'a> { let idx = match typedef { Typedef::Name(name) => { // NOTE missing names may indicate a external type, just return no size - self.section.get_name_idx(name)? + self.section.get_name_idx(name.as_ref()?)? } Typedef::Ordinal(ord) => self .section diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 432c357..c81cadd 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -37,11 +37,12 @@ pub fn tilib_print(args: &Args) -> anyhow::Result<()> { fn print_til_section(mut fmt: impl Write, section: &TILSection) -> Result<()> { if let Some(dependency) = §ion.dependency { - let dep = core::str::from_utf8(dependency).unwrap(); // TODO open those files? What todo with then? // TODO some files still missing this warning - if !dep.is_empty() { - writeln!(fmt, "Warning: {dep}: No such file or directory")?; + if !dependency.is_empty() { + write!(fmt, "Warning: ")?; + fmt.write_all(dependency)?; + writeln!(fmt, ": No such file or directory")?; } } @@ -77,11 +78,9 @@ fn print_til_section(mut fmt: impl Write, section: &TILSection) -> Result<()> { fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { // the description of the file // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b710 - writeln!( - fmt, - "Description: {}", - core::str::from_utf8(§ion.title).unwrap() - )?; + write!(fmt, "Description: ")?; + fmt.write_all(§ion.title)?; + writeln!(fmt)?; // flags from the section header // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b721 @@ -254,6 +253,7 @@ fn print_types( section: &TILSection, solver: &mut TILTypeSizeSolver<'_>, ) -> Result<()> { + // TODO only print by ordinals if there are ordinals writeln!(fmt, "(enumerated by ordinals)")?; print_types_by_ordinals(fmt, section, solver)?; writeln!(fmt, "(enumerated by names)")?; @@ -342,6 +342,9 @@ fn print_til_type_root( // TODO: if a is a typedef and ComplexRef or something like it, also print typedef match &til_type.type_variant { TypeVariant::Struct(_) | TypeVariant::Union(_) | TypeVariant::Enum(_) => {} + TypeVariant::StructRef(Typedef::Name(None)) + | TypeVariant::UnionRef(Typedef::Name(None)) + | TypeVariant::EnumRef(Typedef::Name(None)) => {} // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x443906 _ => write!(fmt, "typedef ")?, } @@ -387,10 +390,14 @@ fn print_til_type( TypeVariant::Typedef(ref_type) => { print_til_type_typedef(fmt, section, name, ref_type, false) } - TypeVariant::UnionRef(ref_type) - | TypeVariant::EnumRef(ref_type) - | TypeVariant::StructRef(ref_type) => { - print_til_type_typedef(fmt, section, name, ref_type, true) + TypeVariant::UnionRef(ref_type) => { + print_til_type_complex_ref(fmt, section, name, ref_type, "union", true) + } + TypeVariant::EnumRef(ref_type) => { + print_til_type_complex_ref(fmt, section, name, ref_type, "enum", true) + } + TypeVariant::StructRef(ref_type) => { + print_til_type_complex_ref(fmt, section, name, ref_type, "struct", true) } TypeVariant::Struct(til_struct) => { print_til_type_struct(fmt, section, name, til_struct, print_name) @@ -593,12 +600,15 @@ fn print_til_type_typedef( .unwrap(); print_til_type_name(fmt, &ty.name, &ty.tinfo, print_prefix)?; } - idb_rs::til::Typedef::Name(name) => { + idb_rs::til::Typedef::Name(None) => { + // TODO print nothing? + } + idb_rs::til::Typedef::Name(Some(name)) => { let ty = section.get_name(name); match ty { Some(ty) => print_til_type_name(fmt, &ty.name, &ty.tinfo, print_prefix)?, // if we can't find the type, just print the name - None => write!(fmt, "{}", core::str::from_utf8(name).unwrap())?, + None => write!(fmt, "{}", String::from_utf8_lossy(name))?, } } } @@ -609,6 +619,28 @@ fn print_til_type_typedef( Ok(()) } +fn print_til_type_complex_ref( + fmt: &mut impl Write, + section: &TILSection, + name: Option<&[u8]>, + typedef: &Typedef, + prefix_name: &str, + print_prefix: bool, +) -> Result<()> { + if let idb_rs::til::Typedef::Name(None) = typedef { + if print_prefix { + write!(fmt, "{}", prefix_name)?; + if let Some(name) = name { + write!(fmt, " ")?; + fmt.write_all(name)?; + } + } + } else { + print_til_type_typedef(fmt, section, name, typedef, print_prefix)?; + } + Ok(()) +} + fn print_til_type_struct( fmt: &mut impl Write, section: &TILSection, @@ -747,7 +779,18 @@ fn print_til_type_complex_member( let inner_type = match typedef { Typedef::Ordinal(ord) => section.get_ord(Id0TilOrd { ord: (*ord).into() }).unwrap(), - Typedef::Name(name) => section.get_name(name).unwrap(), + Typedef::Name(None) => { + return print_til_type( + fmt, + section, + name, + til, + print_pointer_space, + false, + print_name, + ); + } + Typedef::Name(Some(name)) => section.get_name(name).unwrap(), }; // if the inner_type name is in the format `parent_name::something_else` then @@ -884,12 +927,12 @@ fn print_til_type_name( fn print_til_type_only(fmt: &mut impl Write, section: &TILSection, tinfo: &Type) -> Result<()> { match &tinfo.type_variant { - TypeVariant::Typedef(Typedef::Name(name)) => { - write!(fmt, "{}", String::from_utf8_lossy(name))?; + TypeVariant::Typedef(Typedef::Name(Some(name))) => { + fmt.write_all(name)?; } TypeVariant::Typedef(Typedef::Ordinal(ord)) => { let ty = section.get_ord(Id0TilOrd { ord: (*ord).into() }).unwrap(); - write!(fmt, "{}", String::from_utf8_lossy(&ty.name))?; + fmt.write_all(&ty.name)?; } _ => {} }; From 3e9ea5e28bdc3d6b3553d683a2edfda7af7ee833 Mon Sep 17 00:00:00 2001 From: rbran Date: Thu, 2 Jan 2025 10:36:15 -0300 Subject: [PATCH 07/53] follow clippy sugestions --- src/til.rs | 25 ++++++++++++++----------- src/tools/tilib.rs | 4 ++-- 2 files changed, 16 insertions(+), 13 deletions(-) diff --git a/src/til.rs b/src/til.rs index b441cf9..ec3640f 100644 --- a/src/til.rs +++ b/src/til.rs @@ -78,11 +78,12 @@ impl TILTypeInfo { let fieldcmts = cursor.read_c_string_raw()?; let sclass: u8 = cursor.read_u8()?; - let mut fields_iter = fields - .into_iter() - .map(|field| field.is_empty().then_some(None).unwrap_or(Some(field))); + let mut fields_iter = + fields + .into_iter() + .map(|field| if field.is_empty() { None } else { Some(field) }); let tinfo = Type::new(til, tinfo_raw, &mut fields_iter)?; - ensure!(fields_iter.next() == None, "Extra fields found for til"); + ensure!(fields_iter.next().is_none(), "Extra fields found for til"); Ok(Self { _flags: flags, @@ -180,11 +181,15 @@ impl Type { )); } } - let mut fields_iter = fields - .into_iter() - .map(|field| field.is_empty().then_some(None).unwrap_or(Some(field))); + let mut fields_iter = + fields + .into_iter() + .map(|field| if field.is_empty() { None } else { Some(field) }); let result = Self::new(&header, type_raw, &mut fields_iter)?; - ensure!(fields_iter.next() == None, "Extra fields found for id0 til"); + ensure!( + fields_iter.next().is_none(), + "Extra fields found for id0 til" + ); Ok(result) } } @@ -462,9 +467,7 @@ impl Typedef { } Ok(Typedef::Ordinal(de)) } - _ => Ok(Typedef::Name( - buf.is_empty().then_some(None).unwrap_or(Some(buf)), - )), + _ => Ok(Typedef::Name(if buf.is_empty() { None } else { Some(buf) })), } } } diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index c81cadd..ae9dd57 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -675,7 +675,7 @@ fn print_til_type_struct( } write!(fmt, "{{")?; for member in &til_struct.members { - let member_name = member.name.as_ref().map(Vec::as_slice); + let member_name = member.name.as_deref(); print_til_type_complex_member( fmt, section, @@ -712,7 +712,7 @@ fn print_til_type_union( } write!(fmt, "{{")?; for (member_name, member) in &til_union.members { - let member_name = member_name.as_ref().map(Vec::as_slice); + let member_name = member_name.as_deref(); print_til_type_complex_member(fmt, section, name, member_name, member, true, true)?; write!(fmt, ";")?; } From 5ff66145da2ac0d3029f5c75b14e21f3394061b3 Mon Sep 17 00:00:00 2001 From: rbran Date: Thu, 2 Jan 2025 12:58:28 -0300 Subject: [PATCH 08/53] add til type ext att offset --- src/til/struct.rs | 65 ++++++++++++++++++++++++++++++++++++++++++++++ src/tools/tilib.rs | 50 +++++++++++++++++++++++++++++++---- 2 files changed, 110 insertions(+), 5 deletions(-) diff --git a/src/til/struct.rs b/src/til/struct.rs index b06d3c9..2311ad0 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -231,8 +231,23 @@ pub enum StructMemberAtt { }, } +// InnerRef InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x720880 #[derive(Clone, Copy, Debug)] pub enum StructMemberAttBasic { + // 0x0 0x1 "__bin" + // 0x0 0x2 "__oct" + // 0x0 0x3 "__hex" + // 0x0 0x404 "__dec" + // 0x0 0x5 "__float" + // 0x0 0x6 "__char" + // 0x0 0x7 "__segm" + // 0x6 0x8 "__enum" + // 0x0 0x9 "__off" + // 0x8 0x9 "__offset" + // 0x8 0xa "__strlit" + // 0x8 0xb "__stroff" + // 0x8 0xc "__custom" + // 0x0 0x100 "__invsign" Var1(u64), Var2 { att: u64, @@ -245,6 +260,7 @@ pub enum StructMemberAttBasic { impl StructMemberAtt { pub fn str_type(self) -> Option { match self { + // 0x8 0xa "__strlit" StructMemberAtt::VarAorC { val1, att0: StructMemberAttBasic::Var1(0xa), @@ -252,6 +268,55 @@ impl StructMemberAtt { _ => None, } } + pub fn offset_type(self) -> Option { + match self { + // 0x8 0x9 "__offset" + StructMemberAtt::Var9 { + val1, + att0: None, + att1: 0, + att2: u64::MAX, + } => Some(ExtAttOffset { + offset: (val1 & 0xf) as u8, + flag: val1 & !0xf, + }), + _ => None, + } + } +} + +#[derive(Clone, Copy, Debug)] +pub struct ExtAttOffset { + pub offset: u8, + // InnerRef InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x720aa0 + flag: u32, +} + +impl ExtAttOffset { + pub fn is_rvaoff(&self) -> bool { + self.flag & 0x10 != 0 + } + pub fn is_pastend(&self) -> bool { + self.flag & 0x20 != 0 + } + pub fn is_nobase(&self) -> bool { + self.flag & 0x80 != 0 + } + pub fn is_subtract(&self) -> bool { + self.flag & 0x100 != 0 + } + pub fn is_signedop(&self) -> bool { + self.flag & 0x200 != 0 + } + pub fn is_nozeroes(&self) -> bool { + self.flag & 0x400 != 0 + } + pub fn is_noones(&self) -> bool { + self.flag & 0x800 != 0 + } + pub fn is_selfref(&self) -> bool { + self.flag & 0x1000 != 0 + } } #[derive(Clone, Copy, Debug, FromPrimitive, IntoPrimitive)] diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index ae9dd57..b228d37 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -231,7 +231,7 @@ fn print_symbols( // _ => "?!", //}; let sym_kind = " "; - write!(fmt, "{}", sym_kind)?; + write!(fmt, " {} ", sym_kind)?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a3a print_til_type( @@ -877,6 +877,7 @@ fn print_til_type_enum( write!(fmt, "}}") } +// InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x423c20 fn print_til_struct_member_att( fmt: &mut impl Write, tinfo: &Type, @@ -885,6 +886,8 @@ fn print_til_struct_member_att( match &tinfo.type_variant { TypeVariant::Pointer(pointer) => match &pointer.typ.type_variant { TypeVariant::Basic(Basic::Char) => print_til_struct_member_string_att(fmt, att)?, + // TODO is valid for other then void? + TypeVariant::Basic(Basic::Void) => print_til_struct_member_void_pointer_att(fmt, att)?, _ => {} }, TypeVariant::Array(array) => match &array.elem_type.type_variant { @@ -896,12 +899,49 @@ fn print_til_struct_member_att( Ok(()) } +// InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4872f0 fn print_til_struct_member_string_att(fmt: &mut impl Write, att: &StructMemberAtt) -> Result<()> { - let Some(value) = att.str_type() else { - // todo att is unknown - return Ok(()); + if let Some(value) = att.str_type() { + write!(fmt, " __strlit(0x{:08X})", value.as_strlib())?; }; - write!(fmt, " __strlit(0x{:08X})", value.as_strlib()) + Ok(()) +} + +fn print_til_struct_member_void_pointer_att( + fmt: &mut impl Write, + att: &StructMemberAtt, +) -> Result<()> { + if let Some(value) = att.offset_type() { + write!(fmt, " __offset({:#X}", value.offset)?; + // InnerRef InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x720aa0 + if value.is_rvaoff() { + write!(fmt, "|RVAOFF")?; + } + if value.is_pastend() { + write!(fmt, "|PASTEND")?; + } + if value.is_nobase() { + write!(fmt, "|NOBASE")?; + } + if value.is_subtract() { + write!(fmt, "|SUBTRACT")?; + } + if value.is_signedop() { + write!(fmt, "|SIGNEDOP")?; + } + if value.is_nozeroes() { + write!(fmt, "|NOZEROES")?; + } + if value.is_noones() { + write!(fmt, "|NOONES")?; + } + if value.is_selfref() { + write!(fmt, "|SELFREF")?; + } + write!(fmt, ")")?; + } + + return Ok(()); } fn print_til_type_name( From c0dee1ff0578441fdfcb1ed20205a1197cd2d2a8 Mon Sep 17 00:00:00 2001 From: rbran Date: Thu, 2 Jan 2025 14:12:36 -0300 Subject: [PATCH 09/53] add til basic type ext att parsing --- src/til/struct.rs | 114 +++++++++++++++++++++++++++++++++++++------ src/tools/tilib.rs | 118 +++++++++++++++++++++++++++++++++------------ 2 files changed, 185 insertions(+), 47 deletions(-) diff --git a/src/til/struct.rs b/src/til/struct.rs index 2311ad0..9a56c1a 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -4,7 +4,7 @@ use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeRaw, SDACL}; use anyhow::{anyhow, Result}; -use num_enum::{FromPrimitive, IntoPrimitive}; +use num_enum::{FromPrimitive, IntoPrimitive, TryFromPrimitive}; use super::{StructModifierRaw, TypeVariantRaw}; @@ -217,7 +217,6 @@ impl StructMemberRaw { #[derive(Clone, Copy, Debug)] pub enum StructMemberAtt { - // Var0to7(Var1(0)) seems to indicate a "None" kind of value Var0to7(StructMemberAttBasic), Var9 { val1: u32, @@ -234,20 +233,6 @@ pub enum StructMemberAtt { // InnerRef InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x720880 #[derive(Clone, Copy, Debug)] pub enum StructMemberAttBasic { - // 0x0 0x1 "__bin" - // 0x0 0x2 "__oct" - // 0x0 0x3 "__hex" - // 0x0 0x404 "__dec" - // 0x0 0x5 "__float" - // 0x0 0x6 "__char" - // 0x0 0x7 "__segm" - // 0x6 0x8 "__enum" - // 0x0 0x9 "__off" - // 0x8 0x9 "__offset" - // 0x8 0xa "__strlit" - // 0x8 0xb "__stroff" - // 0x8 0xc "__custom" - // 0x0 0x100 "__invsign" Var1(u64), Var2 { att: u64, @@ -283,6 +268,22 @@ impl StructMemberAtt { _ => None, } } + + pub fn basic(self) -> Option { + match self { + StructMemberAtt::Var0to7(StructMemberAttBasic::Var1(raw)) => { + ExtAttBasic::from_raw(raw, None) + } + // 0x9 0x1000 "__tabform" + StructMemberAtt::Var0to7(StructMemberAttBasic::Var2 { + att, + val1, + val2, + val3: u32::MAX, + }) if att & 0x1000 != 0 => ExtAttBasic::from_raw(att & !0x1000, Some((val1, val2))), + _ => None, + } + } } #[derive(Clone, Copy, Debug)] @@ -336,3 +337,84 @@ impl StringType { self.into() } } + +#[derive(Clone, Copy, Debug)] +pub struct ExtAttBasic { + pub fmt: ExtAttBasicFmt, + pub tabform: Option, + pub is_signed: bool, + pub is_inv_sign: bool, + pub is_inv_bits: bool, + pub is_lzero: bool, +} +impl ExtAttBasic { + fn from_raw(value: u64, val1: Option<(u32, u32)>) -> Option { + use ExtAttBasicFmt::*; + let fmt = match value & 0xf { + 0x1 => Bin, + 0x2 => Oct, + 0x3 => Hex, + 0x4 => Dec, + 0x5 => Float, + 0x6 => Char, + 0x7 => Segm, + 0x9 => Off, + _ => return None, + }; + let is_inv_sign = value & 0x100 != 0; + let is_inv_bits = value & 0x200 != 0; + let is_signed = value & 0x400 != 0; + let is_lzero = value & 0x800 != 0; + + let tabform = val1.map(|(val1, val2)| { + let val1 = ExtAttBasicTabformVal1::try_from_primitive(val1.try_into().ok()?).ok()?; + Some(ExtAttBasicTabform { val1, val2 }) + }); + let tabform = match tabform { + // convert correctly + Some(Some(val)) => Some(val), + // coud not convert, return nothing + Some(None) => return None, + // there is no tabform + None => None, + }; + + // TODO panic on unknown values? + Some(Self { + fmt, + tabform, + is_signed, + is_inv_sign, + is_inv_bits, + is_lzero, + }) + } +} + +#[derive(Clone, Copy, Debug)] +pub enum ExtAttBasicFmt { + Bin, + Oct, + Hex, + Dec, + Float, + Char, + Segm, + Off, +} + +#[derive(Clone, Copy, Debug)] +pub struct ExtAttBasicTabform { + pub val1: ExtAttBasicTabformVal1, + pub val2: u32, +} + +#[derive(Clone, Copy, Debug, TryFromPrimitive, IntoPrimitive)] +#[repr(u8)] +pub enum ExtAttBasicTabformVal1 { + NODUPS = 0, + HEX = 1, + DEC = 2, + OCT = 3, + BIN = 4, +} diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index b228d37..9efcb4a 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -884,6 +884,7 @@ fn print_til_struct_member_att( att: &StructMemberAtt, ) -> Result<()> { match &tinfo.type_variant { + TypeVariant::Basic(_) => print_til_struct_member_basic_att(fmt, att)?, TypeVariant::Pointer(pointer) => match &pointer.typ.type_variant { TypeVariant::Basic(Basic::Char) => print_til_struct_member_string_att(fmt, att)?, // TODO is valid for other then void? @@ -901,9 +902,11 @@ fn print_til_struct_member_att( // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4872f0 fn print_til_struct_member_string_att(fmt: &mut impl Write, att: &StructMemberAtt) -> Result<()> { - if let Some(value) = att.str_type() { - write!(fmt, " __strlit(0x{:08X})", value.as_strlib())?; + let Some(value) = att.str_type() else { + // TODO don't ignore errors + return Ok(()); }; + write!(fmt, " __strlit(0x{:08X})", value.as_strlib())?; Ok(()) } @@ -911,37 +914,90 @@ fn print_til_struct_member_void_pointer_att( fmt: &mut impl Write, att: &StructMemberAtt, ) -> Result<()> { - if let Some(value) = att.offset_type() { - write!(fmt, " __offset({:#X}", value.offset)?; - // InnerRef InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x720aa0 - if value.is_rvaoff() { - write!(fmt, "|RVAOFF")?; - } - if value.is_pastend() { - write!(fmt, "|PASTEND")?; - } - if value.is_nobase() { - write!(fmt, "|NOBASE")?; - } - if value.is_subtract() { - write!(fmt, "|SUBTRACT")?; - } - if value.is_signedop() { - write!(fmt, "|SIGNEDOP")?; - } - if value.is_nozeroes() { - write!(fmt, "|NOZEROES")?; - } - if value.is_noones() { - write!(fmt, "|NOONES")?; - } - if value.is_selfref() { - write!(fmt, "|SELFREF")?; - } - write!(fmt, ")")?; + let Some(value) = att.offset_type() else { + // TODO don't ignore errors + return Ok(()); + }; + write!(fmt, " __offset({:#X}", value.offset)?; + // InnerRef InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x720aa0 + if value.is_rvaoff() { + write!(fmt, "|RVAOFF")?; + } + if value.is_pastend() { + write!(fmt, "|PASTEND")?; + } + if value.is_nobase() { + write!(fmt, "|NOBASE")?; + } + if value.is_subtract() { + write!(fmt, "|SUBTRACT")?; + } + if value.is_signedop() { + write!(fmt, "|SIGNEDOP")?; + } + if value.is_nozeroes() { + write!(fmt, "|NOZEROES")?; + } + if value.is_noones() { + write!(fmt, "|NOONES")?; } + if value.is_selfref() { + write!(fmt, "|SELFREF")?; + } + write!(fmt, ")")?; + Ok(()) +} + +fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt) -> Result<()> { + let Some(basic_att) = att.basic() else { + write!(fmt, " {att:x?}")?; + // TODO don't ignore errors + return Ok(()); + }; + + use idb_rs::til::r#struct::ExtAttBasicFmt::*; + if basic_att.is_inv_bits { + write!(fmt, " __invbits")? + } + if basic_att.is_inv_sign { + write!(fmt, " __invsign")? + } + if basic_att.is_lzero { + write!(fmt, " __lzero")? + } + match (basic_att.fmt, basic_att.is_signed) { + (Bin, true) => write!(fmt, " __sbin")?, + (Bin, false) => write!(fmt, " __bin")?, + (Oct, true) => write!(fmt, " __soct")?, + (Oct, false) => write!(fmt, " __oct")?, + (Hex, true) => write!(fmt, " __shex")?, + (Hex, false) => write!(fmt, " __hex")?, + (Dec, true) => write!(fmt, " __dec")?, + (Dec, false) => write!(fmt, " __udec")?, + (Float, _) => write!(fmt, " __float")?, + (Char, _) => write!(fmt, " __char")?, + (Segm, _) => write!(fmt, " __segm")?, + (Off, _) => write!(fmt, " __off")?, + }; + match (basic_att.fmt, basic_att.is_signed) { + (_, false) => {} + // already included on the name + (Bin | Dec | Oct | Hex, _) => {} + (Float | Char | Segm | Off, true) => write!(fmt, " __signed")?, + }; - return Ok(()); + if let Some(tabform) = basic_att.tabform { + // InnerRef InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48857f + let val1 = match tabform.val1 { + idb_rs::til::r#struct::ExtAttBasicTabformVal1::NODUPS => "NODUPS", + idb_rs::til::r#struct::ExtAttBasicTabformVal1::HEX => "HEX", + idb_rs::til::r#struct::ExtAttBasicTabformVal1::DEC => "DEC", + idb_rs::til::r#struct::ExtAttBasicTabformVal1::OCT => "OCT", + idb_rs::til::r#struct::ExtAttBasicTabformVal1::BIN => "BIN", + }; + write!(fmt, " __tabform({val1},{})", tabform.val2)?; + } + Ok(()) } fn print_til_type_name( From 3319897adcf51169b4bf65b7d73a482b945239d8 Mon Sep 17 00:00:00 2001 From: rbran Date: Thu, 2 Jan 2025 14:53:08 -0300 Subject: [PATCH 10/53] fix tilib not removing "_" from some symbols --- src/tools/tilib.rs | 17 ++++++++--------- 1 file changed, 8 insertions(+), 9 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 9efcb4a..6848d35 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -233,16 +233,15 @@ fn print_symbols( let sym_kind = " "; write!(fmt, " {} ", sym_kind)?; + // TODO investiage this + let name = if symbol.ordinal == 0 && symbol.name.get(0) == Some(&b'_') { + // remove the first "_", if any + &symbol.name[1..] + } else { + &symbol.name + }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a3a - print_til_type( - fmt, - section, - Some(&symbol.name), - &symbol.tinfo, - true, - false, - true, - )?; + print_til_type(fmt, section, Some(name), &symbol.tinfo, true, false, true)?; writeln!(fmt, ";")?; } Ok(()) From a39825bea086b655f0834a5505d5bb88bb54a2ed Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 09:29:32 -0300 Subject: [PATCH 11/53] fix tilib missing prefix name for complex ref --- src/tools/tilib.rs | 17 +++++++++++++---- 1 file changed, 13 insertions(+), 4 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 6848d35..8b1b26b 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -387,7 +387,7 @@ fn print_til_type( print_type_prefix, ), TypeVariant::Typedef(ref_type) => { - print_til_type_typedef(fmt, section, name, ref_type, false) + print_til_type_typedef(fmt, section, name, ref_type, false, None) } TypeVariant::UnionRef(ref_type) => { print_til_type_complex_ref(fmt, section, name, ref_type, "union", true) @@ -480,7 +480,8 @@ fn print_til_type_pointer( print_type_prefix, true, )?; - if print_pointer_space { + // if the innertype is also a pointer, don't print the space + if print_pointer_space && !matches!(&pointer.typ.type_variant, TypeVariant::Pointer(_)) { write!(fmt, " ")?; } let modifier = match pointer.modifier { @@ -590,6 +591,7 @@ fn print_til_type_typedef( name: Option<&[u8]>, typedef: &Typedef, print_prefix: bool, + ref_prefix: Option<&str>, ) -> Result<()> { // only print prefix, if is root match typedef { @@ -607,7 +609,14 @@ fn print_til_type_typedef( match ty { Some(ty) => print_til_type_name(fmt, &ty.name, &ty.tinfo, print_prefix)?, // if we can't find the type, just print the name - None => write!(fmt, "{}", String::from_utf8_lossy(name))?, + None => { + if print_prefix { + if let Some(ref_prefix) = ref_prefix { + write!(fmt, "{ref_prefix} ")?; + } + } + write!(fmt, "{}", String::from_utf8_lossy(name))? + } } } } @@ -635,7 +644,7 @@ fn print_til_type_complex_ref( } } } else { - print_til_type_typedef(fmt, section, name, typedef, print_prefix)?; + print_til_type_typedef(fmt, section, name, typedef, print_prefix, Some(prefix_name))?; } Ok(()) } From 651f57935ed2dc6fa9ffab81f93a6998280cfe9e Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 09:40:31 -0300 Subject: [PATCH 12/53] fix tilib small formting issues --- src/tools/tilib.rs | 18 +++++++++++------- 1 file changed, 11 insertions(+), 7 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 8b1b26b..e8ac333 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -511,7 +511,10 @@ fn print_til_type_function( is_pointer: bool, ) -> Result<()> { // return type - print_til_type(fmt, section, None, &til_type.ret, false, true, true)?; + print_til_type(fmt, section, None, &til_type.ret, true, true, true)?; + if !matches!(&til_type.ret.type_variant, TypeVariant::Pointer(_)) { + write!(fmt, " ")?; + } let cc = match (section.cc, til_type.calling_convention) { // don't print if using the til section default cc @@ -526,10 +529,10 @@ fn print_til_type_function( // print name and calling convention match (is_pointer, cc) { - (true, None) => write!(fmt, " (*")?, - (false, None) => write!(fmt, " ")?, - (true, Some(cc)) => write!(fmt, " (__{cc} *")?, - (false, Some(cc)) => write!(fmt, " __{cc} ")?, + (true, None) => write!(fmt, "(*")?, + (false, None) => write!(fmt, "")?, + (true, Some(cc)) => write!(fmt, "(__{cc} *")?, + (false, Some(cc)) => write!(fmt, "__{cc} ")?, } if let Some(name) = name { fmt.write_all(name)?; @@ -843,6 +846,7 @@ fn print_til_type_enum( write!(fmt, "enum {output_fmt_name}")?; if let Some(name) = name { fmt.write_all(name)?; + write!(fmt, " ")?; } match (til_enum.storage_size, section.size_enum) { (None, None) => {} @@ -856,14 +860,14 @@ fn print_til_type_enum( .map(|x| x.max(1)) //can't have a value being represented in 0bits .unwrap_or(8); if bits_required / 8 < storage_size.get().into() { - write!(fmt, ": __int{}", storage_size.get() as usize * 8)?; + write!(fmt, ": __int{} ", storage_size.get() as usize * 8)?; } } } (None, Some(_)) => {} (Some(_), None) => {} } - write!(fmt, " {{")?; + write!(fmt, "{{")?; for (member_name, value) in &til_enum.members { if let Some(member_name) = member_name { fmt.write_all(member_name)?; From 65917c7362c7c8b25cfaf96bffc6ef0c8b45d877 Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 10:24:13 -0300 Subject: [PATCH 13/53] fix tilib enum format printing --- src/til/enum.rs | 15 ++++++++++++++- src/til/section.rs | 1 + src/tools/tilib.rs | 27 +++++++++------------------ 3 files changed, 24 insertions(+), 19 deletions(-) diff --git a/src/til/enum.rs b/src/til/enum.rs index 65d95bf..e6e7337 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -7,6 +7,8 @@ use anyhow::{anyhow, ensure}; #[derive(Clone, Debug)] pub struct Enum { + pub is_signed: bool, + pub is_unsigned: bool, pub output_format: EnumFormat, pub members: Vec<(Option>, u64)>, pub groups: Option>, @@ -26,6 +28,8 @@ impl Enum { .map(|member| (fields.next().flatten(), member)) .collect(); Ok(Self { + is_signed: value.is_signed, + is_unsigned: value.is_unsigned, output_format: value.output_format, members, groups: value.groups, @@ -36,6 +40,8 @@ impl Enum { #[derive(Clone, Debug)] pub(crate) struct EnumRaw { + is_signed: bool, + is_unsigned: bool, output_format: EnumFormat, groups: Option>, members: Vec, @@ -72,7 +78,7 @@ impl EnumRaw { "Enum BTE missing the Always sub-field" ); let storage_size: Option = match bte & BTE_SIZE_MASK { - 0 => header.size_enum, + 0 => None, emsize @ 1..=4 => Some((1 << (emsize - 1)).try_into().unwrap()), // Allowed at InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4523c8 deserialize_enum 5..=7 => return Err(anyhow!("BTE emsize with reserved values")), @@ -96,6 +102,11 @@ impl EnumRaw { _ => unreachable!(), }; + // TODO ensure no bits from bte or taenum_bits are unparsed + let is_signed = taenum_bits.0 & TAENUM_SIGNED != 0; + let is_unsigned = taenum_bits.0 & TAENUM_UNSIGNED != 0; + // TODO ensure only signed/unsigned is allowed? + // let is_64 = (taenum_bits.0 & TAENUM_64BIT) != 0; let mut low_acc: u32 = 0; let mut high_acc: u32 = 0; @@ -123,6 +134,8 @@ impl EnumRaw { .collect::>()?; Ok(TypeVariantRaw::Enum(EnumRaw { + is_signed, + is_unsigned, output_format, members, groups, diff --git a/src/til/section.rs b/src/til/section.rs index 553a02e..b8fe97a 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -293,6 +293,7 @@ impl TILSection { title, description, compiler_id: header2.compiler_id, + // TODO panic if None? size_enum: header2.size_enum.try_into().ok(), size_int: header2.size_int.try_into()?, size_bool: header2.size_bool.try_into()?, diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index e8ac333..d37c4b2 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -848,24 +848,15 @@ fn print_til_type_enum( fmt.write_all(name)?; write!(fmt, " ")?; } - match (til_enum.storage_size, section.size_enum) { - (None, None) => {} - (Some(storage_size), Some(size_enum)) => { - if storage_size != size_enum { - let bits_required = til_enum - .members - .iter() - .map(|(_, value)| u64::BITS - value.leading_zeros()) - .max() - .map(|x| x.max(1)) //can't have a value being represented in 0bits - .unwrap_or(8); - if bits_required / 8 < storage_size.get().into() { - write!(fmt, ": __int{} ", storage_size.get() as usize * 8)?; - } - } - } - (None, Some(_)) => {} - (Some(_), None) => {} + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4443b0 + if til_enum.storage_size.is_some() || til_enum.is_signed || til_enum.is_unsigned { + let bytes = til_enum.storage_size.or(section.size_enum).unwrap(); + let signed = if til_enum.is_unsigned { + "unsigned " + } else { + "" + }; + write!(fmt, ": {signed}__int{} ", bytes.get() as usize * 8)?; } write!(fmt, "{{")?; for (member_name, value) in &til_enum.members { From 43982681bd6c40928a77c7cd8d3731bd1586241d Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 11:39:26 -0300 Subject: [PATCH 14/53] fix tilib missing vft flag --- src/tools/tilib.rs | 27 ++++++++++++++++++++++++++- 1 file changed, 26 insertions(+), 1 deletion(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index d37c4b2..0f936da 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -499,6 +499,11 @@ fn print_til_type_pointer( if let Some(name) = name { fmt.write_all(name)?; } + + // if the pointed type itself is a VFT then the pointer need to print that + if is_vft(section, &pointer.typ) { + write!(fmt, " /*VFT*/")?; + } } Ok(()) } @@ -953,7 +958,6 @@ fn print_til_struct_member_void_pointer_att( fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt) -> Result<()> { let Some(basic_att) = att.basic() else { - write!(fmt, " {att:x?}")?; // TODO don't ignore errors return Ok(()); }; @@ -1121,3 +1125,24 @@ fn print_types_total(fmt: &mut impl Write, section: &TILSection) -> Result<()> { "Total {symbols_num} symbols, {types_num} types, {macros_num} macros" ) } + +fn is_vft(section: &TILSection, typ: &Type) -> bool { + match &typ.type_variant { + // propagate the search? + //TypeVariant::Pointer(pointer) => todo!(), + // TODO struct with only function-pointers is also vftable? + TypeVariant::Struct(ty) => ty.is_vftable, + TypeVariant::Typedef(typedef) | TypeVariant::StructRef(typedef) => { + let inner_type = match typedef { + Typedef::Ordinal(ord) => section.get_ord(Id0TilOrd { ord: (*ord).into() }), + Typedef::Name(None) => return false, + Typedef::Name(Some(name)) => section.get_name(name), + }; + let Some(inner_type) = inner_type else { + return false; + }; + is_vft(section, &inner_type.tinfo) + } + _ => false, + } +} From f84cb0a15752aa049c1721934f5747fd73ff7f6d Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 12:14:07 -0300 Subject: [PATCH 15/53] add tilib bitfield implementation --- src/til/bitfield.rs | 6 ++- src/tools/tilib.rs | 100 +++++++++++++++++++++++++++----------------- 2 files changed, 66 insertions(+), 40 deletions(-) diff --git a/src/til/bitfield.rs b/src/til/bitfield.rs index 6c457d3..0bd7a1b 100644 --- a/src/til/bitfield.rs +++ b/src/til/bitfield.rs @@ -1,3 +1,5 @@ +use std::num::NonZeroU8; + use crate::ida_reader::IdaGenericBufUnpack; use crate::til::TAH; @@ -5,7 +7,7 @@ use crate::til::TAH; pub struct Bitfield { pub unsigned: bool, pub width: u16, - pub nbytes: i32, + pub nbytes: NonZeroU8, } impl Bitfield { @@ -25,7 +27,7 @@ impl Bitfield { Ok(Self { unsigned, width, - nbytes, + nbytes: nbytes.try_into().unwrap(), }) } } diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 0f936da..532d14d 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -1,5 +1,6 @@ use idb_rs::id0::{Compiler, Id0TilOrd}; use idb_rs::til::array::Array; +use idb_rs::til::bitfield::Bitfield; use idb_rs::til::function::{CallingConvention, Function}; use idb_rs::til::pointer::Pointer; use idb_rs::til::r#enum::Enum; @@ -405,7 +406,7 @@ fn print_til_type( print_til_type_union(fmt, section, name, til_union, print_name) } TypeVariant::Enum(til_enum) => print_til_type_enum(fmt, section, name, til_enum), - TypeVariant::Bitfield(_bitfield) => write!(fmt, "todo!(\"Bitfield\")"), + TypeVariant::Bitfield(bitfield) => print_til_type_bitfield(fmt, name, bitfield), } } @@ -415,44 +416,9 @@ fn print_til_type_basic( name: Option<&[u8]>, til_basic: &Basic, ) -> Result<()> { - const fn signed_name(is_signed: Option) -> &'static str { - match is_signed { - Some(true) | None => "", - Some(false) => "unsigned ", - } - } - - let name_space = if name.is_some() { " " } else { "" }; - match til_basic { - Basic::Bool => write!(fmt, "bool{name_space}",)?, - Basic::Char => write!(fmt, "char{name_space}",)?, - Basic::Short { is_signed } => write!(fmt, "{}short{name_space}", signed_name(*is_signed))?, - Basic::Void => write!(fmt, "void{name_space}",)?, - Basic::SegReg => write!(fmt, "SegReg{name_space}")?, - Basic::Unknown { bytes: 1 } => write!(fmt, "_BYTE{name_space}")?, - Basic::Unknown { bytes: 2 } => write!(fmt, "_WORD{name_space}")?, - Basic::Unknown { bytes: 4 } => write!(fmt, "_DWORD{name_space}")?, - Basic::Unknown { bytes: 8 } => write!(fmt, "_QWORD{name_space}")?, - Basic::Unknown { bytes } => write!(fmt, "unknown{bytes}{name_space}")?, - Basic::Int { is_signed } => write!(fmt, "{}int{name_space}", signed_name(*is_signed))?, - Basic::Long { is_signed } => write!(fmt, "{}long{name_space}", signed_name(*is_signed))?, - Basic::LongLong { is_signed } => { - write!(fmt, "{}longlong{name_space}", signed_name(*is_signed))? - } - Basic::IntSized { bytes, is_signed } => { - if let Some(false) = is_signed { - write!(fmt, "unsigned ")?; - } - write!(fmt, "__int{}{name_space}", bytes.get() * 8)? - } - Basic::LongDouble => write!(fmt, "longfloat{name_space}")?, - Basic::Float { bytes } if bytes.get() == 4 => write!(fmt, "float{name_space}")?, - Basic::Float { bytes } if bytes.get() == 8 => write!(fmt, "double{name_space}")?, - Basic::Float { bytes } => write!(fmt, "float{bytes}{name_space}")?, - Basic::BoolSized { bytes } if bytes.get() == 1 => write!(fmt, "bool{name_space}")?, - Basic::BoolSized { bytes } => write!(fmt, "bool{bytes}{name_space}")?, - } + print_basic_type(fmt, til_basic)?; if let Some(name) = name { + write!(fmt, " ")?; fmt.write_all(name)?; } Ok(()) @@ -885,6 +851,26 @@ fn print_til_type_enum( write!(fmt, "}}") } +fn print_til_type_bitfield( + fmt: &mut impl Write, + name: Option<&[u8]>, + bitfield: &Bitfield, +) -> Result<()> { + print_basic_type( + fmt, + &Basic::IntSized { + bytes: bitfield.nbytes, + is_signed: Some(!bitfield.unsigned), + }, + )?; + if let Some(name) = name { + write!(fmt, " ")?; + fmt.write_all(name)?; + } + write!(fmt, " : {}", bitfield.width)?; + Ok(()) +} + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x423c20 fn print_til_struct_member_att( fmt: &mut impl Write, @@ -1146,3 +1132,41 @@ fn is_vft(section: &TILSection, typ: &Type) -> bool { _ => false, } } + +fn print_basic_type(fmt: &mut impl Write, til_basic: &Basic) -> Result<()> { + const fn signed_name(is_signed: Option) -> &'static str { + match is_signed { + Some(true) | None => "", + Some(false) => "unsigned ", + } + } + + match til_basic { + Basic::Bool => write!(fmt, "bool")?, + Basic::Char => write!(fmt, "char")?, + Basic::Short { is_signed } => write!(fmt, "{}short", signed_name(*is_signed))?, + Basic::Void => write!(fmt, "void")?, + Basic::SegReg => write!(fmt, "SegReg")?, + Basic::Unknown { bytes: 1 } => write!(fmt, "_BYTE")?, + Basic::Unknown { bytes: 2 } => write!(fmt, "_WORD")?, + Basic::Unknown { bytes: 4 } => write!(fmt, "_DWORD")?, + Basic::Unknown { bytes: 8 } => write!(fmt, "_QWORD")?, + Basic::Unknown { bytes } => write!(fmt, "unknown{bytes}")?, + Basic::Int { is_signed } => write!(fmt, "{}int", signed_name(*is_signed))?, + Basic::Long { is_signed } => write!(fmt, "{}long", signed_name(*is_signed))?, + Basic::LongLong { is_signed } => write!(fmt, "{}longlong", signed_name(*is_signed))?, + Basic::IntSized { bytes, is_signed } => { + if let Some(false) = is_signed { + write!(fmt, "unsigned ")?; + } + write!(fmt, "__int{}", bytes.get() * 8)? + } + Basic::LongDouble => write!(fmt, "longfloat")?, + Basic::Float { bytes } if bytes.get() == 4 => write!(fmt, "float")?, + Basic::Float { bytes } if bytes.get() == 8 => write!(fmt, "double")?, + Basic::Float { bytes } => write!(fmt, "float{bytes}")?, + Basic::BoolSized { bytes } if bytes.get() == 1 => write!(fmt, "bool")?, + Basic::BoolSized { bytes } => write!(fmt, "bool{bytes}")?, + } + Ok(()) +} From e813ba6582eba273e09aff178e2402cffccfb4e4 Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 12:42:53 -0300 Subject: [PATCH 16/53] add til struct unknown flag 8 --- src/til.rs | 12 ++++++++++-- src/til/struct.rs | 23 ++++++++++++++++------- src/tools/tilib.rs | 6 +++++- 3 files changed, 31 insertions(+), 10 deletions(-) diff --git a/src/til.rs b/src/til.rs index ec3640f..ad86749 100644 --- a/src/til.rs +++ b/src/til.rs @@ -676,6 +676,8 @@ pub struct StructModifierRaw { is_cpp_obj: bool, /// Virtual function table is_vftable: bool, + // TODO unknown meaning + is_unknown_8: bool, /// Alignment in bytes alignment: Option, /// other unknown value @@ -695,10 +697,15 @@ impl StructModifierRaw { let is_unaligned = value & TAUDT_UNALIGNED != 0; let is_vftable = value & TAUDT_VFTABLE != 0; let alignment_raw = value & TAUDT_ALIGN_MASK; + let is_unknown_8 = value & 0x8 != 0; let alignment = (alignment_raw != 0).then(|| NonZeroU8::new(1 << (alignment_raw - 1)).unwrap()); - let all_masks = - TAUDT_MSSTRUCT | TAUDT_CPPOBJ | TAUDT_UNALIGNED | TAUDT_VFTABLE | TAUDT_ALIGN_MASK; + let all_masks = TAUDT_MSSTRUCT + | TAUDT_CPPOBJ + | TAUDT_UNALIGNED + | TAUDT_VFTABLE + | TAUDT_ALIGN_MASK + | 0x8; let others = NonZeroU16::new(value & !all_masks); Self { is_unaligned, @@ -706,6 +713,7 @@ impl StructModifierRaw { is_cpp_obj, is_vftable, alignment, + is_unknown_8, others, } } diff --git a/src/til/struct.rs b/src/til/struct.rs index 9a56c1a..b328753 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -20,6 +20,8 @@ pub struct Struct { pub is_cpp_obj: bool, /// Virtual function table pub is_vftable: bool, + /// Unknown meaning, use at your own risk + pub is_uknown_8: bool, /// Alignment in bytes pub alignment: Option, // TODO delete others, parse all values or return an error @@ -44,6 +46,7 @@ impl Struct { is_msstruct: value.modifier.is_msstruct, is_cpp_obj: value.modifier.is_cpp_obj, is_vftable: value.modifier.is_vftable, + is_uknown_8: value.modifier.is_unknown_8, alignment: value.modifier.alignment, others: value.modifier.others, }) @@ -80,9 +83,17 @@ impl StructRaw { let alpow = n & 7; let effective_alignment = (alpow != 0).then(|| NonZeroU8::new(1 << (alpow - 1)).unwrap()); // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459c97 - let taudt_bits = SDACL::read(&mut *input)?; + let mut taudt_bits = SDACL::read(&mut *input)?; + + // consume the is_bit used by the StructMemberRaw + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 + let is_bitset = taudt_bits.0 .0 & 0x200 != 0; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47822d + let is_bitset2 = taudt_bits.0 .0 & 0x4 != 0; + taudt_bits.0 .0 &= !0x204; + let members = (0..mem_cnt) - .map(|_| StructMemberRaw::read(&mut *input, header, taudt_bits.0 .0)) + .map(|_| StructMemberRaw::read(&mut *input, header, is_bitset, is_bitset2)) .collect::>()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x46c4fc print_til_types_att @@ -129,13 +140,11 @@ impl StructMemberRaw { fn read( input: &mut impl IdaGenericBufUnpack, header: &TILSectionHeader, - taudt_bits: u16, + is_bit_set: bool, + is_bit_set2: bool, ) -> Result { let ty = TypeRaw::read(&mut *input, header)?; - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 - let is_bit_set = taudt_bits & 0x200 != 0; - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478256 let att = is_bit_set .then(|| Self::read_member_att_1(input, header)) @@ -147,7 +156,7 @@ impl StructMemberRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47825d sdacl = SDACL::read(&mut *input)?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47822d - if taudt_bits & 4 != 0 && sdacl.0 .0 & 0x200 == 0 { + if is_bit_set2 && sdacl.0 .0 & 0x200 == 0 { // TODO there is more to this impl? // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478411 // todo!(); diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 532d14d..f868ab9 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -632,7 +632,11 @@ fn print_til_type_struct( ) -> Result<()> { write!(fmt, "struct ")?; if til_struct.is_unaligned { - write!(fmt, "__unaligned ")?; + if til_struct.is_uknown_8 { + write!(fmt, "__attribute__((packed)) ")?; + } else { + write!(fmt, "__unaligned ")?; + } } if til_struct.is_msstruct { write!(fmt, "__attribute__((msstruct)) ")?; From 530b027b07d0b9aff0d78ff24944fbc343920ed2 Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 12:51:38 -0300 Subject: [PATCH 17/53] add tilib basic type offset att --- src/til/struct.rs | 12 ++++++++++++ src/tools/tilib.rs | 10 ++++++++++ 2 files changed, 22 insertions(+) diff --git a/src/til/struct.rs b/src/til/struct.rs index b328753..3a2caa5 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -293,6 +293,18 @@ impl StructMemberAtt { _ => None, } } + + pub fn basic_offset_type(self) -> Option<(u32, bool)> { + match self { + StructMemberAtt::Var9 { + val1, + att0: Some(att0 @ (0 | 0x3f58)), + att1: 0, + att2: u64::MAX, + } => Some((val1, att0 == 0x3f58)), + _ => None, + } + } } #[derive(Clone, Copy, Debug)] diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index f868ab9..03e7c0b 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -947,6 +947,16 @@ fn print_til_struct_member_void_pointer_att( } fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt) -> Result<()> { + // TODO imcomplete implementation + if let Some((val, is_auto)) = att.basic_offset_type() { + write!( + fmt, + " __offset({val:#x}{})", + if is_auto { "|AUTO" } else { "" } + )?; + return Ok(()); + } + let Some(basic_att) = att.basic() else { // TODO don't ignore errors return Ok(()); From 94a8aa7e958f2cb3c72c3ec9a255992f8766e54d Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 13:10:33 -0300 Subject: [PATCH 18/53] fix tilib wrong struct alignment value --- src/til/struct.rs | 3 ++- src/tools/tilib.rs | 2 +- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/src/til/struct.rs b/src/til/struct.rs index 3a2caa5..537ab06 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -89,8 +89,9 @@ impl StructRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 let is_bitset = taudt_bits.0 .0 & 0x200 != 0; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47822d + // TODO this value can't be right, it defines the alignment! let is_bitset2 = taudt_bits.0 .0 & 0x4 != 0; - taudt_bits.0 .0 &= !0x204; + taudt_bits.0 .0 &= !0x200; // NOTE don't consume 0x4, it's used somewhere else let members = (0..mem_cnt) .map(|_| StructMemberRaw::read(&mut *input, header, is_bitset, is_bitset2)) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 03e7c0b..2e307ba 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -947,7 +947,7 @@ fn print_til_struct_member_void_pointer_att( } fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt) -> Result<()> { - // TODO imcomplete implementation + // TODO incomplete implementation if let Some((val, is_auto)) = att.basic_offset_type() { write!( fmt, From c6e02c643da8eff8a608393230470d5930c92a7f Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 13:19:22 -0300 Subject: [PATCH 19/53] fix tilib missing basic offset att --- src/til/struct.rs | 5 +++-- src/tools/tilib.rs | 6 ++++++ 2 files changed, 9 insertions(+), 2 deletions(-) diff --git a/src/til/struct.rs b/src/til/struct.rs index 537ab06..bd8becb 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -296,13 +296,14 @@ impl StructMemberAtt { } pub fn basic_offset_type(self) -> Option<(u32, bool)> { + // TODO find the InnerRef match self { StructMemberAtt::Var9 { val1, - att0: Some(att0 @ (0 | 0x3f58)), + att0: Some(att0 @ (0 | 0x4e8 | 0x3f58)), att1: 0, att2: u64::MAX, - } => Some((val1, att0 == 0x3f58)), + } => Some((val1, att0 != 0)), _ => None, } } diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 2e307ba..f66ae49 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -958,6 +958,12 @@ fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt } let Some(basic_att) = att.basic() else { + if !matches!( + att, + StructMemberAtt::Var0to7(idb_rs::til::r#struct::StructMemberAttBasic::Var1(0)) + ) { + write!(fmt, " __other({att:x?})",)?; + } // TODO don't ignore errors return Ok(()); }; From 7b51fd869c3714623532b29cc7500e7dd84ee019 Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 3 Jan 2025 13:52:08 -0300 Subject: [PATCH 20/53] fix tilib function not printing void for no args --- src/tools/tilib.rs | 9 +++------ 1 file changed, 3 insertions(+), 6 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index f66ae49..33884e7 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -521,6 +521,9 @@ fn print_til_type_function( let param_name = param_name.as_ref().map(Vec::as_slice); print_til_type(fmt, section, param_name, param, true, false, true)?; } + if til_type.args.len() == 0 { + write!(fmt, "void")?; + } if til_type.calling_convention == Some(CallingConvention::Ellipsis) { if !til_type.args.is_empty() { write!(fmt, ", ")?; @@ -958,12 +961,6 @@ fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt } let Some(basic_att) = att.basic() else { - if !matches!( - att, - StructMemberAtt::Var0to7(idb_rs::til::r#struct::StructMemberAttBasic::Var1(0)) - ) { - write!(fmt, " __other({att:x?})",)?; - } // TODO don't ignore errors return Ok(()); }; From 716ea991855c1fbad2db150a88abc249ba790feb Mon Sep 17 00:00:00 2001 From: rbran Date: Mon, 6 Jan 2025 09:14:04 -0300 Subject: [PATCH 21/53] fix tilib function not printing some flags --- src/tools/tilib.rs | 30 +++++++++++++++++++++++------- 1 file changed, 23 insertions(+), 7 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 33884e7..2b24a08 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -498,19 +498,35 @@ fn print_til_type_function( (_, Some(cc)) => Some(calling_convention_to_str(cc)), }; - // print name and calling convention + // print name and calling convention and some flags match (is_pointer, cc) { - (true, None) => write!(fmt, "(*")?, - (false, None) => write!(fmt, "")?, - (true, Some(cc)) => write!(fmt, "(__{cc} *")?, + (true, None) => write!(fmt, "(")?, + (false, None) => {} + (true, Some(cc)) => write!(fmt, "(__{cc} ")?, (false, Some(cc)) => write!(fmt, "__{cc} ")?, } + + // between the name and cc print some flags + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x442ccf + if til_type.is_noret { + write!(fmt, "__noreturn ")?; + } + if til_type.is_pure { + write!(fmt, "__pure ")?; + } + if til_type.is_high { + write!(fmt, "__high ")?; + } + + if is_pointer { + write!(fmt, "*")?; + } + if let Some(name) = name { fmt.write_all(name)?; } - match (is_pointer, cc) { - (true, Some(_)) | (true, None) => write!(fmt, ")")?, - (false, Some(_)) | (false, None) => {} + if is_pointer { + write!(fmt, ")")?; } write!(fmt, "(")?; From b4c9edee69868d9bff80724bd95a5d2797f13f63 Mon Sep 17 00:00:00 2001 From: rbran Date: Mon, 6 Jan 2025 09:55:09 -0300 Subject: [PATCH 22/53] fix tilib const/volatile flag location --- src/tools/tilib.rs | 174 +++++++++++++++++++++++++++------------------ 1 file changed, 105 insertions(+), 69 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 2b24a08..de77511 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -360,53 +360,51 @@ fn print_til_type( print_type_prefix: bool, print_name: bool, ) -> Result<()> { - if til_type.is_volatile { - write!(fmt, "volatile ")?; - } - if til_type.is_const { - write!(fmt, "const ")?; - } match &til_type.type_variant { - TypeVariant::Basic(til_basic) => print_til_type_basic(fmt, section, name, til_basic), + TypeVariant::Basic(til_basic) => { + print_til_type_basic(fmt, section, name, til_type, til_basic) + } TypeVariant::Pointer(pointer) => print_til_type_pointer( fmt, section, name, + til_type, pointer, print_pointer_space, print_type_prefix, ), TypeVariant::Function(function) => { - print_til_type_function(fmt, section, name, function, false) + print_til_type_function(fmt, section, name, til_type, function, false) } TypeVariant::Array(array) => print_til_type_array( fmt, section, name, + til_type, array, print_pointer_space, print_type_prefix, ), TypeVariant::Typedef(ref_type) => { - print_til_type_typedef(fmt, section, name, ref_type, false, None) + print_til_type_typedef(fmt, section, name, til_type, ref_type, false) } TypeVariant::UnionRef(ref_type) => { - print_til_type_complex_ref(fmt, section, name, ref_type, "union", true) + print_til_type_complex_ref(fmt, section, name, til_type, ref_type, print_type_prefix) } TypeVariant::EnumRef(ref_type) => { - print_til_type_complex_ref(fmt, section, name, ref_type, "enum", true) + print_til_type_complex_ref(fmt, section, name, til_type, ref_type, print_type_prefix) } TypeVariant::StructRef(ref_type) => { - print_til_type_complex_ref(fmt, section, name, ref_type, "struct", true) + print_til_type_complex_ref(fmt, section, name, til_type, ref_type, print_type_prefix) } TypeVariant::Struct(til_struct) => { - print_til_type_struct(fmt, section, name, til_struct, print_name) + print_til_type_struct(fmt, section, name, til_type, til_struct, print_name) } TypeVariant::Union(til_union) => { - print_til_type_union(fmt, section, name, til_union, print_name) + print_til_type_union(fmt, section, name, til_type, til_union, print_name) } - TypeVariant::Enum(til_enum) => print_til_type_enum(fmt, section, name, til_enum), - TypeVariant::Bitfield(bitfield) => print_til_type_bitfield(fmt, name, bitfield), + TypeVariant::Enum(til_enum) => print_til_type_enum(fmt, section, name, til_type, til_enum), + TypeVariant::Bitfield(bitfield) => print_til_type_bitfield(fmt, name, til_type, bitfield), } } @@ -414,8 +412,15 @@ fn print_til_type_basic( fmt: &mut impl Write, _section: &TILSection, name: Option<&[u8]>, + til_type: &Type, til_basic: &Basic, ) -> Result<()> { + if til_type.is_volatile { + write!(fmt, "volatile ")?; + } + if til_type.is_const { + write!(fmt, "const ")?; + } print_basic_type(fmt, til_basic)?; if let Some(name) = name { write!(fmt, " ")?; @@ -428,13 +433,14 @@ fn print_til_type_pointer( fmt: &mut impl Write, section: &TILSection, name: Option<&[u8]>, + til_type: &Type, pointer: &Pointer, print_pointer_space: bool, print_type_prefix: bool, ) -> Result<()> { if let TypeVariant::Function(inner_fun) = &pointer.typ.type_variant { // How to handle modifier here? - print_til_type_function(fmt, section, name, inner_fun, true)?; + print_til_type_function(fmt, section, name, til_type, inner_fun, true)?; } else { // TODO name print_til_type( @@ -450,13 +456,21 @@ fn print_til_type_pointer( if print_pointer_space && !matches!(&pointer.typ.type_variant, TypeVariant::Pointer(_)) { write!(fmt, " ")?; } - let modifier = match pointer.modifier { - None => "", - Some(idb_rs::til::pointer::PointerModifier::Ptr32) => "__ptr32 ", - Some(idb_rs::til::pointer::PointerModifier::Ptr64) => "__ptr64 ", - Some(idb_rs::til::pointer::PointerModifier::Restricted) => "__restricted ", - }; - write!(fmt, "*{modifier}")?; + write!(fmt, "*")?; + if til_type.is_volatile { + write!(fmt, "volatile ")?; + } + if til_type.is_const { + write!(fmt, "const ")?; + } + match pointer.modifier { + None => {} + Some(idb_rs::til::pointer::PointerModifier::Ptr32) => write!(fmt, "__ptr32 ")?, + Some(idb_rs::til::pointer::PointerModifier::Ptr64) => write!(fmt, "__ptr64 ")?, + Some(idb_rs::til::pointer::PointerModifier::Restricted) => { + write!(fmt, "__restricted ")? + } + } if let Some((ty, value)) = &pointer.shifted { write!(fmt, "__shifted(")?; print_til_type_only(fmt, section, ty)?; @@ -478,16 +492,23 @@ fn print_til_type_function( fmt: &mut impl Write, section: &TILSection, name: Option<&[u8]>, - til_type: &Function, + til_type: &Type, + til_function: &Function, is_pointer: bool, ) -> Result<()> { + if til_type.is_volatile { + write!(fmt, "volatile ")?; + } + if til_type.is_const { + write!(fmt, "const ")?; + } // return type - print_til_type(fmt, section, None, &til_type.ret, true, true, true)?; - if !matches!(&til_type.ret.type_variant, TypeVariant::Pointer(_)) { + print_til_type(fmt, section, None, &til_function.ret, true, true, true)?; + if !matches!(&til_function.ret.type_variant, TypeVariant::Pointer(_)) { write!(fmt, " ")?; } - let cc = match (section.cc, til_type.calling_convention) { + let cc = match (section.cc, til_function.calling_convention) { // don't print if using the til section default cc | (_, None) // if elipsis just print the '...' as last param @@ -508,13 +529,13 @@ fn print_til_type_function( // between the name and cc print some flags // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x442ccf - if til_type.is_noret { + if til_function.is_noret { write!(fmt, "__noreturn ")?; } - if til_type.is_pure { + if til_function.is_pure { write!(fmt, "__pure ")?; } - if til_type.is_high { + if til_function.is_high { write!(fmt, "__high ")?; } @@ -530,18 +551,18 @@ fn print_til_type_function( } write!(fmt, "(")?; - for (i, (param_name, param, _argloc)) in til_type.args.iter().enumerate() { + for (i, (param_name, param, _argloc)) in til_function.args.iter().enumerate() { if i != 0 { write!(fmt, ", ")?; } let param_name = param_name.as_ref().map(Vec::as_slice); print_til_type(fmt, section, param_name, param, true, false, true)?; } - if til_type.args.len() == 0 { + if til_function.args.len() == 0 { write!(fmt, "void")?; } - if til_type.calling_convention == Some(CallingConvention::Ellipsis) { - if !til_type.args.is_empty() { + if til_function.calling_convention == Some(CallingConvention::Ellipsis) { + if !til_function.args.is_empty() { write!(fmt, ", ")?; } write!(fmt, "...")?; @@ -553,10 +574,17 @@ fn print_til_type_array( fmt: &mut impl Write, section: &TILSection, name: Option<&[u8]>, + til_type: &Type, til_array: &Array, print_pointer_space: bool, print_type_prefix: bool, ) -> Result<()> { + if til_type.is_volatile { + write!(fmt, "volatile ")?; + } + if til_type.is_const { + write!(fmt, "const ")?; + } print_til_type( fmt, section, @@ -567,7 +595,11 @@ fn print_til_type_array( true, )?; if let Some(name) = name { - write!(fmt, " ")?; + // only print space if not a pointer + match &til_array.elem_type.type_variant { + TypeVariant::Pointer(_) => {} + _ => write!(fmt, " ")?, + } fmt.write_all(name)?; } if til_array.nelem != 0 { @@ -582,17 +614,26 @@ fn print_til_type_typedef( fmt: &mut impl Write, section: &TILSection, name: Option<&[u8]>, + til_type: &Type, typedef: &Typedef, print_prefix: bool, - ref_prefix: Option<&str>, ) -> Result<()> { + if til_type.is_volatile { + write!(fmt, "volatile ")?; + } + if til_type.is_const { + write!(fmt, "const ")?; + } // only print prefix, if is root match typedef { idb_rs::til::Typedef::Ordinal(ord) => { let ty = section .get_ord(idb_rs::id0::Id0TilOrd { ord: (*ord).into() }) .unwrap(); - print_til_type_name(fmt, &ty.name, &ty.tinfo, print_prefix)?; + if print_prefix { + print_til_type_prefix(fmt, &ty.tinfo, true)?; + } + fmt.write_all(&ty.name)?; } idb_rs::til::Typedef::Name(None) => { // TODO print nothing? @@ -600,13 +641,16 @@ fn print_til_type_typedef( idb_rs::til::Typedef::Name(Some(name)) => { let ty = section.get_name(name); match ty { - Some(ty) => print_til_type_name(fmt, &ty.name, &ty.tinfo, print_prefix)?, + Some(ty) => { + if print_prefix { + print_til_type_prefix(fmt, &ty.tinfo, true)?; + } + fmt.write_all(&ty.name)?; + } // if we can't find the type, just print the name None => { if print_prefix { - if let Some(ref_prefix) = ref_prefix { - write!(fmt, "{ref_prefix} ")?; - } + print_til_type_prefix(fmt, til_type, true)?; } write!(fmt, "{}", String::from_utf8_lossy(name))? } @@ -624,20 +668,16 @@ fn print_til_type_complex_ref( fmt: &mut impl Write, section: &TILSection, name: Option<&[u8]>, + til_type: &Type, typedef: &Typedef, - prefix_name: &str, print_prefix: bool, ) -> Result<()> { if let idb_rs::til::Typedef::Name(None) = typedef { - if print_prefix { - write!(fmt, "{}", prefix_name)?; - if let Some(name) = name { - write!(fmt, " ")?; - fmt.write_all(name)?; - } + if let Some(name) = name { + fmt.write_all(name)?; } } else { - print_til_type_typedef(fmt, section, name, typedef, print_prefix, Some(prefix_name))?; + print_til_type_typedef(fmt, section, name, til_type, typedef, print_prefix)?; } Ok(()) } @@ -646,6 +686,7 @@ fn print_til_type_struct( fmt: &mut impl Write, section: &TILSection, name: Option<&[u8]>, + _til_type: &Type, til_struct: &Struct, print_name: bool, ) -> Result<()> { @@ -702,6 +743,7 @@ fn print_til_type_union( fmt: &mut impl Write, section: &TILSection, name: Option<&[u8]>, + _til_type: &Type, til_union: &Union, print_name: bool, ) -> Result<()> { @@ -827,6 +869,7 @@ fn print_til_type_enum( fmt: &mut impl Write, section: &TILSection, name: Option<&[u8]>, + _til_type: &Type, til_enum: &Enum, ) -> Result<()> { use idb_rs::til::r#enum::EnumFormat::*; @@ -877,6 +920,7 @@ fn print_til_type_enum( fn print_til_type_bitfield( fmt: &mut impl Write, name: Option<&[u8]>, + _til_type: &Type, bitfield: &Bitfield, ) -> Result<()> { print_basic_type( @@ -1026,25 +1070,17 @@ fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt Ok(()) } -fn print_til_type_name( - fmt: &mut impl Write, - name: &[u8], - tinfo: &Type, - print_prefix: bool, -) -> Result<()> { - let name = String::from_utf8_lossy(name); - let prefix = match &tinfo.type_variant { - TypeVariant::Basic(_) - | TypeVariant::Pointer(_) - | TypeVariant::Function(_) - | TypeVariant::Array(_) - | TypeVariant::Typedef(_) - | TypeVariant::Bitfield(_) => "", - TypeVariant::UnionRef(_) | TypeVariant::Union(_) => "union ", - TypeVariant::StructRef(_) | TypeVariant::Struct(_) => "struct ", - TypeVariant::EnumRef(_) | TypeVariant::Enum(_) => "enum ", - }; - write!(fmt, "{}{name}", if print_prefix { prefix } else { "" }) +fn print_til_type_prefix(fmt: &mut impl Write, tinfo: &Type, with_space: bool) -> Result<()> { + match &tinfo.type_variant { + TypeVariant::UnionRef(_) | TypeVariant::Union(_) => write!(fmt, "union")?, + TypeVariant::StructRef(_) | TypeVariant::Struct(_) => write!(fmt, "struct")?, + TypeVariant::EnumRef(_) | TypeVariant::Enum(_) => write!(fmt, "enum")?, + _ => return Ok(()), + } + if with_space { + write!(fmt, " ")?; + } + Ok(()) } fn print_til_type_only(fmt: &mut impl Write, section: &TILSection, tinfo: &Type) -> Result<()> { From 3eefb5f1c49312d76282b4949dc1b6ff27bb621d Mon Sep 17 00:00:00 2001 From: rbran Date: Mon, 6 Jan 2025 10:35:05 -0300 Subject: [PATCH 23/53] fix tilib multiple small print issues --- src/tools/tilib.rs | 82 ++++++++++++++++++++++------------------------ 1 file changed, 39 insertions(+), 43 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index de77511..762e483 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -254,9 +254,11 @@ fn print_types( solver: &mut TILTypeSizeSolver<'_>, ) -> Result<()> { // TODO only print by ordinals if there are ordinals - writeln!(fmt, "(enumerated by ordinals)")?; - print_types_by_ordinals(fmt, section, solver)?; - writeln!(fmt, "(enumerated by names)")?; + if section.flags.has_ordinal() { + writeln!(fmt, "(enumerated by ordinals)")?; + print_types_by_ordinals(fmt, section, solver)?; + writeln!(fmt, "(enumerated by names)")?; + } print_types_by_name(fmt, section, solver)?; Ok(()) } @@ -558,14 +560,15 @@ fn print_til_type_function( let param_name = param_name.as_ref().map(Vec::as_slice); print_til_type(fmt, section, param_name, param, true, false, true)?; } - if til_function.args.len() == 0 { - write!(fmt, "void")?; - } - if til_function.calling_convention == Some(CallingConvention::Ellipsis) { - if !til_function.args.is_empty() { - write!(fmt, ", ")?; + match til_function.calling_convention { + Some(CallingConvention::Voidarg) => write!(fmt, "void")?, + Some(CallingConvention::Ellipsis) => { + if !til_function.args.is_empty() { + write!(fmt, ", ")?; + } + write!(fmt, "...")?; } - write!(fmt, "...")?; + _ => {} } write!(fmt, ")") } @@ -624,41 +627,31 @@ fn print_til_type_typedef( if til_type.is_const { write!(fmt, "const ")?; } - // only print prefix, if is root - match typedef { + if print_prefix { + print_til_type_prefix(fmt, til_type, true)?; + } + // get the type referenced by the typdef + let need_space = match typedef { idb_rs::til::Typedef::Ordinal(ord) => { - let ty = section + let inner_ty = section .get_ord(idb_rs::id0::Id0TilOrd { ord: (*ord).into() }) .unwrap(); - if print_prefix { - print_til_type_prefix(fmt, &ty.tinfo, true)?; - } - fmt.write_all(&ty.name)?; - } - idb_rs::til::Typedef::Name(None) => { - // TODO print nothing? + fmt.write_all(&inner_ty.name)?; + true } idb_rs::til::Typedef::Name(Some(name)) => { - let ty = section.get_name(name); - match ty { - Some(ty) => { - if print_prefix { - print_til_type_prefix(fmt, &ty.tinfo, true)?; - } - fmt.write_all(&ty.name)?; - } - // if we can't find the type, just print the name - None => { - if print_prefix { - print_til_type_prefix(fmt, til_type, true)?; - } - write!(fmt, "{}", String::from_utf8_lossy(name))? - } - } + // NOTE don't need to get the inner type, we already have it's name + fmt.write_all(&name)?; + true } - } + // Nothing to print + idb_rs::til::Typedef::Name(None) => false, + }; + // print the type name, if some if let Some(name) = name { - write!(fmt, " ")?; + if need_space { + write!(fmt, " ")?; + } fmt.write_all(name)?; } Ok(()) @@ -673,6 +666,9 @@ fn print_til_type_complex_ref( print_prefix: bool, ) -> Result<()> { if let idb_rs::til::Typedef::Name(None) = typedef { + if print_prefix { + print_til_type_prefix(fmt, til_type, true)?; + } if let Some(name) = name { fmt.write_all(name)?; } @@ -785,7 +781,7 @@ fn print_til_type_complex_member( name, til, print_pointer_space, - false, + true, print_name, ); }; @@ -799,7 +795,7 @@ fn print_til_type_complex_member( name, til, print_pointer_space, - false, + true, print_name, ); } @@ -818,7 +814,7 @@ fn print_til_type_complex_member( name, til, print_pointer_space, - false, + true, print_name, ); } @@ -833,7 +829,7 @@ fn print_til_type_complex_member( name, til, print_pointer_space, - false, + true, print_name, ); } @@ -849,7 +845,7 @@ fn print_til_type_complex_member( name, til, print_pointer_space, - false, + true, print_name, ); } From 360a4da3f639617974b99af8d06aa04e627162bd Mon Sep 17 00:00:00 2001 From: rbran Date: Mon, 6 Jan 2025 14:10:30 -0300 Subject: [PATCH 24/53] fix til bitfield size calculation --- src/til.rs | 4 + src/til/bitfield.rs | 2 +- src/til/section.rs | 142 +-------------------------- src/til/size_calculator.rs | 193 +++++++++++++++++++++++++++++++++++++ src/tools/tilib.rs | 4 +- 5 files changed, 201 insertions(+), 144 deletions(-) create mode 100644 src/til/size_calculator.rs diff --git a/src/til.rs b/src/til.rs index ad86749..b9f8ec7 100644 --- a/src/til.rs +++ b/src/til.rs @@ -9,6 +9,10 @@ pub mod section; pub mod r#struct; pub mod union; +mod size_calculator; + +pub use size_calculator::*; + use std::num::{NonZeroU16, NonZeroU8}; use anyhow::{anyhow, ensure, Context, Result}; diff --git a/src/til/bitfield.rs b/src/til/bitfield.rs index 0bd7a1b..4a694f5 100644 --- a/src/til/bitfield.rs +++ b/src/til/bitfield.rs @@ -3,7 +3,7 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::TAH; -#[derive(Debug, Clone)] +#[derive(Debug, Clone, Copy)] pub struct Bitfield { pub unsigned: bool, pub width: u16, diff --git a/src/til/section.rs b/src/til/section.rs index b8fe97a..ad91dea 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -1,20 +1,15 @@ use crate::id0::{Compiler, Id0TilOrd}; use crate::ida_reader::{IdaGenericBufUnpack, IdaGenericUnpack}; -use crate::til::{flag, Basic, TILMacro, TILTypeInfo, TypeVariant}; +use crate::til::{flag, TILMacro, TILTypeInfo}; use crate::IDBSectionCompression; use anyhow::{anyhow, ensure, Result}; use serde::{Deserialize, Serialize}; -use std::collections::{HashMap, HashSet}; use std::fmt::Debug; use std::io::{BufReader, Read, Write}; use std::num::NonZeroU8; use super::function::{CCModel, CCPtrSize, CallingConvention}; -use super::r#enum::Enum; -use super::r#struct::Struct; -use super::union::Union; -use super::{Type, Typedef}; // TODO migrate this to flags pub const TIL_SECTION_MAGIC: &[u8; 6] = b"IDATIL"; @@ -684,138 +679,3 @@ impl TILSection { Ok(()) } } - -pub struct TILTypeSizeSolver<'a> { - section: &'a TILSection, - solved: HashMap, - // HACK used to avoid infinte lopping during recursive solving - solving: HashSet, -} - -impl<'a> TILTypeSizeSolver<'a> { - pub fn new(section: &'a TILSection) -> Self { - Self { - section, - solved: Default::default(), - solving: Default::default(), - } - } - - // TODO make a type for type_idx and symbol_idx, accept both here - /// NOTE that type_idx need to be specified if not a symbol - pub fn type_size_bytes(&mut self, type_idx: Option, ty: &Type) -> Option { - assert!(self.solving.is_empty()); - if let Some(idx) = type_idx { - // if cached return it - if let Some(solved) = self.cached(idx) { - return Some(solved); - } - self.solving.insert(idx); - } - let result = self.inner_type_size_bytes(ty); - if let Some(idx) = type_idx { - assert!(self.solving.remove(&idx)); - } - assert!(self.solving.is_empty()); - if let (Some(idx), Some(result)) = (type_idx, result) { - assert!(self.solved.insert(idx, result).is_none()); - } - result - } - - fn cached(&self, idx: usize) -> Option { - self.solved.get(&idx).copied() - } - - fn inner_type_size_bytes(&mut self, ty: &Type) -> Option { - Some(match &ty.type_variant { - TypeVariant::Basic(Basic::Char) => 1, - // TODO what is the SegReg size? - TypeVariant::Basic(Basic::SegReg) => 1, - TypeVariant::Basic(Basic::Void) => 0, - TypeVariant::Basic(Basic::Unknown { bytes }) => (*bytes).into(), - TypeVariant::Basic(Basic::Bool) => self.section.size_bool.get().into(), - TypeVariant::Basic(Basic::Short { .. }) => self.section.sizeof_short().get().into(), - TypeVariant::Basic(Basic::Int { .. }) => self.section.size_int.get().into(), - TypeVariant::Basic(Basic::Long { .. }) => self.section.sizeof_long().get().into(), - TypeVariant::Basic(Basic::LongLong { .. }) => { - self.section.sizeof_long_long().get().into() - } - TypeVariant::Basic(Basic::IntSized { bytes, .. }) => bytes.get().into(), - TypeVariant::Basic(Basic::BoolSized { bytes }) => bytes.get().into(), - // TODO what's the long double default size if it's not defined? - TypeVariant::Basic(Basic::LongDouble) => self - .section - .size_long_double - .map(|x| x.get()) - .unwrap_or(8) - .into(), - TypeVariant::Basic(Basic::Float { bytes }) => bytes.get().into(), - // TODO is pointer always near? Do pointer size default to 4? - TypeVariant::Pointer(_) => self.section.addr_size().get().into(), - TypeVariant::Function(_) => 0, // function type dont have a size, only a pointer to it - TypeVariant::Array(array) => { - let element_len = self.inner_type_size_bytes(&array.elem_type)?; - element_len * array.nelem as u64 - } - TypeVariant::StructRef(ref_type) - | TypeVariant::UnionRef(ref_type) - | TypeVariant::EnumRef(ref_type) - | TypeVariant::Typedef(ref_type) => self.solve_typedef(ref_type)?, - TypeVariant::Struct(Struct { members, .. }) => { - let mut sum = 0u64; - // TODO default alignment, seems like default alignemnt is the field size - let align: u64 = 1; - for member in members { - let field_size = self.inner_type_size_bytes(&member.member_type)?; - let align_diff = sum % align; - if align_diff != 0 { - sum += align - align_diff; - } - sum += field_size; - } - sum - } - TypeVariant::Union(Union { members, .. }) => { - let mut max = 0; - for (_, member) in members { - let size = self.inner_type_size_bytes(member)?; - max = max.max(size); - } - max - } - TypeVariant::Enum(Enum { storage_size, .. }) => storage_size - .or(self.section.size_enum) - .map(|x| x.get()) - .unwrap_or(4) - .into(), - TypeVariant::Bitfield(bitfield) => bitfield.width.into(), - }) - } - - fn solve_typedef(&mut self, typedef: &Typedef) -> Option { - let idx = match typedef { - Typedef::Name(name) => { - // NOTE missing names may indicate a external type, just return no size - self.section.get_name_idx(name.as_ref()?)? - } - Typedef::Ordinal(ord) => self - .section - .get_ord_idx(crate::id0::Id0TilOrd { ord: (*ord).into() })?, - }; - // if cached return it - if let Some(solved) = self.cached(idx) { - return Some(solved); - } - if !self.solving.insert(idx) { - return None; - } - let inner_type = self.section.get_type_by_idx(idx); - let result = self.inner_type_size_bytes(&inner_type.tinfo); - self.solving.remove(&idx); - if let Some(result) = result { - assert!(self.solved.insert(idx, result).is_none()); - } - result - } -} diff --git a/src/til/size_calculator.rs b/src/til/size_calculator.rs new file mode 100644 index 0000000..aa5f5a7 --- /dev/null +++ b/src/til/size_calculator.rs @@ -0,0 +1,193 @@ +use std::collections::{HashMap, HashSet}; +use std::num::NonZeroU8; + +use crate::til::bitfield::Bitfield; + +use super::r#enum::Enum; +use super::r#struct::{Struct, StructMember}; +use super::section::TILSection; +use super::union::Union; +use super::{Basic, Type, TypeVariant, Typedef}; + +pub struct TILTypeSizeSolver<'a> { + section: &'a TILSection, + solved: HashMap, + // HACK used to avoid infinte lopping during recursive solving + solving: HashSet, +} + +impl<'a> TILTypeSizeSolver<'a> { + pub fn new(section: &'a TILSection) -> Self { + Self { + section, + solved: Default::default(), + solving: Default::default(), + } + } + + // TODO make a type for type_idx and symbol_idx, accept both here + /// NOTE that type_idx need to be specified if not a symbol + pub fn type_size_bytes(&mut self, type_idx: Option, ty: &Type) -> Option { + assert!(self.solving.is_empty()); + if let Some(idx) = type_idx { + // if cached return it + if let Some(solved) = self.cached(idx) { + return Some(solved); + } + self.solving.insert(idx); + } + let result = self.inner_type_size_bytes(ty); + if let Some(idx) = type_idx { + assert!(self.solving.remove(&idx)); + } + assert!(self.solving.is_empty()); + if let (Some(idx), Some(result)) = (type_idx, result) { + assert!(self.solved.insert(idx, result).is_none()); + } + result + } + + fn cached(&self, idx: usize) -> Option { + self.solved.get(&idx).copied() + } + + fn inner_type_size_bytes(&mut self, ty: &Type) -> Option { + Some(match &ty.type_variant { + TypeVariant::Basic(Basic::Char) => 1, + // TODO what is the SegReg size? + TypeVariant::Basic(Basic::SegReg) => 1, + TypeVariant::Basic(Basic::Void) => 0, + TypeVariant::Basic(Basic::Unknown { bytes }) => (*bytes).into(), + TypeVariant::Basic(Basic::Bool) => self.section.size_bool.get().into(), + TypeVariant::Basic(Basic::Short { .. }) => self.section.sizeof_short().get().into(), + TypeVariant::Basic(Basic::Int { .. }) => self.section.size_int.get().into(), + TypeVariant::Basic(Basic::Long { .. }) => self.section.sizeof_long().get().into(), + TypeVariant::Basic(Basic::LongLong { .. }) => { + self.section.sizeof_long_long().get().into() + } + TypeVariant::Basic(Basic::IntSized { bytes, .. }) => bytes.get().into(), + TypeVariant::Basic(Basic::BoolSized { bytes }) => bytes.get().into(), + // TODO what's the long double default size if it's not defined? + TypeVariant::Basic(Basic::LongDouble) => self + .section + .size_long_double + .map(|x| x.get()) + .unwrap_or(8) + .into(), + TypeVariant::Basic(Basic::Float { bytes }) => bytes.get().into(), + // TODO is pointer always near? Do pointer size default to 4? + TypeVariant::Pointer(_) => self.section.addr_size().get().into(), + TypeVariant::Function(_) => 0, // function type dont have a size, only a pointer to it + TypeVariant::Array(array) => { + let element_len = self.inner_type_size_bytes(&array.elem_type)?; + element_len * array.nelem as u64 + } + TypeVariant::StructRef(ref_type) + | TypeVariant::UnionRef(ref_type) + | TypeVariant::EnumRef(ref_type) + | TypeVariant::Typedef(ref_type) => self.solve_typedef(ref_type)?, + TypeVariant::Struct(Struct { members, .. }) => { + let mut sum = 0u64; + // TODO default alignment, seems like default alignemnt is the field size + let align: u64 = 1; + let mut members = &members[..]; + loop { + let field_size = match members.get(0).map(|x| &x.member_type.type_variant) { + // no more members + None => break, + // if bit-field, condensate one or more to create a byte-field + Some(TypeVariant::Bitfield(bitfield)) => { + members = &members[1..]; + // NOTE it skips 0..n members + condensate_bitfields_from_struct(*bitfield, &mut members) + .get() + .into() + } + // get the inner type size + Some(_) => { + let first = &members[0]; + members = &members[1..]; + // next member + self.inner_type_size_bytes(&first.member_type)? + } + }; + let align_diff = sum % align; + if align_diff != 0 { + sum += align - align_diff; + } + sum += field_size; + } + sum + } + TypeVariant::Union(Union { members, .. }) => { + let mut max = 0; + for (_, member) in members { + let size = self.inner_type_size_bytes(member)?; + max = max.max(size); + } + max + } + TypeVariant::Enum(Enum { storage_size, .. }) => storage_size + .or(self.section.size_enum) + .map(|x| x.get()) + .unwrap_or(4) + .into(), + TypeVariant::Bitfield(bitfield) => bitfield.width.into(), + }) + } + + fn solve_typedef(&mut self, typedef: &Typedef) -> Option { + let idx = match typedef { + Typedef::Name(name) => { + // NOTE missing names may indicate a external type, just return no size + self.section.get_name_idx(name.as_ref()?)? + } + Typedef::Ordinal(ord) => self + .section + .get_ord_idx(crate::id0::Id0TilOrd { ord: (*ord).into() })?, + }; + // if cached return it + if let Some(solved) = self.cached(idx) { + return Some(solved); + } + if !self.solving.insert(idx) { + return None; + } + let inner_type = self.section.get_type_by_idx(idx); + let result = self.inner_type_size_bytes(&inner_type.tinfo); + self.solving.remove(&idx); + if let Some(result) = result { + assert!(self.solved.insert(idx, result).is_none()); + } + result + } +} + +fn condensate_bitfields_from_struct( + first_field: Bitfield, + rest: &mut &[StructMember], +) -> NonZeroU8 { + let field_bytes = first_field.nbytes; + let field_bits: u16 = u16::from(first_field.nbytes.get()) * 8; + let mut condensated_bits = first_field.width; + + loop { + let Some(TypeVariant::Bitfield(member)) = rest.get(0).map(|x| &x.member_type.type_variant) + else { + // no more bit-fields to condensate + break; + }; + let member_bits = u16::from(member.width); + // condensate the bit-field into the byte-field + condensated_bits += member_bits; + // check if this bit start the next field + if field_bytes != member.nbytes || condensated_bits > field_bits { + // NOTE this don't consume the current member + break; + } + + // advance to the next member + *rest = &rest[1..]; + } + return field_bytes; +} diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 762e483..c838bd7 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -5,9 +5,9 @@ use idb_rs::til::function::{CallingConvention, Function}; use idb_rs::til::pointer::Pointer; use idb_rs::til::r#enum::Enum; use idb_rs::til::r#struct::{Struct, StructMemberAtt}; -use idb_rs::til::section::{TILSection, TILTypeSizeSolver}; +use idb_rs::til::section::TILSection; use idb_rs::til::union::Union; -use idb_rs::til::{Basic, TILTypeInfo, Type, TypeVariant, Typedef}; +use idb_rs::til::{Basic, TILTypeInfo, TILTypeSizeSolver, Type, TypeVariant, Typedef}; use idb_rs::IDBParser; use std::fs::File; From 6ceee818877b9f8872ca50fe2292955c063f4952 Mon Sep 17 00:00:00 2001 From: rbran Date: Mon, 6 Jan 2025 15:37:56 -0300 Subject: [PATCH 25/53] improve til type size calculation --- src/til/size_calculator.rs | 60 +++++++++++++++++++++++++++++++++----- 1 file changed, 53 insertions(+), 7 deletions(-) diff --git a/src/til/size_calculator.rs b/src/til/size_calculator.rs index aa5f5a7..de1afcf 100644 --- a/src/til/size_calculator.rs +++ b/src/til/size_calculator.rs @@ -4,7 +4,7 @@ use std::num::NonZeroU8; use crate::til::bitfield::Bitfield; use super::r#enum::Enum; -use super::r#struct::{Struct, StructMember}; +use super::r#struct::StructMember; use super::section::TILSection; use super::union::Union; use super::{Basic, Type, TypeVariant, Typedef}; @@ -86,13 +86,14 @@ impl<'a> TILTypeSizeSolver<'a> { | TypeVariant::UnionRef(ref_type) | TypeVariant::EnumRef(ref_type) | TypeVariant::Typedef(ref_type) => self.solve_typedef(ref_type)?, - TypeVariant::Struct(Struct { members, .. }) => { + TypeVariant::Struct(til_struct) => { let mut sum = 0u64; // TODO default alignment, seems like default alignemnt is the field size let align: u64 = 1; - let mut members = &members[..]; + let mut members = &til_struct.members[..]; loop { - let field_size = match members.get(0).map(|x| &x.member_type.type_variant) { + let first_member = members.get(0); + let field_size = match first_member.map(|x| &x.member_type.type_variant) { // no more members None => break, // if bit-field, condensate one or more to create a byte-field @@ -111,9 +112,16 @@ impl<'a> TILTypeSizeSolver<'a> { self.inner_type_size_bytes(&first.member_type)? } }; - let align_diff = sum % align; - if align_diff != 0 { - sum += align - align_diff; + if !til_struct.is_unaligned { + let align = first_member + .map(|first| self.alignemnt(&first.member_type, field_size)) + .flatten() + .unwrap_or(align) + .max(1); + let align_diff = sum % align; + if align_diff != 0 { + sum += align - align_diff; + } } sum += field_size; } @@ -161,6 +169,44 @@ impl<'a> TILTypeSizeSolver<'a> { } result } + + fn alignemnt(&mut self, til: &Type, til_size: u64) -> Option { + match &til.type_variant { + // TODO basic types have a inherited alignment? + TypeVariant::Basic(_) | TypeVariant::Enum(_) | TypeVariant::Pointer(_) => { + Some(til_size) + } + TypeVariant::Array(array) => { + let size = self.inner_type_size_bytes(&array.elem_type); + self.alignemnt(&array.elem_type, size.unwrap_or(1)) + } + TypeVariant::EnumRef(ty) => { + let ty = match ty { + Typedef::Ordinal(ord) => self + .section + .get_ord(crate::id0::Id0TilOrd { ord: (*ord).into() }), + Typedef::Name(Some(name)) => self.section.get_name(name), + Typedef::Name(None) => None, + }; + ty.map(|ty| self.inner_type_size_bytes(&ty.tinfo)).flatten() + } + TypeVariant::Typedef(ty) => { + let ty = match ty { + Typedef::Ordinal(ord) => self + .section + .get_ord(crate::id0::Id0TilOrd { ord: (*ord).into() }), + Typedef::Name(Some(name)) => self.section.get_name(name), + Typedef::Name(None) => None, + }; + ty.map(|ty| { + let size = self.inner_type_size_bytes(&ty.tinfo).unwrap_or(1); + self.alignemnt(&ty.tinfo, size) + }) + .flatten() + } + _ => None, + } + } } fn condensate_bitfields_from_struct( From 7c91b3a636e73f9c199cee948c78217853b7a0ba Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 7 Jan 2025 08:45:33 -0300 Subject: [PATCH 26/53] fix til pointer flags --- src/til.rs | 2 ++ src/til/pointer.rs | 61 +++++++++++++++++++++++----------------------- src/tools/tilib.rs | 19 ++++++++------- 3 files changed, 43 insertions(+), 39 deletions(-) diff --git a/src/til.rs b/src/til.rs index b9f8ec7..6324e55 100644 --- a/src/til.rs +++ b/src/til.rs @@ -71,6 +71,8 @@ impl TILTypeInfo { let is_u64 = (flags >> 31) != 0; let ordinal = match (til.format, is_u64) { // formats below 0x12 doesn't have 64 bits ord + // TODO don't convert it directly into u64, tilib seems to handle + // u32 and u64 values diferently (0..=0x11, _) | (_, false) => cursor.read_u32()?.into(), (_, true) => cursor.read_u64()?, }; diff --git a/src/til/pointer.rs b/src/til/pointer.rs index e1870b9..c9985ae 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -7,9 +7,13 @@ use crate::til::{Type, TypeRaw, TAH}; #[derive(Debug, Clone)] pub struct Pointer { pub closure: PointerType, - pub modifier: Option, - pub shifted: Option<(Box, u32)>, pub typ: Box, + pub shifted: Option<(Box, u32)>, + pub is_ptr32: bool, + pub is_ptr64: bool, + pub is_restricted: bool, + pub is_unknown_ta10: bool, + pub ta_lower: u8, } impl Pointer { @@ -32,9 +36,13 @@ impl Pointer { Ok(Self { // TODO forward fields to closure? closure: PointerType::new(til, raw.closure)?, - modifier: raw.modifier, - shifted, typ, + shifted, + is_ptr32: raw.is_ptr32, + is_ptr64: raw.is_ptr64, + is_restricted: raw.is_restricted, + is_unknown_ta10: raw.is_unknown_ta10, + ta_lower: raw.ta_lower, }) } } @@ -66,19 +74,16 @@ impl PointerType { } } -#[derive(Debug, Clone, Copy)] -pub enum PointerModifier { - Ptr32, - Ptr64, - Restricted, -} - #[derive(Debug, Clone)] pub(crate) struct PointerRaw { pub closure: PointerTypeRaw, - pub modifier: Option, - pub shifted: Option<(Box, u32)>, pub typ: Box, + pub is_ptr32: bool, + pub is_ptr64: bool, + pub is_restricted: bool, + pub is_unknown_ta10: bool, + pub shifted: Option<(Box, u32)>, + pub ta_lower: u8, } impl PointerRaw { @@ -107,32 +112,28 @@ impl PointerRaw { let shifted = (tah.0 .0 & TAPTR_SHIFTED != 0) .then(|| -> Result<_> { // TODO allow typedef only? + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 print_til_type_att let typ = TypeRaw::read(&mut *input, header)?; let value = input.read_de()?; Ok((Box::new(typ), value)) }) .transpose()?; - - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 print_til_type_att - let modifier = match tah.0 .0 & (TAPTR_RESTRICT | TAPTR_PTR64 | TAPTR_PTR32) { - 0x00 => None, - TAPTR_PTR32 => Some(PointerModifier::Ptr32), - TAPTR_PTR64 => Some(PointerModifier::Ptr64), - TAPTR_RESTRICT => Some(PointerModifier::Restricted), - _ => unreachable!(), - }; - // TODO other values are known to exist - //let all_flags = TAPTR_RESTRICT | TAPTR_PTR64 | TAPTR_PTR32 | TAPTR_SHIFTED; - //anyhow::ensure!( - // tah.0 .0 & !all_flags == 0, - // "Unknown value for pointer modifier" - //); + let is_ptr32 = tah.0 .0 & TAPTR_PTR32 != 0; + let is_ptr64 = tah.0 .0 & TAPTR_PTR64 != 0; + let is_restricted = tah.0 .0 & TAPTR_RESTRICT != 0; + // TODO find the flag or doc for this + let is_unknown_ta10 = tah.0 .0 & 0x10 != 0; + let ta_lower = (tah.0 .0 & 0xf) as u8; Ok(Self { closure, - modifier, - shifted, typ: Box::new(typ), + shifted, + is_ptr32, + is_ptr64, + is_restricted, + is_unknown_ta10, + ta_lower, }) } } diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index c838bd7..93aeb65 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -465,13 +465,14 @@ fn print_til_type_pointer( if til_type.is_const { write!(fmt, "const ")?; } - match pointer.modifier { - None => {} - Some(idb_rs::til::pointer::PointerModifier::Ptr32) => write!(fmt, "__ptr32 ")?, - Some(idb_rs::til::pointer::PointerModifier::Ptr64) => write!(fmt, "__ptr64 ")?, - Some(idb_rs::til::pointer::PointerModifier::Restricted) => { - write!(fmt, "__restricted ")? - } + if pointer.is_ptr32 { + write!(fmt, "__ptr32 ")?; + } + if pointer.is_ptr64 { + write!(fmt, "__ptr64 ")?; + } + if pointer.is_restricted { + write!(fmt, "__restricted ")?; } if let Some((ty, value)) = &pointer.shifted { write!(fmt, "__shifted(")?; @@ -558,7 +559,7 @@ fn print_til_type_function( write!(fmt, ", ")?; } let param_name = param_name.as_ref().map(Vec::as_slice); - print_til_type(fmt, section, param_name, param, true, false, true)?; + print_til_type(fmt, section, param_name, param, true, true, true)?; } match til_function.calling_convention { Some(CallingConvention::Voidarg) => write!(fmt, "void")?, @@ -673,7 +674,7 @@ fn print_til_type_complex_ref( fmt.write_all(name)?; } } else { - print_til_type_typedef(fmt, section, name, til_type, typedef, print_prefix)?; + print_til_type_typedef(fmt, section, name, til_type, typedef, true)?; } Ok(()) } From 703d954b9d5f346f7c0bc36bbd89a236c0867a48 Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 7 Jan 2025 09:20:30 -0300 Subject: [PATCH 27/53] fix til dependencies --- src/til.rs | 2 +- src/til/section.rs | 30 ++++++++++++++++++------------ src/tools/dump_til.rs | 8 ++++---- src/tools/tilib.rs | 23 ++++++++++++----------- 4 files changed, 35 insertions(+), 28 deletions(-) diff --git a/src/til.rs b/src/til.rs index 6324e55..0d0e283 100644 --- a/src/til.rs +++ b/src/til.rs @@ -162,8 +162,8 @@ impl Type { let header = section::TILSectionHeader { format: 12, flags: section::TILSectionFlags(0), - title: Vec::new(), description: Vec::new(), + dependencies: Vec::new(), compiler_id: 0, cm: 0, size_enum: None, diff --git a/src/til/section.rs b/src/til/section.rs index ad91dea..955ec90 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -18,11 +18,11 @@ pub const TIL_SECTION_MAGIC: &[u8; 6] = b"IDATIL"; pub struct TILSection { pub format: u32, /// short file name (without path and extension) - pub title: Vec, + pub description: Vec, pub flags: TILSectionFlags, // TODO unclear what exacly dependency is for /// module required - pub dependency: Option>, + pub dependencies: Vec>, /// the compiler used to generated types pub compiler_id: Compiler, /// default calling convention @@ -58,8 +58,8 @@ pub struct TILSectionExtendedSizeofInfo { pub struct TILSectionHeader { pub format: u32, pub flags: TILSectionFlags, - pub title: Vec, pub description: Vec, + pub dependencies: Vec, pub compiler_id: u8, pub cm: u8, pub size_enum: Option, @@ -136,11 +136,17 @@ impl TILSection { let cn = CCPtrSize::from_cm_raw(header.cm, header.size_int); let cm = CCModel::from_cm_raw(header.cm); + let dependencies = header + .dependencies + .split(|x| *x == b',') + .map(<[_]>::to_vec) + .collect(); + Ok(TILSection { format: header.format, - title: header.title, + description: header.description, flags: header.flags, - dependency: header.description.is_empty().then_some(header.description), + dependencies, compiler_id: Compiler::from_value(header.compiler_id), cc, cn, @@ -232,19 +238,19 @@ impl TILSection { flags, }; - let title = input.read_bytes_len_u8()?; - let mut description = input.read_bytes_len_u8()?; + let description = input.read_bytes_len_u8()?; + let mut dependencies = input.read_bytes_len_u8()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x431f64 // remove the "_arm" from the description const MACOS_ARM_EXCEPTION: &[u8] = b"macosx_arm"; - if let Some(pos) = description + if let Some(pos) = dependencies .windows(MACOS_ARM_EXCEPTION.len()) .position(|window| window == MACOS_ARM_EXCEPTION) { - description = description[..pos + 6] + dependencies = dependencies[..pos + 6] .iter() - .chain(&description[pos + MACOS_ARM_EXCEPTION.len()..]) + .chain(&dependencies[pos + MACOS_ARM_EXCEPTION.len()..]) .copied() .collect::>(); } @@ -285,8 +291,8 @@ impl TILSection { Ok(TILSectionHeader { format: header1.format, flags: header1.flags, - title, description, + dependencies, compiler_id: header2.compiler_id, // TODO panic if None? size_enum: header2.size_enum.try_into().ok(), @@ -343,8 +349,8 @@ impl TILSection { def_align, }; bincode::serialize_into(&mut *output, &header1)?; - crate::write_string_len_u8(&mut *output, &header.title)?; crate::write_string_len_u8(&mut *output, &header.description)?; + crate::write_string_len_u8(&mut *output, &header.dependencies)?; bincode::serialize_into(&mut *output, &header2)?; if header.flags.have_extended_sizeof_info() { let sizes = header.extended_sizeof_info.unwrap(); diff --git a/src/tools/dump_til.rs b/src/tools/dump_til.rs index be92fd8..190f96c 100644 --- a/src/tools/dump_til.rs +++ b/src/tools/dump_til.rs @@ -28,9 +28,9 @@ pub fn dump_til(args: &Args) -> Result<()> { // this deconstruction is to changes on TILSection to force a review on this code let TILSection { format, - title, + description: title, flags: _, - dependency, + dependencies: dependency, compiler_id, cc, cm, @@ -50,8 +50,8 @@ pub fn dump_til(args: &Args) -> Result<()> { // write the header info println!("format: {format}"); println!("title: {}", String::from_utf8_lossy(title)); - if let Some(dependency) = dependency { - println!("dependency: {}", String::from_utf8_lossy(dependency)); + for (i, dependency) in dependency.iter().enumerate() { + println!("dependency-{i}: {}", String::from_utf8_lossy(dependency)); } println!("id: {compiler_id:?}"); println!("cc: {cc:?}"); diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 93aeb65..e2ce89d 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -37,11 +37,10 @@ pub fn tilib_print(args: &Args) -> anyhow::Result<()> { } fn print_til_section(mut fmt: impl Write, section: &TILSection) -> Result<()> { - if let Some(dependency) = §ion.dependency { + if !section.dependencies.is_empty() { // TODO open those files? What todo with then? - // TODO some files still missing this warning - if !dependency.is_empty() { - write!(fmt, "Warning: ")?; + write!(fmt, "Warning: ")?; + for dependency in §ion.dependencies { fmt.write_all(dependency)?; writeln!(fmt, ": No such file or directory")?; } @@ -80,7 +79,7 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { // the description of the file // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b710 write!(fmt, "Description: ")?; - fmt.write_all(§ion.title)?; + fmt.write_all(§ion.description)?; writeln!(fmt)?; // flags from the section header @@ -467,12 +466,14 @@ fn print_til_type_pointer( } if pointer.is_ptr32 { write!(fmt, "__ptr32 ")?; - } - if pointer.is_ptr64 { - write!(fmt, "__ptr64 ")?; - } - if pointer.is_restricted { - write!(fmt, "__restricted ")?; + } else { + if pointer.is_ptr64 { + write!(fmt, "__ptr64 ")?; + } else { + if pointer.is_restricted { + write!(fmt, "__restricted ")?; + } + } } if let Some((ty, value)) = &pointer.shifted { write!(fmt, "__shifted(")?; From 0b5a1234be7dc40022c55211f96b3ba0443cae5f Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 7 Jan 2025 09:23:33 -0300 Subject: [PATCH 28/53] Revert "fix til pointer flags" This reverts commit 7c91b3a636e73f9c199cee948c78217853b7a0ba. --- src/til.rs | 2 -- src/til/pointer.rs | 61 +++++++++++++++++++++++----------------------- src/tools/tilib.rs | 19 ++++++--------- 3 files changed, 38 insertions(+), 44 deletions(-) diff --git a/src/til.rs b/src/til.rs index 0d0e283..8de7918 100644 --- a/src/til.rs +++ b/src/til.rs @@ -71,8 +71,6 @@ impl TILTypeInfo { let is_u64 = (flags >> 31) != 0; let ordinal = match (til.format, is_u64) { // formats below 0x12 doesn't have 64 bits ord - // TODO don't convert it directly into u64, tilib seems to handle - // u32 and u64 values diferently (0..=0x11, _) | (_, false) => cursor.read_u32()?.into(), (_, true) => cursor.read_u64()?, }; diff --git a/src/til/pointer.rs b/src/til/pointer.rs index c9985ae..e1870b9 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -7,13 +7,9 @@ use crate::til::{Type, TypeRaw, TAH}; #[derive(Debug, Clone)] pub struct Pointer { pub closure: PointerType, - pub typ: Box, + pub modifier: Option, pub shifted: Option<(Box, u32)>, - pub is_ptr32: bool, - pub is_ptr64: bool, - pub is_restricted: bool, - pub is_unknown_ta10: bool, - pub ta_lower: u8, + pub typ: Box, } impl Pointer { @@ -36,13 +32,9 @@ impl Pointer { Ok(Self { // TODO forward fields to closure? closure: PointerType::new(til, raw.closure)?, - typ, + modifier: raw.modifier, shifted, - is_ptr32: raw.is_ptr32, - is_ptr64: raw.is_ptr64, - is_restricted: raw.is_restricted, - is_unknown_ta10: raw.is_unknown_ta10, - ta_lower: raw.ta_lower, + typ, }) } } @@ -74,16 +66,19 @@ impl PointerType { } } +#[derive(Debug, Clone, Copy)] +pub enum PointerModifier { + Ptr32, + Ptr64, + Restricted, +} + #[derive(Debug, Clone)] pub(crate) struct PointerRaw { pub closure: PointerTypeRaw, - pub typ: Box, - pub is_ptr32: bool, - pub is_ptr64: bool, - pub is_restricted: bool, - pub is_unknown_ta10: bool, + pub modifier: Option, pub shifted: Option<(Box, u32)>, - pub ta_lower: u8, + pub typ: Box, } impl PointerRaw { @@ -112,28 +107,32 @@ impl PointerRaw { let shifted = (tah.0 .0 & TAPTR_SHIFTED != 0) .then(|| -> Result<_> { // TODO allow typedef only? - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 print_til_type_att let typ = TypeRaw::read(&mut *input, header)?; let value = input.read_de()?; Ok((Box::new(typ), value)) }) .transpose()?; - let is_ptr32 = tah.0 .0 & TAPTR_PTR32 != 0; - let is_ptr64 = tah.0 .0 & TAPTR_PTR64 != 0; - let is_restricted = tah.0 .0 & TAPTR_RESTRICT != 0; - // TODO find the flag or doc for this - let is_unknown_ta10 = tah.0 .0 & 0x10 != 0; - let ta_lower = (tah.0 .0 & 0xf) as u8; + + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 print_til_type_att + let modifier = match tah.0 .0 & (TAPTR_RESTRICT | TAPTR_PTR64 | TAPTR_PTR32) { + 0x00 => None, + TAPTR_PTR32 => Some(PointerModifier::Ptr32), + TAPTR_PTR64 => Some(PointerModifier::Ptr64), + TAPTR_RESTRICT => Some(PointerModifier::Restricted), + _ => unreachable!(), + }; + // TODO other values are known to exist + //let all_flags = TAPTR_RESTRICT | TAPTR_PTR64 | TAPTR_PTR32 | TAPTR_SHIFTED; + //anyhow::ensure!( + // tah.0 .0 & !all_flags == 0, + // "Unknown value for pointer modifier" + //); Ok(Self { closure, - typ: Box::new(typ), + modifier, shifted, - is_ptr32, - is_ptr64, - is_restricted, - is_unknown_ta10, - ta_lower, + typ: Box::new(typ), }) } } diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index e2ce89d..772dd89 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -464,15 +464,12 @@ fn print_til_type_pointer( if til_type.is_const { write!(fmt, "const ")?; } - if pointer.is_ptr32 { - write!(fmt, "__ptr32 ")?; - } else { - if pointer.is_ptr64 { - write!(fmt, "__ptr64 ")?; - } else { - if pointer.is_restricted { - write!(fmt, "__restricted ")?; - } + match pointer.modifier { + None => {} + Some(idb_rs::til::pointer::PointerModifier::Ptr32) => write!(fmt, "__ptr32 ")?, + Some(idb_rs::til::pointer::PointerModifier::Ptr64) => write!(fmt, "__ptr64 ")?, + Some(idb_rs::til::pointer::PointerModifier::Restricted) => { + write!(fmt, "__restricted ")? } } if let Some((ty, value)) = &pointer.shifted { @@ -560,7 +557,7 @@ fn print_til_type_function( write!(fmt, ", ")?; } let param_name = param_name.as_ref().map(Vec::as_slice); - print_til_type(fmt, section, param_name, param, true, true, true)?; + print_til_type(fmt, section, param_name, param, true, false, true)?; } match til_function.calling_convention { Some(CallingConvention::Voidarg) => write!(fmt, "void")?, @@ -675,7 +672,7 @@ fn print_til_type_complex_ref( fmt.write_all(name)?; } } else { - print_til_type_typedef(fmt, section, name, til_type, typedef, true)?; + print_til_type_typedef(fmt, section, name, til_type, typedef, print_prefix)?; } Ok(()) } From 6d16ec90a5819f1d02190393070c73c4040a2f8c Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 7 Jan 2025 09:25:39 -0300 Subject: [PATCH 29/53] fix til pointer flags --- src/til/pointer.rs | 18 +++++++++++------- 1 file changed, 11 insertions(+), 7 deletions(-) diff --git a/src/til/pointer.rs b/src/til/pointer.rs index e1870b9..c241c4f 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -10,6 +10,8 @@ pub struct Pointer { pub modifier: Option, pub shifted: Option<(Box, u32)>, pub typ: Box, + pub is_unknown_ta10: bool, + pub ta_lower: u8, } impl Pointer { @@ -35,6 +37,8 @@ impl Pointer { modifier: raw.modifier, shifted, typ, + is_unknown_ta10: raw.is_unknown_ta10, + ta_lower: raw.ta_lower, }) } } @@ -79,6 +83,8 @@ pub(crate) struct PointerRaw { pub modifier: Option, pub shifted: Option<(Box, u32)>, pub typ: Box, + pub is_unknown_ta10: bool, + pub ta_lower: u8, } impl PointerRaw { @@ -114,25 +120,23 @@ impl PointerRaw { .transpose()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 print_til_type_att - let modifier = match tah.0 .0 & (TAPTR_RESTRICT | TAPTR_PTR64 | TAPTR_PTR32) { + let modifier = match tah.0 .0 & TAPTR_RESTRICT { 0x00 => None, TAPTR_PTR32 => Some(PointerModifier::Ptr32), TAPTR_PTR64 => Some(PointerModifier::Ptr64), TAPTR_RESTRICT => Some(PointerModifier::Restricted), _ => unreachable!(), }; - // TODO other values are known to exist - //let all_flags = TAPTR_RESTRICT | TAPTR_PTR64 | TAPTR_PTR32 | TAPTR_SHIFTED; - //anyhow::ensure!( - // tah.0 .0 & !all_flags == 0, - // "Unknown value for pointer modifier" - //); + let is_unknown_ta10 = tah.0 .0 & 0x10 != 0; + let ta_lower = (tah.0 .0 & 0xf) as u8; Ok(Self { closure, modifier, shifted, typ: Box::new(typ), + is_unknown_ta10, + ta_lower, }) } } From a2dc3007c334bfe3373d492cbbb64999b270b9d8 Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 7 Jan 2025 13:17:44 -0300 Subject: [PATCH 30/53] fix til dependencies --- src/til/pointer.rs | 2 ++ src/til/section.rs | 14 +++++++++----- 2 files changed, 11 insertions(+), 5 deletions(-) diff --git a/src/til/pointer.rs b/src/til/pointer.rs index c241c4f..a28615f 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -127,7 +127,9 @@ impl PointerRaw { TAPTR_RESTRICT => Some(PointerModifier::Restricted), _ => unreachable!(), }; + // TODO find menaing: commonly set as true let is_unknown_ta10 = tah.0 .0 & 0x10 != 0; + // TODO find meaning: normally 5 in one type at `vc10_64` and `ntddk64` let ta_lower = (tah.0 .0 & 0xf) as u8; Ok(Self { diff --git a/src/til/section.rs b/src/til/section.rs index 955ec90..87ae61b 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -136,11 +136,15 @@ impl TILSection { let cn = CCPtrSize::from_cm_raw(header.cm, header.size_int); let cm = CCModel::from_cm_raw(header.cm); - let dependencies = header - .dependencies - .split(|x| *x == b',') - .map(<[_]>::to_vec) - .collect(); + let dependencies = if header.dependencies.len() != 0 { + header + .dependencies + .split(|x| *x == b',') + .map(<[_]>::to_vec) + .collect() + } else { + vec![] + }; Ok(TILSection { format: header.format, From ef8453ecad88ff4b8c4d5095bf91c3ab324e99db Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 08:44:41 -0300 Subject: [PATCH 31/53] move type attribute read into ida_reader --- src/ida_reader.rs | 89 ++++++++++++++++++++++++++++++++++++++ src/til.rs | 89 ++++---------------------------------- src/til/array.rs | 18 +++----- src/til/bitfield.rs | 16 ++++++- src/til/enum.rs | 15 ++++--- src/til/function.rs | 4 +- src/til/pointer.rs | 14 +++--- src/til/size_calculator.rs | 3 +- src/til/struct.rs | 27 ++++++------ src/til/union.rs | 10 +++-- src/tools/tilib.rs | 4 +- 11 files changed, 160 insertions(+), 129 deletions(-) diff --git a/src/ida_reader.rs b/src/ida_reader.rs index 731b22d..71798cd 100644 --- a/src/ida_reader.rs +++ b/src/ida_reader.rs @@ -3,6 +3,8 @@ use anyhow::{anyhow, ensure, Result}; use std::io::{BufRead, ErrorKind, Read, Seek}; use std::ops::Range; +use crate::til::{TypeAttribute, TypeAttributeExt}; + pub trait IdbReader: Seek + IdaGenericBufUnpack {} impl IdbReader for R {} @@ -257,6 +259,39 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { } Ok(acc) } + + fn read_tah(&mut self) -> Result> { + // TODO TAH in each type have a especial meaning, verify those + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x477080 + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452830 + let Some(tah) = self.peek_u8()? else { + return Err(anyhow!(std::io::Error::new( + std::io::ErrorKind::UnexpectedEof, + "Unexpected EoF on DA" + ))); + }; + if tah == 0xFE { + Ok(Some(self.read_type_attribute()?)) + } else { + Ok(None) + } + } + + fn read_sdacl(&mut self) -> Result> { + let Some(sdacl) = self.peek_u8()? else { + return Err(anyhow!(std::io::Error::new( + std::io::ErrorKind::UnexpectedEof, + "Unexpected EoF on SDACL" + ))); + }; + + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x477eff + match sdacl { + //NOTE: original op ((sdacl & 0xcf) ^ 0xC0) <= 0x01 + 0xd0..=0xff | 0xc0 | 0xc1 => Ok(Some(self.read_type_attribute()?)), + _ => Ok(None), + } + } } impl IdaGenericBufUnpack for R {} @@ -461,6 +496,60 @@ pub trait IdaGenericUnpack: Read { } } + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452830 + fn read_type_attribute(&mut self) -> Result { + use crate::til::flag::tattr_ext::*; + let byte0: u8 = self.read_u8()?; + let mut tattr = 0; + if byte0 != 0xfe { + tattr = ((byte0 as u16 & 1) | ((byte0 as u16 >> 3) & 6)) + 1; + } + if byte0 == 0xFE || tattr == 8 { + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452878 + let mut shift = 0; + // TODO limit the loop to only 0..n + loop { + let next_byte: u8 = self.read_u8()?; + ensure!( + next_byte != 0, + "Failed to parse TypeAttribute, byte is zero" + ); + tattr |= ((next_byte & 0x7F) as u16) << shift; + if next_byte & 0x80 == 0 { + break; + } + shift += 7; + ensure!( + shift < u16::BITS, + "Failed to find the end of type attribute" + ); + } + } + + if tattr & TAH_HASATTRS == 0 { + return Ok(TypeAttribute { + tattr, + extended: None, + }); + } + tattr &= !TAH_HASATTRS; + + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x45289e + let loop_cnt = self.read_dt()?; + let extended = (0..loop_cnt) + .map(|_| { + let _value1 = self.unpack_dt_bytes()?; + let _value2 = self.unpack_dt_bytes()?; + // TODO maybe more... + Ok(TypeAttributeExt { _value1, _value2 }) + }) + .collect::>()?; + return Ok(TypeAttribute { + tattr, + extended: Some(extended), + }); + } + fn read_bytes_len_u16(&mut self) -> Result> { let len = self.read_u16()?; let mut bytes = vec![0u8; len.into()]; diff --git a/src/til.rs b/src/til.rs index 8de7918..a1ca104 100644 --- a/src/til.rs +++ b/src/til.rs @@ -68,6 +68,7 @@ impl TILTypeInfo { let flags: u32 = cursor.read_u32()?; // TODO verify if flags equal to 0x7fff_fffe? let name = cursor.read_c_string_raw()?; + println!("{}", String::from_utf8_lossy(&name)); let is_u64 = (flags >> 31) != 0; let ordinal = match (til.format, is_u64) { // formats below 0x12 doesn't have 64 bits ord @@ -571,88 +572,16 @@ pub struct TypeFlag(pub u8); #[derive(Clone, Copy, Debug)] pub struct CallingConventionFlag(pub u8); -#[derive(Clone, Copy, Debug)] -pub struct TypeAttribute(pub u16); -impl TypeAttribute { - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452830 - fn read(input: &mut impl IdaGenericUnpack) -> Result { - let byte0: u8 = input.read_u8()?; - let mut val = 0; - if byte0 != 0xfe { - val = ((byte0 as u16 & 1) | ((byte0 as u16 >> 3) & 6)) + 1; - } - if byte0 == 0xFE || val == 8 { - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452878 - let mut shift = 0; - // TODO limit the loop to only 0..n - loop { - let next_byte: u8 = input.read_u8()?; - ensure!( - next_byte != 0, - "Failed to parse TypeAttribute, byte is zero" - ); - val |= ((next_byte & 0x7F) as u16) << shift; - if next_byte & 0x80 == 0 { - break; - } - shift += 7; - } - } - - if val & 0x10 == 0 { - return Ok(TypeAttribute(val)); - } - - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x45289e - let loop_cnt = input.read_dt()?; - for _ in 0..loop_cnt { - let _string = input.unpack_dt_bytes()?; - let _other_thing = input.unpack_dt_bytes()?; - // TODO maybe more... - } - Ok(TypeAttribute(val)) - } -} - -#[derive(Clone, Copy, Debug)] -pub struct TAH(pub TypeAttribute); -impl TAH { - fn read(input: &mut impl IdaGenericBufUnpack) -> Result { - // TODO TAH in each type have a especial meaning, verify those - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x477080 - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452830 - let Some(tah) = input.fill_buf()?.first().copied() else { - return Err(anyhow!(std::io::Error::new( - std::io::ErrorKind::UnexpectedEof, - "Unexpected EoF on DA" - ))); - }; - if tah == 0xFE { - Ok(Self(TypeAttribute::read(input)?)) - } else { - Ok(Self(TypeAttribute(0))) - } - } +#[derive(Clone, Debug)] +pub struct TypeAttribute { + pub tattr: u16, + pub extended: Option>, } -#[derive(Clone, Copy, Debug)] -pub struct SDACL(pub TypeAttribute); -impl SDACL { - fn read(input: &mut impl IdaGenericBufUnpack) -> Result { - let Some(sdacl) = input.fill_buf()?.first().copied() else { - return Err(anyhow!(std::io::Error::new( - std::io::ErrorKind::UnexpectedEof, - "Unexpected EoF on SDACL" - ))); - }; - - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x477eff - match sdacl { - //NOTE: original op ((sdacl & 0xcf) ^ 0xC0) <= 0x01 - 0xd0..=0xff | 0xc0 | 0xc1 => Ok(Self(TypeAttribute::read(input)?)), - _ => Ok(Self(TypeAttribute(0))), - } - } +#[derive(Clone, Debug)] +pub struct TypeAttributeExt { + pub _value1: Vec, + pub _value2: Vec, } fn serialize_dt(value: u16) -> Result> { diff --git a/src/til/array.rs b/src/til/array.rs index 14120ff..52e38f7 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -1,13 +1,13 @@ +use std::num::NonZeroU16; + use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; -use crate::til::{Type, TypeRaw, TAH}; +use crate::til::{Type, TypeRaw}; #[derive(Clone, Debug)] pub struct Array { pub base: u8, - // TODO make this Option? - pub nelem: u16, - pub tah: TAH, + pub nelem: Option, pub elem_type: Box, } impl Array { @@ -19,7 +19,6 @@ impl Array { Ok(Self { base: value.base, nelem: value.nelem, - tah: value.tah, elem_type: Type::new(til, *value.elem_type, fields).map(Box::new)?, }) } @@ -28,8 +27,7 @@ impl Array { #[derive(Clone, Debug)] pub(crate) struct ArrayRaw { pub base: u8, - pub nelem: u16, - pub tah: TAH, + pub nelem: Option, pub elem_type: Box, } @@ -42,7 +40,6 @@ impl ArrayRaw { use crate::til::flag::tf_array::*; let (base, nelem) = match metadata { BTMT_NONBASED => { - // TODO if num_elem==0 then the array size is unknown let nelem = input.read_dt()?; (0, nelem) } @@ -53,12 +50,11 @@ impl ArrayRaw { } }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48078e - let tah = TAH::read(&mut *input)?; + let _tah = input.read_tah()?; let elem_type = TypeRaw::read(&mut *input, header)?; Ok(ArrayRaw { base, - nelem, - tah, + nelem: NonZeroU16::new(nelem), elem_type: Box::new(elem_type), }) } diff --git a/src/til/bitfield.rs b/src/til/bitfield.rs index 4a694f5..ba279c8 100644 --- a/src/til/bitfield.rs +++ b/src/til/bitfield.rs @@ -1,11 +1,23 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; -use crate::til::TAH; #[derive(Debug, Clone, Copy)] pub struct Bitfield { pub unsigned: bool, + // TODO what a 0 width bitfield means? The start of a new byte-field? + // ntddk_win10.til + // struct _D3DKMDT_DISPLAYMODE_FLAGS { + // unsigned __int32 ValidatedAgainstMonitorCaps : 1; + // unsigned __int32 RoundedFakeMode : 1; + // unsigned __int32 : 0; + // __int32 ModePruningReason : 4; + // unsigned __int32 Stereo : 1; + // unsigned __int32 AdvancedScanCapable : 1; + // unsigned __int32 PreferredTiming : 1; + // unsigned __int32 PhysicalModeSupported : 1; + // unsigned __int32 Reserved : 24; + // }; pub width: u16, pub nbytes: NonZeroU8, } @@ -23,7 +35,7 @@ impl Bitfield { let dt = input.read_dt()?; let width = dt >> 1; let unsigned = (dt & 1) > 0; - let _tag = TAH::read(&mut *input)?; + let _tah = input.read_tah()?; Ok(Self { unsigned, width, diff --git a/src/til/enum.rs b/src/til/enum.rs index e6e7337..b04c241 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -2,7 +2,7 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; -use crate::til::{flag, StructModifierRaw, TypeRaw, TypeVariantRaw, SDACL, TAH}; +use crate::til::{flag, StructModifierRaw, TypeRaw, TypeVariantRaw}; use anyhow::{anyhow, ensure}; #[derive(Clone, Debug)] @@ -61,15 +61,14 @@ impl EnumRaw { // is ref // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4803b4 let ref_type = TypeRaw::read_ref(&mut *input, header)?; - let _taenum_bits = SDACL::read(&mut *input)?.0; + let _taenum_bits = input.read_sdacl()?; let TypeVariantRaw::Typedef(ref_type) = ref_type.variant else { return Err(anyhow!("EnumRef Non Typedef")); }; return Ok(TypeVariantRaw::EnumRef(ref_type)); }; - let taenum_bits = TAH::read(&mut *input)?.0; - let _modifiers = StructModifierRaw::from_value(taenum_bits.0); + let taenum_bits = input.read_tah()?; // TODO parse ext attr let bte = input.read_u8()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452312 deserialize_enum @@ -103,11 +102,13 @@ impl EnumRaw { }; // TODO ensure no bits from bte or taenum_bits are unparsed - let is_signed = taenum_bits.0 & TAENUM_SIGNED != 0; - let is_unsigned = taenum_bits.0 & TAENUM_UNSIGNED != 0; + let taenum_bits = taenum_bits.as_ref().map(|x| x.tattr).unwrap_or(0); + let _modifiers = StructModifierRaw::from_value(taenum_bits); + let is_signed = taenum_bits & TAENUM_SIGNED != 0; + let is_unsigned = taenum_bits & TAENUM_UNSIGNED != 0; // TODO ensure only signed/unsigned is allowed? // - let is_64 = (taenum_bits.0 & TAENUM_64BIT) != 0; + let is_64 = (taenum_bits & TAENUM_64BIT) != 0; let mut low_acc: u32 = 0; let mut high_acc: u32 = 0; let mut group_acc = 0; diff --git a/src/til/function.rs b/src/til/function.rs index 0362890..6173435 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -2,7 +2,7 @@ use std::num::NonZeroU8; use crate::ida_reader::{IdaGenericBufUnpack, IdaGenericUnpack}; use crate::til::section::TILSectionHeader; -use crate::til::{Basic, Type, TypeRaw, TAH}; +use crate::til::{Basic, Type, TypeRaw}; use anyhow::{anyhow, ensure, Result}; use super::TypeVariantRaw; @@ -164,7 +164,7 @@ impl FunctionRaw { flags &= !0x0100; ensure!(flags == 0, "unknown function attrs({flags:04X})"); - let _tah = TAH::read(&mut *input)?; + let _tah = input.read_tah()?; let ret = TypeRaw::read(&mut *input, header)?; // TODO double check documentation for [flag::tf_func::BT_FUN] diff --git a/src/til/pointer.rs b/src/til/pointer.rs index a28615f..bb873dd 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -2,7 +2,7 @@ use anyhow::Result; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; -use crate::til::{Type, TypeRaw, TAH}; +use crate::til::{Type, TypeRaw}; #[derive(Debug, Clone)] pub struct Pointer { @@ -107,10 +107,12 @@ impl PointerRaw { }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4804fa // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459b7e - let tah = TAH::read(&mut *input)?; + let tah = input.read_tah()?; + // TODO handle ext att + let tah = tah.map(|x| x.tattr).unwrap_or(0); let typ = TypeRaw::read(&mut *input, header)?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 - let shifted = (tah.0 .0 & TAPTR_SHIFTED != 0) + let shifted = (tah & TAPTR_SHIFTED != 0) .then(|| -> Result<_> { // TODO allow typedef only? let typ = TypeRaw::read(&mut *input, header)?; @@ -120,7 +122,7 @@ impl PointerRaw { .transpose()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 print_til_type_att - let modifier = match tah.0 .0 & TAPTR_RESTRICT { + let modifier = match tah & TAPTR_RESTRICT { 0x00 => None, TAPTR_PTR32 => Some(PointerModifier::Ptr32), TAPTR_PTR64 => Some(PointerModifier::Ptr64), @@ -128,9 +130,9 @@ impl PointerRaw { _ => unreachable!(), }; // TODO find menaing: commonly set as true - let is_unknown_ta10 = tah.0 .0 & 0x10 != 0; + let is_unknown_ta10 = tah & 0x10 != 0; // TODO find meaning: normally 5 in one type at `vc10_64` and `ntddk64` - let ta_lower = (tah.0 .0 & 0xf) as u8; + let ta_lower = (tah & 0xf) as u8; Ok(Self { closure, diff --git a/src/til/size_calculator.rs b/src/til/size_calculator.rs index de1afcf..8e9e164 100644 --- a/src/til/size_calculator.rs +++ b/src/til/size_calculator.rs @@ -80,7 +80,8 @@ impl<'a> TILTypeSizeSolver<'a> { TypeVariant::Function(_) => 0, // function type dont have a size, only a pointer to it TypeVariant::Array(array) => { let element_len = self.inner_type_size_bytes(&array.elem_type)?; - element_len * array.nelem as u64 + let nelem = array.nelem.map(|x| x.get()).unwrap_or(0) as u64; + element_len * nelem } TypeVariant::StructRef(ref_type) | TypeVariant::UnionRef(ref_type) diff --git a/src/til/struct.rs b/src/til/struct.rs index bd8becb..abc68f1 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -2,7 +2,7 @@ use std::num::{NonZeroU16, NonZeroU8}; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; -use crate::til::{Type, TypeRaw, SDACL}; +use crate::til::{Type, TypeRaw}; use anyhow::{anyhow, Result}; use num_enum::{FromPrimitive, IntoPrimitive, TryFromPrimitive}; @@ -70,7 +70,7 @@ impl StructRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4803b4 // simple reference let ref_type = TypeRaw::read_ref(&mut *input, header)?; - let _taudt_bits = SDACL::read(&mut *input)?; + let _taudt_bits = input.read_sdacl()?; let TypeVariantRaw::Typedef(ref_type) = ref_type.variant else { return Err(anyhow!("StructRef Non Typedef")); }; @@ -83,22 +83,24 @@ impl StructRaw { let alpow = n & 7; let effective_alignment = (alpow != 0).then(|| NonZeroU8::new(1 << (alpow - 1)).unwrap()); // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459c97 - let mut taudt_bits = SDACL::read(&mut *input)?; + let taudt_bits = input.read_sdacl()?; + // TODO check ext atts + let mut taudt_bits = taudt_bits.map(|x| x.tattr).unwrap_or(0); // consume the is_bit used by the StructMemberRaw // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 - let is_bitset = taudt_bits.0 .0 & 0x200 != 0; + let is_bitset = taudt_bits & 0x200 != 0; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47822d // TODO this value can't be right, it defines the alignment! - let is_bitset2 = taudt_bits.0 .0 & 0x4 != 0; - taudt_bits.0 .0 &= !0x200; // NOTE don't consume 0x4, it's used somewhere else + let is_bitset2 = taudt_bits & 0x4 != 0; + taudt_bits &= !0x200; // NOTE don't consume 0x4, it's used somewhere else let members = (0..mem_cnt) .map(|_| StructMemberRaw::read(&mut *input, header, is_bitset, is_bitset2)) .collect::>()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x46c4fc print_til_types_att - let modifier = StructModifierRaw::from_value(taudt_bits.0 .0); + let modifier = StructModifierRaw::from_value(taudt_bits); Ok(TypeVariantRaw::Struct(Self { effective_alignment, modifier, @@ -111,7 +113,6 @@ impl StructRaw { pub struct StructMember { pub name: Option>, pub member_type: Type, - pub sdacl: SDACL, pub att: Option, } @@ -125,7 +126,6 @@ impl StructMember { Ok(Self { name, member_type: Type::new(til, m.ty, fields)?, - sdacl: m.sdacl, att: m.att, }) } @@ -133,7 +133,6 @@ impl StructMember { #[derive(Clone, Debug)] pub(crate) struct StructMemberRaw { pub ty: TypeRaw, - pub sdacl: SDACL, pub att: Option, } @@ -152,19 +151,19 @@ impl StructMemberRaw { .transpose()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47825d - let mut sdacl = SDACL(crate::til::TypeAttribute(0)); if !is_bit_set || matches!(att, Some(_att1)) { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47825d - sdacl = SDACL::read(&mut *input)?; + let sdacl = input.read_sdacl()?; + let sdacl_value = sdacl.as_ref().map(|x| x.tattr).unwrap_or(0); // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47822d - if is_bit_set2 && sdacl.0 .0 & 0x200 == 0 { + if is_bit_set2 && sdacl_value & 0x200 == 0 { // TODO there is more to this impl? // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478411 // todo!(); } } - Ok(Self { ty, sdacl, att }) + Ok(Self { ty, att }) } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x486cd0 diff --git a/src/til/union.rs b/src/til/union.rs index 3ee6977..8a1f750 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -4,7 +4,7 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; -use crate::til::{Type, TypeRaw, SDACL}; +use crate::til::{Type, TypeRaw}; use super::{StructModifierRaw, TypeVariantRaw}; @@ -57,7 +57,7 @@ impl UnionRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4803b4 // is ref let ref_type = TypeRaw::read_ref(&mut *input, header)?; - let _taudt_bits = SDACL::read(&mut *input)?; + let _taudt_bits = input.read_sdacl()?; let TypeVariantRaw::Typedef(ref_type) = ref_type.variant else { return Err(anyhow!("UnionRef Non Typedef")); }; @@ -68,8 +68,10 @@ impl UnionRaw { let alpow = n & 7; let mem_cnt = n >> 3; let effective_alignment = if alpow == 0 { 0 } else { 1 << (alpow - 1) }; - let taudt_bits = SDACL::read(&mut *input)?; - let modifiers = StructModifierRaw::from_value(taudt_bits.0 .0); + let taudt_bits = input.read_sdacl()?; + // TODO handle ext atts + let taudt_bits = taudt_bits.as_ref().map(|x| x.tattr).unwrap_or(0); + let modifiers = StructModifierRaw::from_value(taudt_bits); // TODO check InnerRef to how to handle modifiers let alignment = modifiers.alignment; let members = (0..mem_cnt) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 772dd89..7571360 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -604,8 +604,8 @@ fn print_til_type_array( } fmt.write_all(name)?; } - if til_array.nelem != 0 { - write!(fmt, "[{}]", til_array.nelem)?; + if let Some(nelem) = til_array.nelem { + write!(fmt, "[{nelem}]")?; } else { write!(fmt, "[]")?; } From 778d38d6a62826256a56894209ccb5014dfbd07b Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 10:13:51 -0300 Subject: [PATCH 32/53] add tilib enum type attribute verifications --- src/ida_reader.rs | 1 + src/til/enum.rs | 57 +++++++++++++++++++++++++++++++++++------------ 2 files changed, 44 insertions(+), 14 deletions(-) diff --git a/src/ida_reader.rs b/src/ida_reader.rs index 71798cd..7962a7b 100644 --- a/src/ida_reader.rs +++ b/src/ida_reader.rs @@ -532,6 +532,7 @@ pub trait IdaGenericUnpack: Read { extended: None, }); } + // consume this flag tattr &= !TAH_HASATTRS; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x45289e diff --git a/src/til/enum.rs b/src/til/enum.rs index b04c241..809b09a 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -2,7 +2,7 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; -use crate::til::{flag, StructModifierRaw, TypeRaw, TypeVariantRaw}; +use crate::til::{flag, TypeAttribute, TypeRaw, TypeVariantRaw}; use anyhow::{anyhow, ensure}; #[derive(Clone, Debug)] @@ -61,6 +61,7 @@ impl EnumRaw { // is ref // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4803b4 let ref_type = TypeRaw::read_ref(&mut *input, header)?; + // TODO ensure all bits from sdacl are parsed let _taenum_bits = input.read_sdacl()?; let TypeVariantRaw::Typedef(ref_type) = ref_type.variant else { return Err(anyhow!("EnumRef Non Typedef")); @@ -69,14 +70,50 @@ impl EnumRaw { }; let taenum_bits = input.read_tah()?; - // TODO parse ext attr + let (is_64, is_signed, is_unsigned) = match taenum_bits { + None => (false, false, false), + Some(TypeAttribute { + tattr, + extended: None, + }) => { + let is_64 = tattr & TAENUM_64BIT != 0; + let is_signed = tattr & TAENUM_SIGNED != 0; + let is_unsigned = tattr & TAENUM_UNSIGNED != 0; + ensure!( + tattr & !(TAENUM_64BIT | TAENUM_SIGNED | TAENUM_UNSIGNED) == 0, + "Invalid Enum taenum_bits {tattr:x}" + ); + ensure!( + !(is_signed && is_unsigned), + "Enum can't be signed and unsigned at the same time" + ); + (is_64, is_signed, is_unsigned) + } + // TODO parse ext attr? + Some(TypeAttribute { + tattr: _, + extended: Some(_), + }) => { + return Err(anyhow!("Unable to parse extended attributes for enum")); + } + }; + + // all BTE bits are consumed let bte = input.read_u8()?; + let storage_size_raw = bte & BTE_SIZE_MASK; + ensure!( + bte & BTE_RESERVED == 0, + "Enum BTE including the Always off sub-field" + ); + let have_subarrays = bte & BTE_BITFIELD != 0; + let output_format_raw = bte & BTE_OUT_MASK; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452312 deserialize_enum ensure!( bte & BTE_ALWAYS != 0, - "Enum BTE missing the Always sub-field" + "Enum BTE missing the Always on sub-field" ); - let storage_size: Option = match bte & BTE_SIZE_MASK { + + let storage_size: Option = match storage_size_raw { 0 => None, emsize @ 1..=4 => Some((1 << (emsize - 1)).try_into().unwrap()), // Allowed at InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4523c8 deserialize_enum @@ -93,7 +130,7 @@ impl EnumRaw { u64::MAX >> (u64::BITS - (storage_size_final as u32 * 8)) }; - let output_format = match bte & BTE_OUT_MASK { + let output_format = match output_format_raw { BTE_HEX => EnumFormat::Hex, BTE_CHAR => EnumFormat::Char, BTE_SDEC => EnumFormat::SignedDecimal, @@ -101,18 +138,10 @@ impl EnumRaw { _ => unreachable!(), }; - // TODO ensure no bits from bte or taenum_bits are unparsed - let taenum_bits = taenum_bits.as_ref().map(|x| x.tattr).unwrap_or(0); - let _modifiers = StructModifierRaw::from_value(taenum_bits); - let is_signed = taenum_bits & TAENUM_SIGNED != 0; - let is_unsigned = taenum_bits & TAENUM_UNSIGNED != 0; - // TODO ensure only signed/unsigned is allowed? - // - let is_64 = (taenum_bits & TAENUM_64BIT) != 0; let mut low_acc: u32 = 0; let mut high_acc: u32 = 0; let mut group_acc = 0; - let mut groups = (bte & BTE_BITFIELD != 0).then_some(vec![]); + let mut groups = have_subarrays.then_some(vec![]); let members = (0..member_num) .map(|_member_idx| { if let Some(groups) = &mut groups { From e904ae02a1f4dbb38c2d96bf29c25bf8ddf16568 Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 12:06:56 -0300 Subject: [PATCH 33/53] add tilib pointer type attribute ext verifications --- src/til/pointer.rs | 40 +++++++++++++++++++++++----------------- 1 file changed, 23 insertions(+), 17 deletions(-) diff --git a/src/til/pointer.rs b/src/til/pointer.rs index bb873dd..db45cee 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -2,7 +2,7 @@ use anyhow::Result; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; -use crate::til::{Type, TypeRaw}; +use crate::til::{Type, TypeAttribute, TypeRaw}; #[derive(Debug, Clone)] pub struct Pointer { @@ -10,8 +10,6 @@ pub struct Pointer { pub modifier: Option, pub shifted: Option<(Box, u32)>, pub typ: Box, - pub is_unknown_ta10: bool, - pub ta_lower: u8, } impl Pointer { @@ -37,8 +35,6 @@ impl Pointer { modifier: raw.modifier, shifted, typ, - is_unknown_ta10: raw.is_unknown_ta10, - ta_lower: raw.ta_lower, }) } } @@ -83,8 +79,8 @@ pub(crate) struct PointerRaw { pub modifier: Option, pub shifted: Option<(Box, u32)>, pub typ: Box, - pub is_unknown_ta10: bool, - pub ta_lower: u8, + // TODO find meaning: normally 5 in one type at `vc10_64` and `ntddk64` + pub _ta_lower: u8, } impl PointerRaw { @@ -108,11 +104,26 @@ impl PointerRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4804fa // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459b7e let tah = input.read_tah()?; - // TODO handle ext att - let tah = tah.map(|x| x.tattr).unwrap_or(0); + let (_ta_lower, is_shifted, ptr_type_raw) = match tah { + None => (0, false, 0), + Some(TypeAttribute { tattr, extended }) => { + // all bits of tattr are consumed + let ta_lower = (tattr & 0xf) as u8; + let is_shifted = tattr & TAPTR_SHIFTED != 0; + let ptr_type = tattr & TAPTR_RESTRICT; + if let Some(_extended) = extended { + // TODO parse extended values, known: + // "__org_arrdim" :"\xac\xXX" + // "__org_typedef":..., + // "__argz_create":"\xac\xac" + } + (ta_lower, is_shifted, ptr_type) + } + }; + let typ = TypeRaw::read(&mut *input, header)?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 - let shifted = (tah & TAPTR_SHIFTED != 0) + let shifted = is_shifted .then(|| -> Result<_> { // TODO allow typedef only? let typ = TypeRaw::read(&mut *input, header)?; @@ -122,25 +133,20 @@ impl PointerRaw { .transpose()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459bc6 print_til_type_att - let modifier = match tah & TAPTR_RESTRICT { + let modifier = match ptr_type_raw { 0x00 => None, TAPTR_PTR32 => Some(PointerModifier::Ptr32), TAPTR_PTR64 => Some(PointerModifier::Ptr64), TAPTR_RESTRICT => Some(PointerModifier::Restricted), _ => unreachable!(), }; - // TODO find menaing: commonly set as true - let is_unknown_ta10 = tah & 0x10 != 0; - // TODO find meaning: normally 5 in one type at `vc10_64` and `ntddk64` - let ta_lower = (tah & 0xf) as u8; Ok(Self { closure, modifier, shifted, typ: Box::new(typ), - is_unknown_ta10, - ta_lower, + _ta_lower, }) } } From d8a144a92dff6406b20c389ae1a437bcb5b87e17 Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 12:07:08 -0300 Subject: [PATCH 34/53] add context to error messages --- src/til.rs | 21 ++++++++++++++------- src/til/function.rs | 17 +++++++++++------ src/til/struct.rs | 7 +++++-- src/til/union.rs | 4 ++-- 4 files changed, 32 insertions(+), 17 deletions(-) diff --git a/src/til.rs b/src/til.rs index a1ca104..1453fac 100644 --- a/src/til.rs +++ b/src/til.rs @@ -68,15 +68,18 @@ impl TILTypeInfo { let flags: u32 = cursor.read_u32()?; // TODO verify if flags equal to 0x7fff_fffe? let name = cursor.read_c_string_raw()?; - println!("{}", String::from_utf8_lossy(&name)); let is_u64 = (flags >> 31) != 0; let ordinal = match (til.format, is_u64) { // formats below 0x12 doesn't have 64 bits ord (0..=0x11, _) | (_, false) => cursor.read_u32()?.into(), (_, true) => cursor.read_u64()?, }; - let tinfo_raw = - TypeRaw::read(&mut *cursor, til).context("parsing `TILTypeInfo::tiinfo`")?; + let tinfo_raw = TypeRaw::read(&mut *cursor, til).with_context(|| { + format!( + "parsing `TILTypeInfo::tiinfo` for type \"{}\"", + String::from_utf8_lossy(&name) + ) + })?; let _info = cursor.read_c_string_raw()?; let cmt = cursor.read_c_string_raw()?; let fields = cursor.read_c_string_vec()?; @@ -88,7 +91,11 @@ impl TILTypeInfo { .into_iter() .map(|field| if field.is_empty() { None } else { Some(field) }); let tinfo = Type::new(til, tinfo_raw, &mut fields_iter)?; - ensure!(fields_iter.next().is_none(), "Extra fields found for til"); + ensure!( + fields_iter.next().is_none(), + "Extra fields found for til type \"{}\"", + String::from_utf8_lossy(&name) + ); Ok(Self { _flags: flags, @@ -237,9 +244,9 @@ impl TypeRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x480335 // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x472e13 print_til_type let variant = match (type_base, type_flags) { - (..=flag::tf_last_basic::BT_LAST_BASIC, _) => { - Basic::new(til, type_base, type_flags).map(TypeVariantRaw::Basic)? - } + (..=flag::tf_last_basic::BT_LAST_BASIC, _) => Basic::new(til, type_base, type_flags) + .context("Type::Basic") + .map(TypeVariantRaw::Basic)?, // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4804d7 (flag::tf_ptr::BT_PTR, _) => PointerRaw::read(input, til, type_flags) .context("Type::Pointer") diff --git a/src/til/function.rs b/src/til/function.rs index 6173435..bfded55 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -3,7 +3,7 @@ use std::num::NonZeroU8; use crate::ida_reader::{IdaGenericBufUnpack, IdaGenericUnpack}; use crate::til::section::TILSectionHeader; use crate::til::{Basic, Type, TypeRaw}; -use anyhow::{anyhow, ensure, Result}; +use anyhow::{anyhow, ensure, Context, Result}; use super::TypeVariantRaw; @@ -166,12 +166,15 @@ impl FunctionRaw { let _tah = input.read_tah()?; - let ret = TypeRaw::read(&mut *input, header)?; + let ret = TypeRaw::read(&mut *input, header).context("Return Argument")?; // TODO double check documentation for [flag::tf_func::BT_FUN] let is_special_pe = cc.map(CallingConvention::is_special_pe).unwrap_or(false); let have_retloc = is_special_pe && !matches!(&ret.variant, TypeVariantRaw::Basic(Basic::Void)); - let retloc = have_retloc.then(|| ArgLoc::read(&mut *input)).transpose()?; + let retloc = have_retloc + .then(|| ArgLoc::read(&mut *input)) + .transpose() + .context("Retloc")?; let mut result = Self { calling_convention: cc, @@ -195,17 +198,19 @@ impl FunctionRaw { let n = input.read_dt()?; result.args = (0..n) - .map(|_| -> Result<_> { + .map(|i| -> Result<_> { let tmp = input.peek_u8()?; if tmp == Some(0xFF) { input.consume(1); // TODO what is this? let _flags = input.read_de()?; } - let tinfo = TypeRaw::read(&mut *input, header)?; + let tinfo = TypeRaw::read(&mut *input, header) + .with_context(|| format!("Argument Type {i}"))?; let argloc = is_special_pe .then(|| ArgLoc::read(&mut *input)) - .transpose()?; + .transpose() + .with_context(|| format!("Argument Argloc {i}"))?; Ok((tinfo, argloc)) }) diff --git a/src/til/struct.rs b/src/til/struct.rs index abc68f1..30589d5 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -3,7 +3,7 @@ use std::num::{NonZeroU16, NonZeroU8}; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeRaw}; -use anyhow::{anyhow, Result}; +use anyhow::{anyhow, Context, Result}; use num_enum::{FromPrimitive, IntoPrimitive, TryFromPrimitive}; use super::{StructModifierRaw, TypeVariantRaw}; @@ -96,7 +96,10 @@ impl StructRaw { taudt_bits &= !0x200; // NOTE don't consume 0x4, it's used somewhere else let members = (0..mem_cnt) - .map(|_| StructMemberRaw::read(&mut *input, header, is_bitset, is_bitset2)) + .map(|i| { + StructMemberRaw::read(&mut *input, header, is_bitset, is_bitset2) + .with_context(|| format!("Member {i}")) + }) .collect::>()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x46c4fc print_til_types_att diff --git a/src/til/union.rs b/src/til/union.rs index 8a1f750..0d449d9 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -1,4 +1,4 @@ -use anyhow::anyhow; +use anyhow::{anyhow, Context}; use std::num::NonZeroU8; @@ -75,7 +75,7 @@ impl UnionRaw { // TODO check InnerRef to how to handle modifiers let alignment = modifiers.alignment; let members = (0..mem_cnt) - .map(|_| TypeRaw::read(&mut *input, header)) + .map(|i| TypeRaw::read(&mut *input, header).with_context(|| format!("Member {i}"))) .collect::>()?; Ok(TypeVariantRaw::Union(Self { effective_alignment, From c58e053a1b0715ee3c4c54f7a9c6940c69b7041b Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 12:52:07 -0300 Subject: [PATCH 35/53] add tilib array type attribute ext verifications --- src/til/array.rs | 27 ++++++++++++++++++++++++--- src/til/enum.rs | 4 ++-- src/til/pointer.rs | 6 +++--- 3 files changed, 29 insertions(+), 8 deletions(-) diff --git a/src/til/array.rs b/src/til/array.rs index 52e38f7..1383c24 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -1,11 +1,14 @@ -use std::num::NonZeroU16; +use std::num::{NonZeroU16, NonZeroU8}; + +use anyhow::ensure; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; -use crate::til::{Type, TypeRaw}; +use crate::til::{Type, TypeAttribute, TypeRaw}; #[derive(Clone, Debug)] pub struct Array { + pub align: Option, pub base: u8, pub nelem: Option, pub elem_type: Box, @@ -17,6 +20,7 @@ impl Array { fields: &mut impl Iterator>>, ) -> anyhow::Result { Ok(Self { + align: value.align, base: value.base, nelem: value.nelem, elem_type: Type::new(til, *value.elem_type, fields).map(Box::new)?, @@ -26,6 +30,7 @@ impl Array { #[derive(Clone, Debug)] pub(crate) struct ArrayRaw { + pub align: Option, pub base: u8, pub nelem: Option, pub elem_type: Box, @@ -37,6 +42,7 @@ impl ArrayRaw { header: &TILSectionHeader, metadata: u8, ) -> anyhow::Result { + use crate::til::flag::tattr::*; use crate::til::flag::tf_array::*; let (base, nelem) = match metadata { BTMT_NONBASED => { @@ -50,10 +56,25 @@ impl ArrayRaw { } }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48078e - let _tah = input.read_tah()?; + let align = match input.read_tah()? { + None => None, + Some(TypeAttribute { tattr, extended }) => { + let align = (tattr & MAX_DECL_ALIGN) as u8; + ensure!( + tattr & !MAX_DECL_ALIGN == 0, + "unknown TypeAttribute {tattr:x}" + ); + ensure!( + extended.is_none(), + "unknown TypeAttribute ext {extended:x?}" + ); + NonZeroU8::new(align) + } + }; let elem_type = TypeRaw::read(&mut *input, header)?; Ok(ArrayRaw { base, + align, nelem: NonZeroU16::new(nelem), elem_type: Box::new(elem_type), }) diff --git a/src/til/enum.rs b/src/til/enum.rs index 809b09a..6f562ce 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -69,13 +69,13 @@ impl EnumRaw { return Ok(TypeVariantRaw::EnumRef(ref_type)); }; - let taenum_bits = input.read_tah()?; - let (is_64, is_signed, is_unsigned) = match taenum_bits { + let (is_64, is_signed, is_unsigned) = match input.read_tah()? { None => (false, false, false), Some(TypeAttribute { tattr, extended: None, }) => { + // TODO enum have an align field (MAX_DECL_ALIGN) in tattr? let is_64 = tattr & TAENUM_64BIT != 0; let is_signed = tattr & TAENUM_SIGNED != 0; let is_unsigned = tattr & TAENUM_UNSIGNED != 0; diff --git a/src/til/pointer.rs b/src/til/pointer.rs index db45cee..aecc3bf 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -89,6 +89,7 @@ impl PointerRaw { header: &TILSectionHeader, metadata: u8, ) -> Result { + use crate::til::flag::tattr::*; use crate::til::flag::tattr_ptr::*; use crate::til::flag::tf_ptr::*; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478d67 @@ -103,12 +104,11 @@ impl PointerRaw { }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4804fa // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459b7e - let tah = input.read_tah()?; - let (_ta_lower, is_shifted, ptr_type_raw) = match tah { + let (_ta_lower, is_shifted, ptr_type_raw) = match input.read_tah()? { None => (0, false, 0), Some(TypeAttribute { tattr, extended }) => { // all bits of tattr are consumed - let ta_lower = (tattr & 0xf) as u8; + let ta_lower = (tattr & MAX_DECL_ALIGN) as u8; let is_shifted = tattr & TAPTR_SHIFTED != 0; let ptr_type = tattr & TAPTR_RESTRICT; if let Some(_extended) = extended { From 0d8fa3a41df336b24f93044814652949cf18902c Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 14:51:17 -0300 Subject: [PATCH 36/53] fix read sdacl --- src/ida_reader.rs | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/src/ida_reader.rs b/src/ida_reader.rs index 7962a7b..8e8d466 100644 --- a/src/ida_reader.rs +++ b/src/ida_reader.rs @@ -286,11 +286,10 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x477eff - match sdacl { - //NOTE: original op ((sdacl & 0xcf) ^ 0xC0) <= 0x01 - 0xd0..=0xff | 0xc0 | 0xc1 => Ok(Some(self.read_type_attribute()?)), - _ => Ok(None), - } + //NOTE: original op ((sdacl as u8 & 0xcf) ^ 0xC0) as i32 <= 0x01 + matches!(sdacl, 0xC0..=0xC1 | 0xD0..=0xD1 | 0xE0..=0xE1 | 0xF0..=0xF1) + .then(|| self.read_type_attribute()) + .transpose() } } impl IdaGenericBufUnpack for R {} From f65024f1322e523278096e8ab558cc59d564258d Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 15:55:01 -0300 Subject: [PATCH 37/53] add tilib udt type attribute ext verifications --- src/til.rs | 55 +-------------- src/til/pointer.rs | 6 +- src/til/struct.rs | 172 +++++++++++++++++++++++++++++++++++---------- src/til/union.rs | 38 +++++++--- src/tools/tilib.rs | 9 +-- 5 files changed, 173 insertions(+), 107 deletions(-) diff --git a/src/til.rs b/src/til.rs index 1453fac..9ebee66 100644 --- a/src/til.rs +++ b/src/til.rs @@ -13,7 +13,7 @@ mod size_calculator; pub use size_calculator::*; -use std::num::{NonZeroU16, NonZeroU8}; +use std::num::NonZeroU8; use anyhow::{anyhow, ensure, Context, Result}; @@ -605,56 +605,3 @@ fn serialize_dt(value: u16) -> Result> { result.push(hi as u8); Ok(result) } - -#[derive(Clone, Copy, Debug)] -pub struct StructModifierRaw { - /// Unaligned struct - is_unaligned: bool, - /// Gcc msstruct attribute - is_msstruct: bool, - /// C++ object, not simple pod type - is_cpp_obj: bool, - /// Virtual function table - is_vftable: bool, - // TODO unknown meaning - is_unknown_8: bool, - /// Alignment in bytes - alignment: Option, - /// other unknown value - others: Option, -} - -impl StructModifierRaw { - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x46c4fc print_til_types_att - pub fn from_value(value: u16) -> StructModifierRaw { - use flag::tattr_udt::*; - - // TODO 0x8 seems to be a the packed flag in structs - const TAUDT_ALIGN_MASK: u16 = 0x7; - // TODO find the flag for this and the InnerRef - let is_msstruct = value & TAUDT_MSSTRUCT != 0; - let is_cpp_obj = value & TAUDT_CPPOBJ != 0; - let is_unaligned = value & TAUDT_UNALIGNED != 0; - let is_vftable = value & TAUDT_VFTABLE != 0; - let alignment_raw = value & TAUDT_ALIGN_MASK; - let is_unknown_8 = value & 0x8 != 0; - let alignment = - (alignment_raw != 0).then(|| NonZeroU8::new(1 << (alignment_raw - 1)).unwrap()); - let all_masks = TAUDT_MSSTRUCT - | TAUDT_CPPOBJ - | TAUDT_UNALIGNED - | TAUDT_VFTABLE - | TAUDT_ALIGN_MASK - | 0x8; - let others = NonZeroU16::new(value & !all_masks); - Self { - is_unaligned, - is_msstruct, - is_cpp_obj, - is_vftable, - alignment, - is_unknown_8, - others, - } - } -} diff --git a/src/til/pointer.rs b/src/til/pointer.rs index aecc3bf..744e918 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -1,4 +1,4 @@ -use anyhow::Result; +use anyhow::{ensure, Result}; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; @@ -111,6 +111,10 @@ impl PointerRaw { let ta_lower = (tattr & MAX_DECL_ALIGN) as u8; let is_shifted = tattr & TAPTR_SHIFTED != 0; let ptr_type = tattr & TAPTR_RESTRICT; + ensure!( + tattr & !(TAPTR_SHIFTED | TAPTR_RESTRICT | MAX_DECL_ALIGN) == 0, + "Invalid Pointer taenum_bits {tattr:x}" + ); if let Some(_extended) = extended { // TODO parse extended values, known: // "__org_arrdim" :"\xac\xXX" diff --git a/src/til/struct.rs b/src/til/struct.rs index 30589d5..1583d61 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -1,12 +1,12 @@ -use std::num::{NonZeroU16, NonZeroU8}; +use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeRaw}; -use anyhow::{anyhow, Context, Result}; +use anyhow::{anyhow, ensure, Context, Result}; use num_enum::{FromPrimitive, IntoPrimitive, TryFromPrimitive}; -use super::{StructModifierRaw, TypeVariantRaw}; +use super::{TypeAttribute, TypeVariantRaw}; #[derive(Clone, Debug)] pub struct Struct { @@ -17,16 +17,13 @@ pub struct Struct { /// Gcc msstruct attribute pub is_msstruct: bool, /// C++ object, not simple pod type - pub is_cpp_obj: bool, + pub is_cppobj: bool, /// Virtual function table - pub is_vftable: bool, + pub is_vft: bool, /// Unknown meaning, use at your own risk pub is_uknown_8: bool, /// Alignment in bytes pub alignment: Option, - // TODO delete others, parse all values or return an error - /// other unparsed values from the type attribute - pub others: Option, } impl Struct { pub(crate) fn new( @@ -42,13 +39,12 @@ impl Struct { Ok(Struct { effective_alignment: value.effective_alignment, members, - is_unaligned: value.modifier.is_unaligned, - is_msstruct: value.modifier.is_msstruct, - is_cpp_obj: value.modifier.is_cpp_obj, - is_vftable: value.modifier.is_vftable, - is_uknown_8: value.modifier.is_unknown_8, - alignment: value.modifier.alignment, - others: value.modifier.others, + is_unaligned: value.is_unaligned, + is_msstruct: value.is_msstruct, + is_cppobj: value.is_cppobj, + is_vft: value.is_vft, + is_uknown_8: value.is_unknown_8, + alignment: value.alignment, }) } } @@ -56,8 +52,20 @@ impl Struct { #[derive(Clone, Debug)] pub(crate) struct StructRaw { effective_alignment: Option, - modifier: StructModifierRaw, members: Vec, + + /// Unaligned struct + is_unaligned: bool, + /// Gcc msstruct attribute + is_msstruct: bool, + /// C++ object, not simple pod type + is_cppobj: bool, + /// Virtual function table + is_vft: bool, + // TODO unknown meaning + is_unknown_8: bool, + /// Alignment in bytes + alignment: Option, } impl StructRaw { @@ -83,31 +91,68 @@ impl StructRaw { let alpow = n & 7; let effective_alignment = (alpow != 0).then(|| NonZeroU8::new(1 << (alpow - 1)).unwrap()); // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459c97 - let taudt_bits = input.read_sdacl()?; - // TODO check ext atts - let mut taudt_bits = taudt_bits.map(|x| x.tattr).unwrap_or(0); - - // consume the is_bit used by the StructMemberRaw - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 - let is_bitset = taudt_bits & 0x200 != 0; - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47822d - // TODO this value can't be right, it defines the alignment! - let is_bitset2 = taudt_bits & 0x4 != 0; - taudt_bits &= !0x200; // NOTE don't consume 0x4, it's used somewhere else + let mut alignment = None; + let mut is_unknown_8 = false; + let mut is_msstruct = false; + let mut is_unaligned = false; + let mut is_cppobj = false; + let mut is_vft = false; + let mut is_method = false; + let mut is_bitset2 = false; + if let Some(TypeAttribute { tattr, extended }) = input.read_sdacl()? { + use crate::til::flag::tattr::*; + use crate::til::flag::tattr_field::*; + use crate::til::flag::tattr_udt::*; + + let align_raw = (tattr & MAX_DECL_ALIGN) as u8; + + // TODO WHY? + is_unknown_8 = align_raw & 0x8 != 0; + alignment = NonZeroU8::new(align_raw & 0x7); + + is_msstruct = tattr & TAUDT_MSSTRUCT != 0; + is_unaligned = tattr & TAUDT_UNALIGNED != 0; + is_cppobj = tattr & TAUDT_CPPOBJ != 0; + is_vft = tattr & TAUDT_VFTABLE != 0; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 + // TODO using a field flag on the struct seems out-of-place + is_method = tattr & TAFLD_METHOD != 0; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47822d + // TODO this value can't be right, it defines the alignment! + is_bitset2 = align_raw & 0x4 != 0; + + const ALL_FLAGS: u16 = MAX_DECL_ALIGN + | TAUDT_MSSTRUCT + | TAUDT_UNALIGNED + | TAUDT_CPPOBJ + | TAUDT_VFTABLE + | TAFLD_METHOD; + ensure!( + tattr & !ALL_FLAGS == 0, + "Invalid Struct taenum_bits {tattr:x}" + ); + ensure!( + extended.is_none(), + "Unable to parse extended attributes for struct" + ); + } let members = (0..mem_cnt) .map(|i| { - StructMemberRaw::read(&mut *input, header, is_bitset, is_bitset2) + StructMemberRaw::read(&mut *input, header, is_method, is_bitset2) .with_context(|| format!("Member {i}")) }) .collect::>()?; - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x46c4fc print_til_types_att - let modifier = StructModifierRaw::from_value(taudt_bits); Ok(TypeVariantRaw::Struct(Self { effective_alignment, - modifier, members, + is_unaligned, + is_msstruct, + is_cppobj, + is_vft, + is_unknown_8, + alignment, })) } } @@ -117,6 +162,12 @@ pub struct StructMember { pub name: Option>, pub member_type: Type, pub att: Option, + + pub alignment: Option, + pub is_baseclass: bool, + pub is_unaligned: bool, + pub is_vft: bool, + pub is_method: bool, } impl StructMember { @@ -130,6 +181,11 @@ impl StructMember { name, member_type: Type::new(til, m.ty, fields)?, att: m.att, + alignment: m.alignment, + is_baseclass: m.is_baseclass, + is_unaligned: m.is_unaligned, + is_vft: m.is_vft, + is_method: m.is_method, }) } } @@ -137,6 +193,11 @@ impl StructMember { pub(crate) struct StructMemberRaw { pub ty: TypeRaw, pub att: Option, + pub alignment: Option, + pub is_baseclass: bool, + pub is_unaligned: bool, + pub is_vft: bool, + pub is_method: bool, } impl StructMemberRaw { @@ -153,20 +214,59 @@ impl StructMemberRaw { .then(|| Self::read_member_att_1(input, header)) .transpose()?; + let mut alignment = None; + let mut is_baseclass = false; + let mut is_unaligned = false; + let mut is_vft = false; + let mut is_method = false; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47825d - if !is_bit_set || matches!(att, Some(_att1)) { + if !is_bit_set || att.is_some() { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47825d - let sdacl = input.read_sdacl()?; - let sdacl_value = sdacl.as_ref().map(|x| x.tattr).unwrap_or(0); + if let Some(TypeAttribute { tattr, extended }) = input.read_sdacl()? { + use crate::til::flag::tattr::*; + use crate::til::flag::tattr_field::*; + + alignment = NonZeroU8::new((tattr & MAX_DECL_ALIGN) as u8); + is_baseclass = tattr & TAFLD_BASECLASS != 0; + is_unaligned = tattr & TAFLD_UNALIGNED != 0; + let is_virtbase = tattr & TAFLD_VIRTBASE != 0; + ensure!(!is_virtbase, "UDT Member virtual base is not supported yet"); + is_vft = tattr & TAFLD_VFTABLE != 0; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 + is_method = tattr & TAFLD_METHOD != 0; + const ALL_FLAGS: u16 = MAX_DECL_ALIGN + | TAFLD_BASECLASS + | TAFLD_UNALIGNED + | TAFLD_VFTABLE + | TAFLD_METHOD; + ensure!( + tattr & !ALL_FLAGS == 0, + "Invalid Struct taenum_bits {tattr:x}" + ); + ensure!( + extended.is_none(), + "Unable to parse extended attributes for struct member" + ); + } + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47822d - if is_bit_set2 && sdacl_value & 0x200 == 0 { + if is_bit_set2 && !is_method { // TODO there is more to this impl? // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478411 // todo!(); } } - Ok(Self { ty, att }) + Ok(Self { + ty, + att, + alignment, + is_baseclass, + is_unaligned, + is_vft, + is_method, + }) } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x486cd0 diff --git a/src/til/union.rs b/src/til/union.rs index 0d449d9..af42b60 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -1,4 +1,4 @@ -use anyhow::{anyhow, Context}; +use anyhow::{anyhow, ensure, Context}; use std::num::NonZeroU8; @@ -6,15 +6,15 @@ use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeRaw}; -use super::{StructModifierRaw, TypeVariantRaw}; +use super::{TypeAttribute, TypeVariantRaw}; #[derive(Clone, Debug)] pub struct Union { pub effective_alignment: u16, pub alignment: Option, pub members: Vec<(Option>, Type)>, - // TODO parse type attributes - //others: StructMemberRaw, + + pub is_unaligned: bool, } impl Union { pub(crate) fn new( @@ -35,6 +35,7 @@ impl Union { effective_alignment: value.effective_alignment, alignment: value.alignment, members, + is_unaligned: value.is_unaligned, }) } } @@ -46,6 +47,7 @@ pub(crate) struct UnionRaw { effective_alignment: u16, alignment: Option, members: Vec, + is_unaligned: bool, } impl UnionRaw { @@ -68,12 +70,27 @@ impl UnionRaw { let alpow = n & 7; let mem_cnt = n >> 3; let effective_alignment = if alpow == 0 { 0 } else { 1 << (alpow - 1) }; - let taudt_bits = input.read_sdacl()?; - // TODO handle ext atts - let taudt_bits = taudt_bits.as_ref().map(|x| x.tattr).unwrap_or(0); - let modifiers = StructModifierRaw::from_value(taudt_bits); - // TODO check InnerRef to how to handle modifiers - let alignment = modifiers.alignment; + + let mut alignment = None; + let mut is_unaligned = false; + if let Some(TypeAttribute { tattr, extended }) = input.read_sdacl()? { + use crate::til::flag::tattr::*; + use crate::til::flag::tattr_udt::*; + + alignment = NonZeroU8::new((tattr & MAX_DECL_ALIGN) as u8); + is_unaligned = tattr & TAUDT_UNALIGNED != 0; + + const ALL_FLAGS: u16 = MAX_DECL_ALIGN | TAUDT_UNALIGNED; + ensure!( + tattr & !ALL_FLAGS == 0, + "Invalid Union taenum_bits {tattr:x}" + ); + ensure!( + extended.is_none(), + "Unable to parse extended attributes for union" + ); + } + let members = (0..mem_cnt) .map(|i| TypeRaw::read(&mut *input, header).with_context(|| format!("Member {i}"))) .collect::>()?; @@ -81,6 +98,7 @@ impl UnionRaw { effective_alignment, alignment, members, + is_unaligned, })) } } diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 7571360..e90e38b 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -696,18 +696,15 @@ fn print_til_type_struct( if til_struct.is_msstruct { write!(fmt, "__attribute__((msstruct)) ")?; } - if til_struct.is_cpp_obj { + if til_struct.is_cppobj { write!(fmt, "__cppobj ")?; } - if til_struct.is_vftable { + if til_struct.is_vft { write!(fmt, "/*VFT*/ ")?; } if let Some(align) = til_struct.alignment { write!(fmt, "__attribute__((aligned({align}))) ")?; } - if let Some(others) = til_struct.others { - write!(fmt, "__other({others:04x}) ")?; - } if let Some(name) = name { if print_name { fmt.write_all(name)?; @@ -1181,7 +1178,7 @@ fn is_vft(section: &TILSection, typ: &Type) -> bool { // propagate the search? //TypeVariant::Pointer(pointer) => todo!(), // TODO struct with only function-pointers is also vftable? - TypeVariant::Struct(ty) => ty.is_vftable, + TypeVariant::Struct(ty) => ty.is_vft, TypeVariant::Typedef(typedef) | TypeVariant::StructRef(typedef) => { let inner_type = match typedef { Typedef::Ordinal(ord) => section.get_ord(Id0TilOrd { ord: (*ord).into() }), From 692281d1503233ae19a42e667b6591596eed4e6e Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 16:00:46 -0300 Subject: [PATCH 38/53] follow clippy sugestions --- src/ida_reader.rs | 4 ++-- src/til/section.rs | 2 +- src/til/size_calculator.rs | 17 +++++++---------- src/tools/tilib.rs | 4 ++-- 4 files changed, 12 insertions(+), 15 deletions(-) diff --git a/src/ida_reader.rs b/src/ida_reader.rs index 8e8d466..57fc053 100644 --- a/src/ida_reader.rs +++ b/src/ida_reader.rs @@ -544,10 +544,10 @@ pub trait IdaGenericUnpack: Read { Ok(TypeAttributeExt { _value1, _value2 }) }) .collect::>()?; - return Ok(TypeAttribute { + Ok(TypeAttribute { tattr, extended: Some(extended), - }); + }) } fn read_bytes_len_u16(&mut self) -> Result> { diff --git a/src/til/section.rs b/src/til/section.rs index 87ae61b..4b29bdd 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -136,7 +136,7 @@ impl TILSection { let cn = CCPtrSize::from_cm_raw(header.cm, header.size_int); let cm = CCModel::from_cm_raw(header.cm); - let dependencies = if header.dependencies.len() != 0 { + let dependencies = if !header.dependencies.is_empty() { header .dependencies .split(|x| *x == b',') diff --git a/src/til/size_calculator.rs b/src/til/size_calculator.rs index 8e9e164..1e4913a 100644 --- a/src/til/size_calculator.rs +++ b/src/til/size_calculator.rs @@ -93,7 +93,7 @@ impl<'a> TILTypeSizeSolver<'a> { let align: u64 = 1; let mut members = &til_struct.members[..]; loop { - let first_member = members.get(0); + let first_member = members.first(); let field_size = match first_member.map(|x| &x.member_type.type_variant) { // no more members None => break, @@ -115,8 +115,7 @@ impl<'a> TILTypeSizeSolver<'a> { }; if !til_struct.is_unaligned { let align = first_member - .map(|first| self.alignemnt(&first.member_type, field_size)) - .flatten() + .and_then(|first| self.alignemnt(&first.member_type, field_size)) .unwrap_or(align) .max(1); let align_diff = sum % align; @@ -189,7 +188,7 @@ impl<'a> TILTypeSizeSolver<'a> { Typedef::Name(Some(name)) => self.section.get_name(name), Typedef::Name(None) => None, }; - ty.map(|ty| self.inner_type_size_bytes(&ty.tinfo)).flatten() + ty.and_then(|ty| self.inner_type_size_bytes(&ty.tinfo)) } TypeVariant::Typedef(ty) => { let ty = match ty { @@ -199,11 +198,10 @@ impl<'a> TILTypeSizeSolver<'a> { Typedef::Name(Some(name)) => self.section.get_name(name), Typedef::Name(None) => None, }; - ty.map(|ty| { + ty.and_then(|ty| { let size = self.inner_type_size_bytes(&ty.tinfo).unwrap_or(1); self.alignemnt(&ty.tinfo, size) }) - .flatten() } _ => None, } @@ -219,14 +217,13 @@ fn condensate_bitfields_from_struct( let mut condensated_bits = first_field.width; loop { - let Some(TypeVariant::Bitfield(member)) = rest.get(0).map(|x| &x.member_type.type_variant) + let Some(TypeVariant::Bitfield(member)) = rest.first().map(|x| &x.member_type.type_variant) else { // no more bit-fields to condensate break; }; - let member_bits = u16::from(member.width); // condensate the bit-field into the byte-field - condensated_bits += member_bits; + condensated_bits += member.width; // check if this bit start the next field if field_bytes != member.nbytes || condensated_bits > field_bits { // NOTE this don't consume the current member @@ -236,5 +233,5 @@ fn condensate_bitfields_from_struct( // advance to the next member *rest = &rest[1..]; } - return field_bytes; + field_bytes } diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index e90e38b..162a688 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -234,7 +234,7 @@ fn print_symbols( write!(fmt, " {} ", sym_kind)?; // TODO investiage this - let name = if symbol.ordinal == 0 && symbol.name.get(0) == Some(&b'_') { + let name = if symbol.ordinal == 0 && symbol.name.first() == Some(&b'_') { // remove the first "_", if any &symbol.name[1..] } else { @@ -640,7 +640,7 @@ fn print_til_type_typedef( } idb_rs::til::Typedef::Name(Some(name)) => { // NOTE don't need to get the inner type, we already have it's name - fmt.write_all(&name)?; + fmt.write_all(name)?; true } // Nothing to print From 1743e1cf63489c63f8f2070a2621b2a21ea58193 Mon Sep 17 00:00:00 2001 From: rbran Date: Wed, 8 Jan 2025 16:21:02 -0300 Subject: [PATCH 39/53] add tilib function type attribute ext verifications --- src/til/function.rs | 48 ++++++++++++++++++++++----------------------- 1 file changed, 23 insertions(+), 25 deletions(-) diff --git a/src/til/function.rs b/src/til/function.rs index bfded55..4bcde71 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -127,7 +127,7 @@ impl FunctionRaw { }; // TODO InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x473bf1 print_til_type - let (cc, mut flags, _spoiled) = read_cc(&mut *input)?; + let (cc, flags, _spoiled) = read_cc(&mut *input)?; let cc = CallingConvention::from_cm_raw(cc)?; // TODO investigate why this don't hold true @@ -141,30 +141,28 @@ impl FunctionRaw { // consume the flags and verify if a unknown value is present // TODO find those in flags - let _have_spoiled = flags & 0x0001 != 0; - flags &= !1; - let is_noret = flags & 0x0002 != 0; - flags &= !0x0002; - let is_pure = flags & 0x0004 != 0; - flags &= !0x0004; - let is_high = flags & 0x0008 != 0; - flags &= !0x0008; - let is_static = flags & 0x0010 != 0; - flags &= !0x0010; - let is_virtual = flags & 0x0020 != 0; - flags &= !0x0020; - // TODO find this flag meaning - //let is_TODO = flags & 0x0200 != 0; - flags &= !0x0200; - let is_const = flags & 0x00400 != 0; - flags &= !0x0400; - let is_constructor = flags & 0x0800 != 0; - flags &= !0x0800; - let is_destructor = flags & 0x1000 != 0; - flags &= !0x0100; - ensure!(flags == 0, "unknown function attrs({flags:04X})"); - - let _tah = input.read_tah()?; + let have_spoiled = flags & 0x0001 != 0; + if !have_spoiled { + ensure!(_spoiled.is_empty()); + } + let flags_lower = ((flags & 0xFF) >> 1) as u8; + + let is_noret = flags_lower & BFA_NORET != 0; + let is_pure = flags_lower & BFA_PURE != 0; + let is_high = flags_lower & BFA_HIGH != 0; + let is_static = flags_lower & BFA_STATIC != 0; + let is_virtual = flags_lower & BFA_VIRTUAL != 0; + ensure!(flags_lower & !(BFA_NORET | BFA_PURE | BFA_HIGH | BFA_STATIC | BFA_VIRTUAL) == 0); + + // TODO find those flags + const BFA_CONST: u8 = 0x4; + const BFA_CONSTRUCTOR: u8 = 0x8; + const BFA_DESTRUCTOR: u8 = 0x10; + let flags_upper = ((flags & 0xFF00) >> 8) as u8; + let is_const = flags_upper & BFA_CONST != 0; + let is_constructor = flags_upper & BFA_CONSTRUCTOR != 0; + let is_destructor = flags_upper & BFA_DESTRUCTOR != 0; + ensure!(flags_upper & !(BFA_CONST | BFA_CONSTRUCTOR | BFA_DESTRUCTOR) == 0); let ret = TypeRaw::read(&mut *input, header).context("Return Argument")?; // TODO double check documentation for [flag::tf_func::BT_FUN] From b99ce5f9f42c07363c1b60477c3ef5c0c629b702 Mon Sep 17 00:00:00 2001 From: rbran Date: Thu, 9 Jan 2025 13:09:55 -0300 Subject: [PATCH 40/53] add a permissive feature The permissive feature will make allow a more "relaxed" parsing of files, making fewer checks and defaulting to 0 if EoF is found. --- Cargo.toml | 4 ++ src/ida_reader.rs | 130 ++++++++++++++++++++++++++++++++++++++------ src/lib.rs | 68 +++++++++++++---------- src/til.rs | 10 +++- src/til/array.rs | 17 +++--- src/til/bitfield.rs | 22 +++++++- src/til/enum.rs | 62 +++++++++++---------- src/til/function.rs | 24 +++++--- src/til/pointer.rs | 12 ++-- src/til/section.rs | 10 +++- src/til/struct.rs | 28 +++++++--- src/til/union.rs | 28 ++++++---- 12 files changed, 297 insertions(+), 118 deletions(-) diff --git a/Cargo.toml b/Cargo.toml index 1e45a7c..3d2d581 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -14,6 +14,10 @@ flate2 = "1.0.31" serde = { version = "1.0", features = ["derive"] } num_enum = "0.7.3" +[features] +default = [] +permissive = [] + [[bin]] name = "idb-tools" path = "src/tools/tools.rs" diff --git a/src/ida_reader.rs b/src/ida_reader.rs index 57fc053..f314bed 100644 --- a/src/ida_reader.rs +++ b/src/ida_reader.rs @@ -43,9 +43,12 @@ pub trait IdaUnpack: IdaGenericUnpack { if self.is_64() { let start = self.unpack_dq()?; let len = self.unpack_dq()?; + #[cfg(not(feature = "permissive"))] let end = start .checked_add(len) .ok_or_else(|| anyhow!("Function range overflows"))?; + #[cfg(feature = "permissive")] + let end = start.saturating_add(len); Ok(start..end) } else { let start = self.unpack_dd_ext_max()?; @@ -54,7 +57,10 @@ pub trait IdaUnpack: IdaGenericUnpack { let end = match start.checked_add(len.into()) { Some(0xFFFF_FFFF) => u64::MAX, Some(value) => value, + #[cfg(not(feature = "permissive"))] None => return Err(anyhow!("Function range overflows")), + #[cfg(feature = "permissive")] + None => u64::MAX, }; Ok(start..end) } @@ -172,11 +178,14 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { let mut nelem = 0; // TODO check no more then 9 bytes are read loop { - let Some(typ) = self.fill_buf()?.first().copied() else { + let Some(typ) = self.peek_u8()? else { + #[cfg(not(feature = "permissive"))] return Err(anyhow!(std::io::Error::new( std::io::ErrorKind::UnexpectedEof, "Unexpected EoF on DA" ))); + #[cfg(feature = "permissive")] + return Ok((nelem, base)); }; if typ & 0x80 == 0 { break; @@ -192,11 +201,14 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { } nelem = (z >> 4) & 7; loop { - let Some(y) = self.fill_buf()?.first().copied() else { + let Some(y) = self.peek_u8()? else { + #[cfg(not(feature = "permissive"))] return Err(anyhow!(std::io::Error::new( std::io::ErrorKind::UnexpectedEof, "Unexpected EoF on DA" ))); + #[cfg(feature = "permissive")] + return Ok((nelem, base)); }; if (y & 0x80) == 0 { break; @@ -218,7 +230,13 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { let mut buf = vec![]; self.read_until(b'\x00', &mut buf)?; // last char need to be \x00 or we found a EoF - ensure!(buf.pop() == Some(b'\x00'), "Unexpected EoF on CStr"); + if let Some(b'\x00') = buf.last() { + let _ = buf.pop(); // remove the \x00 from the end + } else { + // found EOF, aka could not find the \x00 for the string end + #[cfg(not(feature = "permissive"))] + return Err(anyhow!("Unexpected EoF on CStr")); + } Ok(buf) } @@ -249,6 +267,7 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { if (start_value >> bit) & 1 != 0 { let value = self.read_u8()?; // TODO is this an error or expect possible value? + #[cfg(not(feature = "permissive"))] ensure!(value != 0); acc |= (value as u64) << byte; } @@ -301,6 +320,13 @@ pub trait IdaGenericUnpack: Read { Ok(data[0]) } + #[cfg(feature = "permissive")] + fn read_u8_or_nothing(&mut self) -> Result> { + let mut data = [0; 1]; + let read = self.read_exact_or_nothing(&mut data)?; + Ok((read == data.len()).then_some(data[0])) + } + fn read_u16(&mut self) -> Result { let mut data = [0; 2]; self.read_exact(&mut data)?; @@ -339,7 +365,13 @@ pub trait IdaGenericUnpack: Read { // NOTE: the original implementation never fails, if input hit EoF it a partial result or 0 /// Reads 1 to 3 bytes. fn unpack_dw(&mut self) -> Result { - let b1: u8 = bincode::deserialize_from(&mut *self)?; + #[cfg(not(feature = "permissive"))] + let b1 = self.read_u8()?; + #[cfg(feature = "permissive")] + let Some(b1) = self.read_u8_or_nothing()? + else { + return Ok(0); + }; match b1 { // 7 bit value // [0xxx xxxx] @@ -347,7 +379,10 @@ pub trait IdaGenericUnpack: Read { // 14 bits value // [10xx xxxx] xxxx xxxx 0x80..=0xBF => { - let lo: u8 = bincode::deserialize_from(&mut *self)?; + #[cfg(not(feature = "permissive"))] + let lo = self.read_u8()?; + #[cfg(feature = "permissive")] + let lo = self.read_u8_or_nothing()?.unwrap_or(0); Ok(u16::from_be_bytes([b1 & 0x3F, lo])) } // 16 bits value @@ -355,7 +390,16 @@ pub trait IdaGenericUnpack: Read { 0xC0..=0xFF => { // NOTE first byte 6 bits seems to be ignored //ensure!(header != 0xC0 && header != 0xFF); - Ok(u16::from_be_bytes(bincode::deserialize_from(&mut *self)?)) + #[cfg(not(feature = "permissive"))] + let (lo, hi) = (self.read_u8()?, self.read_u8()?); + + #[cfg(feature = "permissive")] + let (lo, hi) = ( + self.read_u8_or_nothing()?.unwrap_or(0), + self.read_u8_or_nothing()?.unwrap_or(0), + ); + + Ok(u16::from_be_bytes([lo, hi])) } } } @@ -364,7 +408,13 @@ pub trait IdaGenericUnpack: Read { // NOTE the orignal implementation never fails, if input hit EoF it a partial result or 0 /// Reads 1 to 5 bytes. fn unpack_dd(&mut self) -> Result { - let b1: u8 = bincode::deserialize_from(&mut *self)?; + #[cfg(not(feature = "permissive"))] + let b1 = self.read_u8()?; + #[cfg(feature = "permissive")] + let Some(b1) = self.read_u8_or_nothing()? + else { + return Ok(0); + }; match b1 { // 7 bit value // [0xxx xxxx] @@ -372,13 +422,20 @@ pub trait IdaGenericUnpack: Read { // 14 bits value // [10xx xxxx] xxxx xxxx 0x80..=0xBF => { - let lo: u8 = bincode::deserialize_from(&mut *self)?; + #[cfg(not(feature = "permissive"))] + let lo = self.read_u8()?; + #[cfg(feature = "permissive")] + let lo = self.read_u8_or_nothing()?.unwrap_or(0); Ok(u32::from_be_bytes([0, 0, b1 & 0x3F, lo])) } // 29 bit value: // [110x xxxx] xxxx xxxx xxxx xxxx xxxx xxxx 0xC0..=0xDF => { - let bytes: [u8; 3] = bincode::deserialize_from(&mut *self)?; + let mut bytes: [u8; 3] = [0; 3]; + #[cfg(not(feature = "permissive"))] + self.read_exact(&mut bytes)?; + #[cfg(feature = "permissive")] + let _size = self.read_exact_or_nothing(&mut bytes)?; Ok(u32::from_be_bytes([ b1 & 0x1F, bytes[0], @@ -391,7 +448,12 @@ pub trait IdaGenericUnpack: Read { 0xE0..=0xFF => { // NOTE first byte 5 bits seems to be ignored //ensure!(header != 0xE0 && header != 0xFF); - Ok(u32::from_be_bytes(bincode::deserialize_from(&mut *self)?)) + let mut bytes: [u8; 4] = [0; 4]; + #[cfg(not(feature = "permissive"))] + self.read_exact(&mut bytes)?; + #[cfg(feature = "permissive")] + let _size = self.read_exact_or_nothing(&mut bytes)?; + Ok(u32::from_be_bytes(bytes)) } } } @@ -418,14 +480,20 @@ pub trait IdaGenericUnpack: Read { fn unpack_ds(&mut self) -> Result> { let len = self.unpack_dd()?; let mut result = vec![0; len.try_into()?]; + #[cfg(not(feature = "permissive"))] self.read_exact(&mut result)?; + #[cfg(feature = "permissive")] + let _size = self.read_exact_or_nothing(&mut result)?; Ok(result) } fn unpack_dt_bytes(&mut self) -> Result> { let buf_len = self.read_dt()?; let mut buf = vec![0; buf_len.into()]; + #[cfg(not(feature = "permissive"))] self.read_exact(&mut buf)?; + #[cfg(feature = "permissive")] + let _size = self.read_exact_or_nothing(&mut buf)?; Ok(buf) } @@ -437,13 +505,19 @@ pub trait IdaGenericUnpack: Read { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48cdb0 let mut acc: u32 = 0; for _ in 0..5 { - let b: u32 = self.read_u8()?.into(); + #[cfg(not(feature = "permissive"))] + let b = self.read_u8()?; + #[cfg(feature = "permissive")] + let Some(b) = self.read_u8_or_nothing()? + else { + return Ok(acc); + }; if b & 0x80 == 0 { - acc = (b & 0x3F) | (acc << 6); + acc = (b & 0x3F) as u32 | (acc << 6); return Ok(acc); } - acc = (acc << 7) | (b & 0x7F); + acc = (acc << 7) | (b & 0x7F) as u32; } Err(anyhow!("Can't find the end of DE")) } @@ -454,12 +528,19 @@ pub trait IdaGenericUnpack: Read { fn read_dt(&mut self) -> Result { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48cd60 let value = match self.read_u8()? { + #[cfg(not(feature = "permissive"))] 0 => return Err(anyhow!("DT can't have 0 value")), + #[cfg(feature = "permissive")] + 0 => return Ok(0), //SEG = 2 value @ 0x80.. => { - let inter: u16 = self.read_u8()?.into(); + #[cfg(not(feature = "permissive"))] + let inter = self.read_u8()?; + #[cfg(feature = "permissive")] + let inter = self.read_u8_or_nothing()?.unwrap_or(0); + #[cfg(not(feature = "permissive"))] ensure!(inter != 0, "DT can't have a following 0 value"); - value as u16 & 0x7F | inter << 7 + value as u16 & 0x7F | (inter as u16) << 7 } //SEG = 1 value @ ..=0x7F => value.into(), @@ -498,7 +579,16 @@ pub trait IdaGenericUnpack: Read { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452830 fn read_type_attribute(&mut self) -> Result { use crate::til::flag::tattr_ext::*; - let byte0: u8 = self.read_u8()?; + #[cfg(not(feature = "permissive"))] + let byte0 = self.read_u8()?; + #[cfg(feature = "permissive")] + let Some(byte0) = self.read_u8_or_nothing()? + else { + return Ok(TypeAttribute { + tattr: 0, + extended: None, + }); + }; let mut tattr = 0; if byte0 != 0xfe { tattr = ((byte0 as u16 & 1) | ((byte0 as u16 >> 3) & 6)) + 1; @@ -508,7 +598,13 @@ pub trait IdaGenericUnpack: Read { let mut shift = 0; // TODO limit the loop to only 0..n loop { - let next_byte: u8 = self.read_u8()?; + #[cfg(not(feature = "permissive"))] + let next_byte = self.read_u8()?; + #[cfg(feature = "permissive")] + let Some(next_byte) = self.read_u8_or_nothing()? + else { + break; + }; ensure!( next_byte != 0, "Failed to parse TypeAttribute, byte is zero" diff --git a/src/lib.rs b/src/lib.rs index b5873b2..5c8f389 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -1,3 +1,4 @@ +#[forbid(unsafe_code)] pub mod id0; pub mod id1; pub(crate) mod ida_reader; @@ -111,7 +112,7 @@ impl IDBParser { let mut input = std::io::Read::take(&mut self.input, section_header.len); match section_header.compress { IDBSectionCompression::Zlib => { - let mut input = flate2::read::ZlibDecoder::new(input); + let mut input = flate2::bufread::ZlibDecoder::new(input); let _ = std::io::copy(&mut input, output)?; } IDBSectionCompression::None => { @@ -295,15 +296,18 @@ impl IDBHeader { ) -> Result { #[derive(Debug, Deserialize)] struct V1Raw { - id2_offset: u32, + _id2_offset: u32, checksums: [u32; 3], - unk30_zeroed: u32, + _unk30_zeroed: u32, unk33_checksum: u32, } let v1_raw: V1Raw = bincode::deserialize_from(input)?; - ensure!(v1_raw.unk30_zeroed == 0, "unk30 not zeroed"); - ensure!(v1_raw.id2_offset == 0, "id2 in V1 is not zeroed"); + #[cfg(not(feature = "permissive"))] + { + ensure!(v1_raw._unk30_zeroed == 0, "unk30 not zeroed"); + ensure!(v1_raw._id2_offset == 0, "id2 in V1 is not zeroed"); + } // TODO ensure all offsets point to after the header Ok(Self { @@ -328,20 +332,23 @@ impl IDBHeader { ) -> Result { #[derive(Debug, Deserialize)] struct V4Raw { - id2_offset: u32, + _id2_offset: u32, checksums: [u32; 3], - unk30_zeroed: u32, + _unk30_zeroed: u32, unk33_checksum: u32, - unk38_zeroed: [u8; 8], - unk40_v5c: u32, + _unk38_zeroed: [u8; 8], + _unk40_v5c: u32, } let v4_raw: V4Raw = bincode::deserialize_from(input)?; - ensure!(v4_raw.unk30_zeroed == 0, "unk30 not zeroed"); - ensure!(v4_raw.id2_offset == 0, "id2 in V4 is not zeroed"); - ensure!(v4_raw.unk38_zeroed == [0; 8], "unk38 is not zeroed"); - ensure!(v4_raw.unk40_v5c == 0x5c, "unk40 is not 0x5C"); + #[cfg(not(feature = "permissive"))] + { + ensure!(v4_raw._unk30_zeroed == 0, "unk30 not zeroed"); + ensure!(v4_raw._id2_offset == 0, "id2 in V4 is not zeroed"); + ensure!(v4_raw._unk38_zeroed == [0; 8], "unk38 is not zeroed"); + ensure!(v4_raw._unk40_v5c == 0x5c, "unk40 is not 0x5C"); + } // TODO ensure all offsets point to after the header Ok(Self { @@ -367,14 +374,14 @@ impl IDBHeader { #[derive(Debug, Deserialize)] struct V5Raw { nam_offset: u64, - seg_offset_zeroed: u64, + _seg_offset_zeroed: u64, til_offset: u64, initial_checksums: [u32; 3], - unk4_zeroed: u32, + _unk4_zeroed: u32, unk_checksum: u32, - id2_offset_zeroed: u64, + _id2_offset_zeroed: u64, final_checksum: u32, - unk0_v7c: u32, + _unk0_v7c: u32, } let v5_raw: V5Raw = bincode::deserialize_from(input)?; let id0_offset = @@ -383,11 +390,13 @@ impl IDBHeader { u64::from_le(u64::from(header_raw.offsets[3]) << 32 | u64::from(header_raw.offsets[2])); // TODO Final checksum is always zero on v5? - - ensure!(v5_raw.unk4_zeroed == 0, "unk4 not zeroed"); - ensure!(v5_raw.id2_offset_zeroed == 0, "id2 in V5 is not zeroed"); - ensure!(v5_raw.seg_offset_zeroed == 0, "seg in V5 is not zeroed"); - ensure!(v5_raw.unk0_v7c == 0x7C, "unk0 not 0x7C"); + #[cfg(not(feature = "permissive"))] + { + ensure!(v5_raw._unk4_zeroed == 0, "unk4 not zeroed"); + ensure!(v5_raw._id2_offset_zeroed == 0, "id2 in V5 is not zeroed"); + ensure!(v5_raw._seg_offset_zeroed == 0, "seg in V5 is not zeroed"); + ensure!(v5_raw._unk0_v7c == 0x7C, "unk0 not 0x7C"); + } // TODO ensure all offsets point to after the header Ok(Self { @@ -414,14 +423,14 @@ impl IDBHeader { #[derive(Debug, Deserialize)] struct V6Raw { nam_offset: u64, - seg_offset_zeroed: u64, + _seg_offset_zeroed: u64, til_offset: u64, initial_checksums: [u32; 3], - unk4_zeroed: [u8; 4], + _unk4_zeroed: [u8; 4], unk5_checksum: u32, id2_offset: u64, final_checksum: u32, - unk0_v7c: u32, + _unk0_v7c: u32, } let v6_raw: V6Raw = bincode::deserialize_from(input)?; let id0_offset = @@ -429,9 +438,12 @@ impl IDBHeader { let id1_offset = u64::from_le(u64::from(header_raw.offsets[3]) << 32 | u64::from(header_raw.offsets[2])); - ensure!(v6_raw.unk4_zeroed == [0; 4], "unk4 not zeroed"); - ensure!(v6_raw.seg_offset_zeroed == 0, "seg in V6 is not zeroed"); - ensure!(v6_raw.unk0_v7c == 0x7C, "unk0 not 0x7C"); + #[cfg(not(feature = "permissive"))] + { + ensure!(v6_raw._unk4_zeroed == [0; 4], "unk4 not zeroed"); + ensure!(v6_raw._seg_offset_zeroed == 0, "seg in V6 is not zeroed"); + ensure!(v6_raw._unk0_v7c == 0x7C, "unk0 not 0x7C"); + } // TODO ensure all offsets point to after the header Ok(Self { diff --git a/src/til.rs b/src/til.rs index 9ebee66..f8f2bf0 100644 --- a/src/til.rs +++ b/src/til.rs @@ -91,6 +91,7 @@ impl TILTypeInfo { .into_iter() .map(|field| if field.is_empty() { None } else { Some(field) }); let tinfo = Type::new(til, tinfo_raw, &mut fields_iter)?; + #[cfg(not(feature = "permissive"))] ensure!( fields_iter.next().is_none(), "Extra fields found for til type \"{}\"", @@ -186,10 +187,11 @@ impl Type { &[b'\x00'] => {} // in continuations, the \x00 may be missing &[] => {} - rest => { + _rest => { + #[cfg(not(feature = "permissive"))] return Err(anyhow!( "Extra {} bytes after reading TIL from ID0", - rest.len() + _rest.len() )); } } @@ -198,6 +200,7 @@ impl Type { .into_iter() .map(|field| if field.is_empty() { None } else { Some(field) }); let result = Self::new(&header, type_raw, &mut fields_iter)?; + #[cfg(not(feature = "permissive"))] ensure!( fields_iter.next().is_none(), "Extra fields found for id0 til" @@ -514,6 +517,7 @@ impl TILMacro { let have_param = flag & 0x100 != 0; let param_num = have_param.then_some((flag & 0xFF) as u8); if !have_param { + #[cfg(not(feature = "permissive"))] ensure!(flag & 0xFF == 0, "Unknown/Invalid value for TILMacro flag"); } // TODO find the InnerRef for this @@ -547,12 +551,14 @@ impl TILMacro { (_, None) => {} // having params, where should not (None, Some(_max)) => { + #[cfg(not(feature = "permissive"))] return Err(anyhow!( "Macro value have params but it is not declared in the flag", )) } // only using params that exist (Some(params), Some(max)) if max <= params => { + #[cfg(not(feature = "permissive"))] ensure!( max <= params, "Macro value have more params then declared in the flag" diff --git a/src/til/array.rs b/src/til/array.rs index 1383c24..a299f32 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -1,7 +1,5 @@ use std::num::{NonZeroU16, NonZeroU8}; -use anyhow::ensure; - use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeAttribute, TypeRaw}; @@ -58,15 +56,20 @@ impl ArrayRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48078e let align = match input.read_tah()? { None => None, - Some(TypeAttribute { tattr, extended }) => { + Some(TypeAttribute { + tattr, + extended: _extended, + }) => { let align = (tattr & MAX_DECL_ALIGN) as u8; - ensure!( + #[cfg(not(feature = "permissive"))] + anyhow::ensure!( tattr & !MAX_DECL_ALIGN == 0, "unknown TypeAttribute {tattr:x}" ); - ensure!( - extended.is_none(), - "unknown TypeAttribute ext {extended:x?}" + #[cfg(not(feature = "permissive"))] + anyhow::ensure!( + _extended.is_none(), + "unknown TypeAttribute ext {_extended:x?}" ); NonZeroU8::new(align) } diff --git a/src/til/bitfield.rs b/src/til/bitfield.rs index ba279c8..e1660ff 100644 --- a/src/til/bitfield.rs +++ b/src/til/bitfield.rs @@ -1,7 +1,11 @@ use std::num::NonZeroU8; +use anyhow::Result; + use crate::ida_reader::IdaGenericBufUnpack; +use super::TypeAttribute; + #[derive(Debug, Clone, Copy)] pub struct Bitfield { pub unsigned: bool, @@ -23,7 +27,7 @@ pub struct Bitfield { } impl Bitfield { - pub(crate) fn read(input: &mut impl IdaGenericBufUnpack, metadata: u8) -> anyhow::Result { + pub(crate) fn read(input: &mut impl IdaGenericBufUnpack, metadata: u8) -> Result { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x472f3c print_til_type let nbytes = match metadata { super::flag::tf_complex::BTMT_BFLDI8 => 1, @@ -35,7 +39,21 @@ impl Bitfield { let dt = input.read_dt()?; let width = dt >> 1; let unsigned = (dt & 1) > 0; - let _tah = input.read_tah()?; + match input.read_tah()? { + None => {} + Some(TypeAttribute { + tattr: _tattr, + extended: _extended, + }) => { + #[cfg(not(feature = "permissive"))] + anyhow::ensure!(_tattr == 0, "Unknown TypeAttribute {_tattr:x}"); + #[cfg(not(feature = "permissive"))] + anyhow::ensure!( + _extended.is_none(), + "Unknown TypeAttribute ext {_extended:x?}" + ); + } + } Ok(Self { unsigned, width, diff --git a/src/til/enum.rs b/src/til/enum.rs index 6f562ce..95c7c42 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -69,38 +69,39 @@ impl EnumRaw { return Ok(TypeVariantRaw::EnumRef(ref_type)); }; - let (is_64, is_signed, is_unsigned) = match input.read_tah()? { - None => (false, false, false), - Some(TypeAttribute { - tattr, - extended: None, - }) => { - // TODO enum have an align field (MAX_DECL_ALIGN) in tattr? - let is_64 = tattr & TAENUM_64BIT != 0; - let is_signed = tattr & TAENUM_SIGNED != 0; - let is_unsigned = tattr & TAENUM_UNSIGNED != 0; - ensure!( - tattr & !(TAENUM_64BIT | TAENUM_SIGNED | TAENUM_UNSIGNED) == 0, - "Invalid Enum taenum_bits {tattr:x}" - ); - ensure!( - !(is_signed && is_unsigned), - "Enum can't be signed and unsigned at the same time" - ); - (is_64, is_signed, is_unsigned) - } - // TODO parse ext attr? - Some(TypeAttribute { - tattr: _, - extended: Some(_), - }) => { - return Err(anyhow!("Unable to parse extended attributes for enum")); - } - }; + let mut is_64 = false; + let mut is_signed = false; + let mut is_unsigned = false; + if let Some(TypeAttribute { + tattr, + extended: _extended, + }) = input.read_sdacl()? + { + // TODO enum have an align field (MAX_DECL_ALIGN) in tattr? + is_64 = tattr & TAENUM_64BIT != 0; + is_signed = tattr & TAENUM_SIGNED != 0; + is_unsigned = tattr & TAENUM_UNSIGNED != 0; + #[cfg(not(feature = "permissive"))] + ensure!( + tattr & !(TAENUM_64BIT | TAENUM_SIGNED | TAENUM_UNSIGNED) == 0, + "Invalid Enum taenum_bits {tattr:x}" + ); + #[cfg(not(feature = "permissive"))] + ensure!( + !(is_signed && is_unsigned), + "Enum can't be signed and unsigned at the same time" + ); + #[cfg(not(feature = "permissive"))] + ensure!( + _extended.is_none(), + "Unable to parse extended attributes for Enum" + ); + } // all BTE bits are consumed let bte = input.read_u8()?; let storage_size_raw = bte & BTE_SIZE_MASK; + #[cfg(not(feature = "permissive"))] ensure!( bte & BTE_RESERVED == 0, "Enum BTE including the Always off sub-field" @@ -123,9 +124,10 @@ impl EnumRaw { // TODO enum size defaults to 4? let storage_size_final = storage_size.map(NonZeroU8::get).unwrap_or(4); let mask: u64 = if storage_size_final >= 16 { - // is saturating valid? - //u64::MAX + #[cfg(not(feature = "permissive"))] return Err(anyhow!("Bytes size is too big")); + #[cfg(feature = "permissive")] + u64::MAX } else { u64::MAX >> (u64::BITS - (storage_size_final as u32 * 8)) }; diff --git a/src/til/function.rs b/src/til/function.rs index 4bcde71..a45b749 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -152,6 +152,7 @@ impl FunctionRaw { let is_high = flags_lower & BFA_HIGH != 0; let is_static = flags_lower & BFA_STATIC != 0; let is_virtual = flags_lower & BFA_VIRTUAL != 0; + #[cfg(not(feature = "permissive"))] ensure!(flags_lower & !(BFA_NORET | BFA_PURE | BFA_HIGH | BFA_STATIC | BFA_VIRTUAL) == 0); // TODO find those flags @@ -162,6 +163,7 @@ impl FunctionRaw { let is_const = flags_upper & BFA_CONST != 0; let is_constructor = flags_upper & BFA_CONSTRUCTOR != 0; let is_destructor = flags_upper & BFA_DESTRUCTOR != 0; + #[cfg(not(feature = "permissive"))] ensure!(flags_upper & !(BFA_CONST | BFA_CONSTRUCTOR | BFA_DESTRUCTOR) == 0); let ret = TypeRaw::read(&mut *input, header).context("Return Argument")?; @@ -275,7 +277,10 @@ impl ArgLoc { let sval = input.read_de()?; Ok(Self::Static(sval)) } + #[cfg(not(feature = "permissive"))] ALOC_CUSTOM.. => Err(anyhow!("Custom implementation for ArgLoc")), + #[cfg(feature = "permissive")] + ALOC_CUSTOM.. => Ok(Self::None), } } } @@ -373,19 +378,19 @@ impl CCPtrSize { pub const fn near_bytes(self) -> NonZeroU8 { match self { - CCPtrSize::N8F16 => unsafe { NonZeroU8::new_unchecked(1) }, - CCPtrSize::N16F32 => unsafe { NonZeroU8::new_unchecked(2) }, - CCPtrSize::N32F48 => unsafe { NonZeroU8::new_unchecked(4) }, - CCPtrSize::N64 => unsafe { NonZeroU8::new_unchecked(8) }, + CCPtrSize::N8F16 => NonZeroU8::new(1).unwrap(), + CCPtrSize::N16F32 => NonZeroU8::new(2).unwrap(), + CCPtrSize::N32F48 => NonZeroU8::new(4).unwrap(), + CCPtrSize::N64 => NonZeroU8::new(8).unwrap(), } } pub const fn far_bytes(self) -> NonZeroU8 { match self { - CCPtrSize::N8F16 => unsafe { NonZeroU8::new_unchecked(2) }, - CCPtrSize::N16F32 => unsafe { NonZeroU8::new_unchecked(4) }, - CCPtrSize::N32F48 => unsafe { NonZeroU8::new_unchecked(6) }, - CCPtrSize::N64 => unsafe { NonZeroU8::new_unchecked(8) }, + CCPtrSize::N8F16 => NonZeroU8::new(2).unwrap(), + CCPtrSize::N16F32 => NonZeroU8::new(4).unwrap(), + CCPtrSize::N32F48 => NonZeroU8::new(6).unwrap(), + CCPtrSize::N64 => NonZeroU8::new(8).unwrap(), } } } @@ -516,9 +521,12 @@ fn read_cc_spoiled( } else { let size = (b >> 4) + 1; // TODO what if (b & 0xF) == 0? + #[cfg(not(feature = "permissive"))] let reg = (b & 0xF) .checked_sub(1) .ok_or_else(|| anyhow!("invalid spoiled reg value"))?; + #[cfg(feature = "permissive")] + let reg = (b & 0xF).saturating_sub(1); spoiled.push((reg.into(), size)) } } diff --git a/src/til/pointer.rs b/src/til/pointer.rs index 744e918..52ae45a 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -1,4 +1,4 @@ -use anyhow::{ensure, Result}; +use anyhow::Result; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::section::TILSectionHeader; @@ -106,16 +106,20 @@ impl PointerRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459b7e let (_ta_lower, is_shifted, ptr_type_raw) = match input.read_tah()? { None => (0, false, 0), - Some(TypeAttribute { tattr, extended }) => { + Some(TypeAttribute { + tattr, + extended: _extended, + }) => { // all bits of tattr are consumed let ta_lower = (tattr & MAX_DECL_ALIGN) as u8; let is_shifted = tattr & TAPTR_SHIFTED != 0; let ptr_type = tattr & TAPTR_RESTRICT; - ensure!( + #[cfg(not(feature = "permissive"))] + anyhow::ensure!( tattr & !(TAPTR_SHIFTED | TAPTR_RESTRICT | MAX_DECL_ALIGN) == 0, "Invalid Pointer taenum_bits {tattr:x}" ); - if let Some(_extended) = extended { + if let Some(_extended) = _extended { // TODO parse extended values, known: // "__org_arrdim" :"\xac\xXX" // "__org_typedef":..., diff --git a/src/til/section.rs b/src/til/section.rs index 4b29bdd..342e508 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -285,7 +285,7 @@ impl TILSection { let size_long_double = header1 .flags .has_size_long_double() - .then(|| bincode::deserialize_from::<_, u8>(&mut *input)) + .then(|| input.read_u8()) .transpose()? .map(|size| size.try_into()) .transpose()?; @@ -468,6 +468,7 @@ impl TILSection { pub struct TILSectionFlags(pub(crate) u16); impl TILSectionFlags { fn new(value: u32) -> Result { + #[cfg(not(feature = "permissive"))] ensure!( value < (flag::til::TIL_SLD as u32) << 1, "Unknown flag values for TILSectionFlags" @@ -585,6 +586,7 @@ impl TILSection { next_ordinal, ordinal_alias, )?; + #[cfg(not(feature = "permissive"))] ensure!( compressed_input.limit() == 0, "TypeBucket compressed data is smaller then expected" @@ -613,6 +615,7 @@ impl TILSection { let type_info = (0..ndefs) .map(|i| TILTypeInfo::read(&mut input, header, i == ndefs - 1)) .collect::>()?; + #[cfg(not(feature = "permissive"))] ensure!( input.limit() == 0, "TypeBucket total data is smaller then expected" @@ -637,6 +640,7 @@ impl TILSection { let type_info = (0..ndefs) .map(|_| TILMacro::read(&mut input)) .collect::>()?; + #[cfg(not(feature = "permissive"))] ensure!( input.limit() == 0, "TypeBucket macro total data is smaller then expected" @@ -655,10 +659,12 @@ impl TILSection { .map(|_| TILMacro::read(&mut decompressed_input)) .collect::, _>>()?; // make sure the input was fully consumed + #[cfg(not(feature = "permissive"))] ensure!( decompressed_input.limit() == 0, "TypeBucket macros data is smaller then expected" ); + #[cfg(not(feature = "permissive"))] ensure!( compressed_input.limit() == 0, "TypeBucket macros compressed data is smaller then expected" @@ -678,10 +684,12 @@ impl TILSection { let inflate = flate2::read::ZlibDecoder::new(&mut compressed_input); let mut decompressed_input = inflate.take(len.into()); std::io::copy(&mut decompressed_input, output)?; + #[cfg(not(feature = "permissive"))] ensure!( decompressed_input.limit() == 0, "TypeBucket data is smaller then expected" ); + #[cfg(not(feature = "permissive"))] ensure!( compressed_input.limit() == 0, "TypeBucket compressed data is smaller then expected" diff --git a/src/til/struct.rs b/src/til/struct.rs index 1583d61..508f41e 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -99,7 +99,11 @@ impl StructRaw { let mut is_vft = false; let mut is_method = false; let mut is_bitset2 = false; - if let Some(TypeAttribute { tattr, extended }) = input.read_sdacl()? { + if let Some(TypeAttribute { + tattr, + extended: _extended, + }) = input.read_sdacl()? + { use crate::til::flag::tattr::*; use crate::til::flag::tattr_field::*; use crate::til::flag::tattr_udt::*; @@ -121,18 +125,20 @@ impl StructRaw { // TODO this value can't be right, it defines the alignment! is_bitset2 = align_raw & 0x4 != 0; - const ALL_FLAGS: u16 = MAX_DECL_ALIGN + const _ALL_FLAGS: u16 = MAX_DECL_ALIGN | TAUDT_MSSTRUCT | TAUDT_UNALIGNED | TAUDT_CPPOBJ | TAUDT_VFTABLE | TAFLD_METHOD; + #[cfg(not(feature = "permissive"))] ensure!( - tattr & !ALL_FLAGS == 0, + tattr & !_ALL_FLAGS == 0, "Invalid Struct taenum_bits {tattr:x}" ); + #[cfg(not(feature = "permissive"))] ensure!( - extended.is_none(), + _extended.is_none(), "Unable to parse extended attributes for struct" ); } @@ -223,7 +229,11 @@ impl StructMemberRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47825d if !is_bit_set || att.is_some() { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47825d - if let Some(TypeAttribute { tattr, extended }) = input.read_sdacl()? { + if let Some(TypeAttribute { + tattr, + extended: _extended, + }) = input.read_sdacl()? + { use crate::til::flag::tattr::*; use crate::til::flag::tattr_field::*; @@ -235,17 +245,19 @@ impl StructMemberRaw { is_vft = tattr & TAFLD_VFTABLE != 0; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 is_method = tattr & TAFLD_METHOD != 0; - const ALL_FLAGS: u16 = MAX_DECL_ALIGN + const _ALL_FLAGS: u16 = MAX_DECL_ALIGN | TAFLD_BASECLASS | TAFLD_UNALIGNED | TAFLD_VFTABLE | TAFLD_METHOD; + #[cfg(not(feature = "permissive"))] ensure!( - tattr & !ALL_FLAGS == 0, + tattr & !_ALL_FLAGS == 0, "Invalid Struct taenum_bits {tattr:x}" ); + #[cfg(not(feature = "permissive"))] ensure!( - extended.is_none(), + _extended.is_none(), "Unable to parse extended attributes for struct member" ); } diff --git a/src/til/union.rs b/src/til/union.rs index af42b60..68a1012 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -1,4 +1,4 @@ -use anyhow::{anyhow, ensure, Context}; +use anyhow::{anyhow, Context, Result}; use std::num::NonZeroU8; @@ -21,7 +21,7 @@ impl Union { til: &TILSectionHeader, value: UnionRaw, fields: &mut impl Iterator>>, - ) -> anyhow::Result { + ) -> Result { let members = value .members .into_iter() @@ -30,7 +30,7 @@ impl Union { let new_member = Type::new(til, member, &mut *fields)?; Ok((field_name, new_member)) }) - .collect::>()?; + .collect::>()?; Ok(Union { effective_alignment: value.effective_alignment, alignment: value.alignment, @@ -54,7 +54,7 @@ impl UnionRaw { pub fn read( input: &mut impl IdaGenericBufUnpack, header: &TILSectionHeader, - ) -> anyhow::Result { + ) -> Result { let Some(n) = input.read_dt_de()? else { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4803b4 // is ref @@ -73,27 +73,33 @@ impl UnionRaw { let mut alignment = None; let mut is_unaligned = false; - if let Some(TypeAttribute { tattr, extended }) = input.read_sdacl()? { + if let Some(TypeAttribute { + tattr, + extended: _extended, + }) = input.read_sdacl()? + { use crate::til::flag::tattr::*; use crate::til::flag::tattr_udt::*; alignment = NonZeroU8::new((tattr & MAX_DECL_ALIGN) as u8); is_unaligned = tattr & TAUDT_UNALIGNED != 0; - const ALL_FLAGS: u16 = MAX_DECL_ALIGN | TAUDT_UNALIGNED; - ensure!( - tattr & !ALL_FLAGS == 0, + const _ALL_FLAGS: u16 = MAX_DECL_ALIGN | TAUDT_UNALIGNED; + #[cfg(not(feature = "permissive"))] + anyhow::ensure!( + tattr & !_ALL_FLAGS == 0, "Invalid Union taenum_bits {tattr:x}" ); - ensure!( - extended.is_none(), + #[cfg(not(feature = "permissive"))] + anyhow::ensure!( + _extended.is_none(), "Unable to parse extended attributes for union" ); } let members = (0..mem_cnt) .map(|i| TypeRaw::read(&mut *input, header).with_context(|| format!("Member {i}"))) - .collect::>()?; + .collect::>()?; Ok(TypeVariantRaw::Union(Self { effective_alignment, alignment, From ce745027f0818ff7fb2ced484a9b6ec4a64f9b3a Mon Sep 17 00:00:00 2001 From: rbran Date: Thu, 9 Jan 2025 13:52:06 -0300 Subject: [PATCH 41/53] fix til enum ext att parsing --- src/til/enum.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/til/enum.rs b/src/til/enum.rs index 95c7c42..eb1e530 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -75,7 +75,7 @@ impl EnumRaw { if let Some(TypeAttribute { tattr, extended: _extended, - }) = input.read_sdacl()? + }) = input.read_tah()? { // TODO enum have an align field (MAX_DECL_ALIGN) in tattr? is_64 = tattr & TAENUM_64BIT != 0; From 7aae35600fb1fc3af381169a371995a727ca045f Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 10 Jan 2025 07:38:35 -0300 Subject: [PATCH 42/53] replace the permissive feature with the restrictive feature Tests usually use the --all-features to make more complete coverage. Because not having the "permissive" feature is more likelly to causes errors, having it replaced with "restrictive" feature create better tests. --- src/ida_reader.rs | 80 ++++++++++++++++++++++----------------------- src/lib.rs | 8 ++--- src/til.rs | 12 +++---- src/til/array.rs | 4 +-- src/til/bitfield.rs | 4 +-- src/til/enum.rs | 12 +++---- src/til/function.rs | 12 +++---- src/til/pointer.rs | 2 +- src/til/section.rs | 41 ++++++++++++----------- src/til/struct.rs | 8 ++--- src/til/union.rs | 4 +-- 11 files changed, 95 insertions(+), 92 deletions(-) diff --git a/src/ida_reader.rs b/src/ida_reader.rs index f314bed..0a605f5 100644 --- a/src/ida_reader.rs +++ b/src/ida_reader.rs @@ -43,11 +43,11 @@ pub trait IdaUnpack: IdaGenericUnpack { if self.is_64() { let start = self.unpack_dq()?; let len = self.unpack_dq()?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let end = start .checked_add(len) .ok_or_else(|| anyhow!("Function range overflows"))?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let end = start.saturating_add(len); Ok(start..end) } else { @@ -57,9 +57,9 @@ pub trait IdaUnpack: IdaGenericUnpack { let end = match start.checked_add(len.into()) { Some(0xFFFF_FFFF) => u64::MAX, Some(value) => value, - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] None => return Err(anyhow!("Function range overflows")), - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] None => u64::MAX, }; Ok(start..end) @@ -179,12 +179,12 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { // TODO check no more then 9 bytes are read loop { let Some(typ) = self.peek_u8()? else { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] return Err(anyhow!(std::io::Error::new( std::io::ErrorKind::UnexpectedEof, "Unexpected EoF on DA" ))); - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] return Ok((nelem, base)); }; if typ & 0x80 == 0 { @@ -202,12 +202,12 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { nelem = (z >> 4) & 7; loop { let Some(y) = self.peek_u8()? else { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] return Err(anyhow!(std::io::Error::new( std::io::ErrorKind::UnexpectedEof, "Unexpected EoF on DA" ))); - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] return Ok((nelem, base)); }; if (y & 0x80) == 0 { @@ -234,7 +234,7 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { let _ = buf.pop(); // remove the \x00 from the end } else { // found EOF, aka could not find the \x00 for the string end - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] return Err(anyhow!("Unexpected EoF on CStr")); } Ok(buf) @@ -267,7 +267,7 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { if (start_value >> bit) & 1 != 0 { let value = self.read_u8()?; // TODO is this an error or expect possible value? - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!(value != 0); acc |= (value as u64) << byte; } @@ -320,7 +320,7 @@ pub trait IdaGenericUnpack: Read { Ok(data[0]) } - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] fn read_u8_or_nothing(&mut self) -> Result> { let mut data = [0; 1]; let read = self.read_exact_or_nothing(&mut data)?; @@ -365,9 +365,9 @@ pub trait IdaGenericUnpack: Read { // NOTE: the original implementation never fails, if input hit EoF it a partial result or 0 /// Reads 1 to 3 bytes. fn unpack_dw(&mut self) -> Result { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let b1 = self.read_u8()?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let Some(b1) = self.read_u8_or_nothing()? else { return Ok(0); @@ -379,9 +379,9 @@ pub trait IdaGenericUnpack: Read { // 14 bits value // [10xx xxxx] xxxx xxxx 0x80..=0xBF => { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let lo = self.read_u8()?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let lo = self.read_u8_or_nothing()?.unwrap_or(0); Ok(u16::from_be_bytes([b1 & 0x3F, lo])) } @@ -390,10 +390,10 @@ pub trait IdaGenericUnpack: Read { 0xC0..=0xFF => { // NOTE first byte 6 bits seems to be ignored //ensure!(header != 0xC0 && header != 0xFF); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let (lo, hi) = (self.read_u8()?, self.read_u8()?); - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let (lo, hi) = ( self.read_u8_or_nothing()?.unwrap_or(0), self.read_u8_or_nothing()?.unwrap_or(0), @@ -408,9 +408,9 @@ pub trait IdaGenericUnpack: Read { // NOTE the orignal implementation never fails, if input hit EoF it a partial result or 0 /// Reads 1 to 5 bytes. fn unpack_dd(&mut self) -> Result { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let b1 = self.read_u8()?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let Some(b1) = self.read_u8_or_nothing()? else { return Ok(0); @@ -422,9 +422,9 @@ pub trait IdaGenericUnpack: Read { // 14 bits value // [10xx xxxx] xxxx xxxx 0x80..=0xBF => { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let lo = self.read_u8()?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let lo = self.read_u8_or_nothing()?.unwrap_or(0); Ok(u32::from_be_bytes([0, 0, b1 & 0x3F, lo])) } @@ -432,9 +432,9 @@ pub trait IdaGenericUnpack: Read { // [110x xxxx] xxxx xxxx xxxx xxxx xxxx xxxx 0xC0..=0xDF => { let mut bytes: [u8; 3] = [0; 3]; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] self.read_exact(&mut bytes)?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let _size = self.read_exact_or_nothing(&mut bytes)?; Ok(u32::from_be_bytes([ b1 & 0x1F, @@ -449,9 +449,9 @@ pub trait IdaGenericUnpack: Read { // NOTE first byte 5 bits seems to be ignored //ensure!(header != 0xE0 && header != 0xFF); let mut bytes: [u8; 4] = [0; 4]; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] self.read_exact(&mut bytes)?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let _size = self.read_exact_or_nothing(&mut bytes)?; Ok(u32::from_be_bytes(bytes)) } @@ -480,9 +480,9 @@ pub trait IdaGenericUnpack: Read { fn unpack_ds(&mut self) -> Result> { let len = self.unpack_dd()?; let mut result = vec![0; len.try_into()?]; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] self.read_exact(&mut result)?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let _size = self.read_exact_or_nothing(&mut result)?; Ok(result) } @@ -490,9 +490,9 @@ pub trait IdaGenericUnpack: Read { fn unpack_dt_bytes(&mut self) -> Result> { let buf_len = self.read_dt()?; let mut buf = vec![0; buf_len.into()]; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] self.read_exact(&mut buf)?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let _size = self.read_exact_or_nothing(&mut buf)?; Ok(buf) } @@ -505,9 +505,9 @@ pub trait IdaGenericUnpack: Read { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48cdb0 let mut acc: u32 = 0; for _ in 0..5 { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let b = self.read_u8()?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let Some(b) = self.read_u8_or_nothing()? else { return Ok(acc); @@ -528,17 +528,17 @@ pub trait IdaGenericUnpack: Read { fn read_dt(&mut self) -> Result { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48cd60 let value = match self.read_u8()? { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] 0 => return Err(anyhow!("DT can't have 0 value")), - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] 0 => return Ok(0), //SEG = 2 value @ 0x80.. => { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let inter = self.read_u8()?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let inter = self.read_u8_or_nothing()?.unwrap_or(0); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!(inter != 0, "DT can't have a following 0 value"); value as u16 & 0x7F | (inter as u16) << 7 } @@ -579,9 +579,9 @@ pub trait IdaGenericUnpack: Read { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x452830 fn read_type_attribute(&mut self) -> Result { use crate::til::flag::tattr_ext::*; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let byte0 = self.read_u8()?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let Some(byte0) = self.read_u8_or_nothing()? else { return Ok(TypeAttribute { @@ -598,9 +598,9 @@ pub trait IdaGenericUnpack: Read { let mut shift = 0; // TODO limit the loop to only 0..n loop { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let next_byte = self.read_u8()?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let Some(next_byte) = self.read_u8_or_nothing()? else { break; diff --git a/src/lib.rs b/src/lib.rs index 5c8f389..a2e18fb 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -303,7 +303,7 @@ impl IDBHeader { } let v1_raw: V1Raw = bincode::deserialize_from(input)?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] { ensure!(v1_raw._unk30_zeroed == 0, "unk30 not zeroed"); ensure!(v1_raw._id2_offset == 0, "id2 in V1 is not zeroed"); @@ -342,7 +342,7 @@ impl IDBHeader { let v4_raw: V4Raw = bincode::deserialize_from(input)?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] { ensure!(v4_raw._unk30_zeroed == 0, "unk30 not zeroed"); ensure!(v4_raw._id2_offset == 0, "id2 in V4 is not zeroed"); @@ -390,7 +390,7 @@ impl IDBHeader { u64::from_le(u64::from(header_raw.offsets[3]) << 32 | u64::from(header_raw.offsets[2])); // TODO Final checksum is always zero on v5? - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] { ensure!(v5_raw._unk4_zeroed == 0, "unk4 not zeroed"); ensure!(v5_raw._id2_offset_zeroed == 0, "id2 in V5 is not zeroed"); @@ -438,7 +438,7 @@ impl IDBHeader { let id1_offset = u64::from_le(u64::from(header_raw.offsets[3]) << 32 | u64::from(header_raw.offsets[2])); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] { ensure!(v6_raw._unk4_zeroed == [0; 4], "unk4 not zeroed"); ensure!(v6_raw._seg_offset_zeroed == 0, "seg in V6 is not zeroed"); diff --git a/src/til.rs b/src/til.rs index f8f2bf0..4696d9c 100644 --- a/src/til.rs +++ b/src/til.rs @@ -91,7 +91,7 @@ impl TILTypeInfo { .into_iter() .map(|field| if field.is_empty() { None } else { Some(field) }); let tinfo = Type::new(til, tinfo_raw, &mut fields_iter)?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( fields_iter.next().is_none(), "Extra fields found for til type \"{}\"", @@ -188,7 +188,7 @@ impl Type { // in continuations, the \x00 may be missing &[] => {} _rest => { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] return Err(anyhow!( "Extra {} bytes after reading TIL from ID0", _rest.len() @@ -200,7 +200,7 @@ impl Type { .into_iter() .map(|field| if field.is_empty() { None } else { Some(field) }); let result = Self::new(&header, type_raw, &mut fields_iter)?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( fields_iter.next().is_none(), "Extra fields found for id0 til" @@ -517,7 +517,7 @@ impl TILMacro { let have_param = flag & 0x100 != 0; let param_num = have_param.then_some((flag & 0xFF) as u8); if !have_param { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!(flag & 0xFF == 0, "Unknown/Invalid value for TILMacro flag"); } // TODO find the InnerRef for this @@ -551,14 +551,14 @@ impl TILMacro { (_, None) => {} // having params, where should not (None, Some(_max)) => { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] return Err(anyhow!( "Macro value have params but it is not declared in the flag", )) } // only using params that exist (Some(params), Some(max)) if max <= params => { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( max <= params, "Macro value have more params then declared in the flag" diff --git a/src/til/array.rs b/src/til/array.rs index a299f32..3d0e221 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -61,12 +61,12 @@ impl ArrayRaw { extended: _extended, }) => { let align = (tattr & MAX_DECL_ALIGN) as u8; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] anyhow::ensure!( tattr & !MAX_DECL_ALIGN == 0, "unknown TypeAttribute {tattr:x}" ); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] anyhow::ensure!( _extended.is_none(), "unknown TypeAttribute ext {_extended:x?}" diff --git a/src/til/bitfield.rs b/src/til/bitfield.rs index e1660ff..a289307 100644 --- a/src/til/bitfield.rs +++ b/src/til/bitfield.rs @@ -45,9 +45,9 @@ impl Bitfield { tattr: _tattr, extended: _extended, }) => { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] anyhow::ensure!(_tattr == 0, "Unknown TypeAttribute {_tattr:x}"); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] anyhow::ensure!( _extended.is_none(), "Unknown TypeAttribute ext {_extended:x?}" diff --git a/src/til/enum.rs b/src/til/enum.rs index eb1e530..4e7fd0c 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -81,17 +81,17 @@ impl EnumRaw { is_64 = tattr & TAENUM_64BIT != 0; is_signed = tattr & TAENUM_SIGNED != 0; is_unsigned = tattr & TAENUM_UNSIGNED != 0; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( tattr & !(TAENUM_64BIT | TAENUM_SIGNED | TAENUM_UNSIGNED) == 0, "Invalid Enum taenum_bits {tattr:x}" ); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( !(is_signed && is_unsigned), "Enum can't be signed and unsigned at the same time" ); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( _extended.is_none(), "Unable to parse extended attributes for Enum" @@ -101,7 +101,7 @@ impl EnumRaw { // all BTE bits are consumed let bte = input.read_u8()?; let storage_size_raw = bte & BTE_SIZE_MASK; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( bte & BTE_RESERVED == 0, "Enum BTE including the Always off sub-field" @@ -124,9 +124,9 @@ impl EnumRaw { // TODO enum size defaults to 4? let storage_size_final = storage_size.map(NonZeroU8::get).unwrap_or(4); let mask: u64 = if storage_size_final >= 16 { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] return Err(anyhow!("Bytes size is too big")); - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] u64::MAX } else { u64::MAX >> (u64::BITS - (storage_size_final as u32 * 8)) diff --git a/src/til/function.rs b/src/til/function.rs index a45b749..925b6b1 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -152,7 +152,7 @@ impl FunctionRaw { let is_high = flags_lower & BFA_HIGH != 0; let is_static = flags_lower & BFA_STATIC != 0; let is_virtual = flags_lower & BFA_VIRTUAL != 0; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!(flags_lower & !(BFA_NORET | BFA_PURE | BFA_HIGH | BFA_STATIC | BFA_VIRTUAL) == 0); // TODO find those flags @@ -163,7 +163,7 @@ impl FunctionRaw { let is_const = flags_upper & BFA_CONST != 0; let is_constructor = flags_upper & BFA_CONSTRUCTOR != 0; let is_destructor = flags_upper & BFA_DESTRUCTOR != 0; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!(flags_upper & !(BFA_CONST | BFA_CONSTRUCTOR | BFA_DESTRUCTOR) == 0); let ret = TypeRaw::read(&mut *input, header).context("Return Argument")?; @@ -277,9 +277,9 @@ impl ArgLoc { let sval = input.read_de()?; Ok(Self::Static(sval)) } - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ALOC_CUSTOM.. => Err(anyhow!("Custom implementation for ArgLoc")), - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] ALOC_CUSTOM.. => Ok(Self::None), } } @@ -521,11 +521,11 @@ fn read_cc_spoiled( } else { let size = (b >> 4) + 1; // TODO what if (b & 0xF) == 0? - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] let reg = (b & 0xF) .checked_sub(1) .ok_or_else(|| anyhow!("invalid spoiled reg value"))?; - #[cfg(feature = "permissive")] + #[cfg(not(feature = "restrictive"))] let reg = (b & 0xF).saturating_sub(1); spoiled.push((reg.into(), size)) } diff --git a/src/til/pointer.rs b/src/til/pointer.rs index 52ae45a..56d9a68 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -114,7 +114,7 @@ impl PointerRaw { let ta_lower = (tattr & MAX_DECL_ALIGN) as u8; let is_shifted = tattr & TAPTR_SHIFTED != 0; let ptr_type = tattr & TAPTR_RESTRICT; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] anyhow::ensure!( tattr & !(TAPTR_SHIFTED | TAPTR_RESTRICT | MAX_DECL_ALIGN) == 0, "Invalid Pointer taenum_bits {tattr:x}" diff --git a/src/til/section.rs b/src/til/section.rs index 342e508..4aa4d23 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -99,7 +99,7 @@ impl TILSection { match compress { IDBSectionCompression::None => Self::read_inner(input), IDBSectionCompression::Zlib => { - let mut input = BufReader::new(flate2::read::ZlibDecoder::new(input)); + let mut input = BufReader::new(flate2::bufread::ZlibDecoder::new(input)); Self::read_inner(&mut input) } } @@ -310,20 +310,23 @@ impl TILSection { } pub fn decompress( - input: &mut impl IdaGenericUnpack, + input: &mut impl IdaGenericBufUnpack, output: &mut impl Write, compress: IDBSectionCompression, ) -> Result<()> { match compress { IDBSectionCompression::Zlib => { - let mut input = flate2::read::ZlibDecoder::new(input); + let mut input = BufReader::new(flate2::bufread::ZlibDecoder::new(input)); Self::decompress_inner(&mut input, output) } IDBSectionCompression::None => Self::decompress_inner(input, output), } } - fn decompress_inner(input: &mut impl IdaGenericUnpack, output: &mut impl Write) -> Result<()> { + fn decompress_inner( + input: &mut impl IdaGenericBufUnpack, + output: &mut impl Write, + ) -> Result<()> { let mut header = Self::read_header(&mut *input)?; let og_flags = header.flags; // disable the zip flag @@ -385,7 +388,7 @@ impl TILSection { .flags .has_ordinal() .then(|| -> Result { - let result: u32 = bincode::deserialize_from(&mut *input)?; + let result = input.read_u32()?; bincode::serialize_into(&mut *output, &result)?; Ok(result) }) @@ -468,7 +471,7 @@ impl TILSection { pub struct TILSectionFlags(pub(crate) u16); impl TILSectionFlags { fn new(value: u32) -> Result { - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( value < (flag::til::TIL_SLD as u32) << 1, "Unknown flag values for TILSectionFlags" @@ -568,7 +571,7 @@ impl TILSection { } fn read_bucket_zip( - input: &mut impl IdaGenericUnpack, + input: &mut impl IdaGenericBufUnpack, header: &TILSectionHeader, next_ordinal: Option, ordinal_alias: Option<&[(u32, u32)]>, @@ -576,7 +579,7 @@ impl TILSection { let (ndefs, len, compressed_len) = Self::read_bucket_zip_header(&mut *input)?; // make sure the decompressor don't read out-of-bounds let mut compressed_input = input.take(compressed_len.into()); - let mut inflate = BufReader::new(flate2::read::ZlibDecoder::new(&mut compressed_input)); + let mut inflate = BufReader::new(flate2::bufread::ZlibDecoder::new(&mut compressed_input)); // make sure only the defined size is decompressed let type_info = Self::read_bucket_inner( &mut inflate, @@ -586,7 +589,7 @@ impl TILSection { next_ordinal, ordinal_alias, )?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( compressed_input.limit() == 0, "TypeBucket compressed data is smaller then expected" @@ -615,7 +618,7 @@ impl TILSection { let type_info = (0..ndefs) .map(|i| TILTypeInfo::read(&mut input, header, i == ndefs - 1)) .collect::>()?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( input.limit() == 0, "TypeBucket total data is smaller then expected" @@ -640,7 +643,7 @@ impl TILSection { let type_info = (0..ndefs) .map(|_| TILMacro::read(&mut input)) .collect::>()?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( input.limit() == 0, "TypeBucket macro total data is smaller then expected" @@ -648,23 +651,23 @@ impl TILSection { Ok(type_info) } - fn read_macros_zip(input: &mut impl IdaGenericUnpack) -> Result> { + fn read_macros_zip(input: &mut impl IdaGenericBufUnpack) -> Result> { let (ndefs, len, compressed_len) = Self::read_bucket_zip_header(&mut *input)?; // make sure the decompressor don't read out-of-bounds let mut compressed_input = input.take(compressed_len.into()); - let inflate = BufReader::new(flate2::read::ZlibDecoder::new(&mut compressed_input)); + let inflate = BufReader::new(flate2::bufread::ZlibDecoder::new(&mut compressed_input)); // make sure only the defined size is decompressed let mut decompressed_input = inflate.take(len.into()); let type_info = (0..ndefs.try_into().unwrap()) .map(|_| TILMacro::read(&mut decompressed_input)) .collect::, _>>()?; // make sure the input was fully consumed - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( decompressed_input.limit() == 0, "TypeBucket macros data is smaller then expected" ); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( compressed_input.limit() == 0, "TypeBucket macros compressed data is smaller then expected" @@ -674,22 +677,22 @@ impl TILSection { #[allow(dead_code)] fn decompress_bucket( - input: &mut impl IdaGenericUnpack, + input: &mut impl IdaGenericBufUnpack, output: &mut impl std::io::Write, ) -> Result<()> { let (ndefs, len, compressed_len) = Self::read_bucket_zip_header(&mut *input)?; bincode::serialize_into(&mut *output, &TILBucketRaw { len, ndefs })?; // write the decompressed data let mut compressed_input = input.take(compressed_len.into()); - let inflate = flate2::read::ZlibDecoder::new(&mut compressed_input); + let inflate = flate2::bufread::ZlibDecoder::new(&mut compressed_input); let mut decompressed_input = inflate.take(len.into()); std::io::copy(&mut decompressed_input, output)?; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( decompressed_input.limit() == 0, "TypeBucket data is smaller then expected" ); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( compressed_input.limit() == 0, "TypeBucket compressed data is smaller then expected" diff --git a/src/til/struct.rs b/src/til/struct.rs index 508f41e..50307a5 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -131,12 +131,12 @@ impl StructRaw { | TAUDT_CPPOBJ | TAUDT_VFTABLE | TAFLD_METHOD; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( tattr & !_ALL_FLAGS == 0, "Invalid Struct taenum_bits {tattr:x}" ); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( _extended.is_none(), "Unable to parse extended attributes for struct" @@ -250,12 +250,12 @@ impl StructMemberRaw { | TAFLD_UNALIGNED | TAFLD_VFTABLE | TAFLD_METHOD; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( tattr & !_ALL_FLAGS == 0, "Invalid Struct taenum_bits {tattr:x}" ); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] ensure!( _extended.is_none(), "Unable to parse extended attributes for struct member" diff --git a/src/til/union.rs b/src/til/union.rs index 68a1012..ffa9052 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -85,12 +85,12 @@ impl UnionRaw { is_unaligned = tattr & TAUDT_UNALIGNED != 0; const _ALL_FLAGS: u16 = MAX_DECL_ALIGN | TAUDT_UNALIGNED; - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] anyhow::ensure!( tattr & !_ALL_FLAGS == 0, "Invalid Union taenum_bits {tattr:x}" ); - #[cfg(not(feature = "permissive"))] + #[cfg(feature = "restrictive")] anyhow::ensure!( _extended.is_none(), "Unable to parse extended attributes for union" From 3220e3415f7494df2cd8b41e90201a704fa3ed69 Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 10 Jan 2025 08:24:02 -0300 Subject: [PATCH 43/53] fix id0 dirtree not hadling EoF correctly --- Cargo.toml | 2 +- src/id0/dirtree.rs | 20 +++++++++++++------- src/ida_reader.rs | 21 +++++++++++++++------ 3 files changed, 29 insertions(+), 14 deletions(-) diff --git a/Cargo.toml b/Cargo.toml index 3d2d581..fe1cb87 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -16,7 +16,7 @@ num_enum = "0.7.3" [features] default = [] -permissive = [] +restrictive = [] [[bin]] name = "idb-tools" diff --git a/src/id0/dirtree.rs b/src/id0/dirtree.rs index 287e0ed..174d88d 100644 --- a/src/id0/dirtree.rs +++ b/src/id0/dirtree.rs @@ -203,8 +203,7 @@ impl DirTreeEntryRaw { let mut entries = vec![]; for is_value in core::iter::successors(Some(false), |x| Some(!(*x))) { // TODO unpack_dw/u8? - // TODO diferenciate an error from EoF - let Ok(entries_len) = data.unpack_dd() else { + let Some(entries_len) = data.unpack_dd_or_eof()? else { break; }; parse_entries(&mut *data, &mut entries, entries_len, is_value)?; @@ -264,6 +263,7 @@ impl DirTreeEntryRaw { // this value had known values of 0 and 4, as long it's smaller then 0x80 there no // much of a problem, otherwise this could be a unpack_dw/unpack_dd let _unknown: u8 = bincode::deserialize_from(&mut *data)?; + #[cfg(feature = "restrictive")] ensure!(_unknown < 0x80); // TODO unpack_dw/u8? let entries_len = data.unpack_dd()?; @@ -280,11 +280,17 @@ impl DirTreeEntryRaw { // NOTE in case the folder have 0 elements, there will be a 0 value, but don't take that for granted for is_value in core::iter::successors(Some(false), |x| Some(!(*x))) { // TODO unpack_dw/u8? - let num = match data.unpack_dd() { - Ok(num) => num, - // this is an empty folder, so the last value is optional - Err(_) if entries_len == 0 => break, - Err(e) => return Err(e), + let Some(num) = data.unpack_dd_or_eof()? else { + if entries_len == 0 { + // this is an empty folder, so the last value is optional + break; + } else { + return Err(std::io::Error::new( + std::io::ErrorKind::UnexpectedEof, + "Unexpected EoF while reading dirtree entries", + ) + .into()); + } }; let num = usize::try_from(num).map_err(|_| anyhow!("Invalid number of entries"))?; ensure!( diff --git a/src/ida_reader.rs b/src/ida_reader.rs index 0a605f5..52b110c 100644 --- a/src/ida_reader.rs +++ b/src/ida_reader.rs @@ -251,6 +251,17 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { Ok(self.fill_buf()?.first().copied()) } + // InnerRef b47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x46b690 unpack_dd + // NOTE the orignal implementation never fails, if input hit EoF it a partial result or 0 + /// Reads 1 to 5 bytes. + fn unpack_dd_or_eof(&mut self) -> Result> { + let Some(b1) = self.peek_u8()? else { + return Ok(None); + }; + self.consume(1); + self.unpack_dd_from_byte(b1).map(Option::Some) + } + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48ce40 fn read_ext_att(&mut self) -> Result { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48cec0 @@ -408,13 +419,11 @@ pub trait IdaGenericUnpack: Read { // NOTE the orignal implementation never fails, if input hit EoF it a partial result or 0 /// Reads 1 to 5 bytes. fn unpack_dd(&mut self) -> Result { - #[cfg(feature = "restrictive")] let b1 = self.read_u8()?; - #[cfg(not(feature = "restrictive"))] - let Some(b1) = self.read_u8_or_nothing()? - else { - return Ok(0); - }; + self.unpack_dd_from_byte(b1) + } + + fn unpack_dd_from_byte(&mut self, b1: u8) -> Result { match b1 { // 7 bit value // [0xxx xxxx] From 67bb5fdf74e4cbf5782c0777eee3e353aa2d2bbd Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 10 Jan 2025 14:47:24 -0300 Subject: [PATCH 44/53] fix til type alignment --- src/til/array.rs | 51 +++++++++++++++++++++++++---------------------- src/til/struct.rs | 13 ++++++++++-- src/til/union.rs | 10 +++++++++- 3 files changed, 47 insertions(+), 27 deletions(-) diff --git a/src/til/array.rs b/src/til/array.rs index 3d0e221..2ed4262 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -6,7 +6,7 @@ use crate::til::{Type, TypeAttribute, TypeRaw}; #[derive(Clone, Debug)] pub struct Array { - pub align: Option, + pub alignment: Option, pub base: u8, pub nelem: Option, pub elem_type: Box, @@ -18,7 +18,7 @@ impl Array { fields: &mut impl Iterator>>, ) -> anyhow::Result { Ok(Self { - align: value.align, + alignment: value.alignment, base: value.base, nelem: value.nelem, elem_type: Type::new(til, *value.elem_type, fields).map(Box::new)?, @@ -28,7 +28,7 @@ impl Array { #[derive(Clone, Debug)] pub(crate) struct ArrayRaw { - pub align: Option, + pub alignment: Option, pub base: u8, pub nelem: Option, pub elem_type: Box, @@ -54,30 +54,33 @@ impl ArrayRaw { } }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48078e - let align = match input.read_tah()? { - None => None, - Some(TypeAttribute { - tattr, - extended: _extended, - }) => { - let align = (tattr & MAX_DECL_ALIGN) as u8; - #[cfg(feature = "restrictive")] - anyhow::ensure!( - tattr & !MAX_DECL_ALIGN == 0, - "unknown TypeAttribute {tattr:x}" - ); - #[cfg(feature = "restrictive")] - anyhow::ensure!( - _extended.is_none(), - "unknown TypeAttribute ext {_extended:x?}" - ); - NonZeroU8::new(align) - } - }; + let mut alignment = None; + if let Some(TypeAttribute { + tattr, + extended: _extended, + }) = input.read_tah()? + { + let alignment_raw = (tattr & MAX_DECL_ALIGN) as u8; + let _is_unknown_8 = alignment_raw & 0x8 != 0; + #[cfg(feature = "restrictive")] + anyhow::ensure!(!_is_unknown_8, "Unknown flat 8 set on Array"); + alignment = ((alignment_raw & 0x7) != 0) + .then(|| NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap()); + #[cfg(feature = "restrictive")] + anyhow::ensure!( + tattr & !MAX_DECL_ALIGN == 0, + "unknown TypeAttribute {tattr:x}" + ); + #[cfg(feature = "restrictive")] + anyhow::ensure!( + _extended.is_none(), + "unknown TypeAttribute ext {_extended:x?}" + ); + } let elem_type = TypeRaw::read(&mut *input, header)?; Ok(ArrayRaw { base, - align, + alignment, nelem: NonZeroU16::new(nelem), elem_type: Box::new(elem_type), }) diff --git a/src/til/struct.rs b/src/til/struct.rs index 50307a5..0fad21d 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -112,7 +112,8 @@ impl StructRaw { // TODO WHY? is_unknown_8 = align_raw & 0x8 != 0; - alignment = NonZeroU8::new(align_raw & 0x7); + alignment = (align_raw & 0x7 != 0) + .then(|| NonZeroU8::new(1 << ((align_raw & 0x7) - 1)).unwrap()); is_msstruct = tattr & TAUDT_MSSTRUCT != 0; is_unaligned = tattr & TAUDT_UNALIGNED != 0; @@ -174,6 +175,7 @@ pub struct StructMember { pub is_unaligned: bool, pub is_vft: bool, pub is_method: bool, + pub is_unknown_8: bool, } impl StructMember { @@ -192,6 +194,7 @@ impl StructMember { is_unaligned: m.is_unaligned, is_vft: m.is_vft, is_method: m.is_method, + is_unknown_8: m.is_unknown_8, }) } } @@ -204,6 +207,7 @@ pub(crate) struct StructMemberRaw { pub is_unaligned: bool, pub is_vft: bool, pub is_method: bool, + pub is_unknown_8: bool, } impl StructMemberRaw { @@ -225,6 +229,7 @@ impl StructMemberRaw { let mut is_unaligned = false; let mut is_vft = false; let mut is_method = false; + let mut is_unknown_8 = false; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47825d if !is_bit_set || att.is_some() { @@ -237,7 +242,10 @@ impl StructMemberRaw { use crate::til::flag::tattr::*; use crate::til::flag::tattr_field::*; - alignment = NonZeroU8::new((tattr & MAX_DECL_ALIGN) as u8); + let alignment_raw = (tattr & MAX_DECL_ALIGN) as u8; + is_unknown_8 = alignment_raw & 0x8 != 0; + alignment = ((alignment_raw & 0x7) != 0) + .then(|| NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap()); is_baseclass = tattr & TAFLD_BASECLASS != 0; is_unaligned = tattr & TAFLD_UNALIGNED != 0; let is_virtbase = tattr & TAFLD_VIRTBASE != 0; @@ -278,6 +286,7 @@ impl StructMemberRaw { is_unaligned, is_vft, is_method, + is_unknown_8, }) } diff --git a/src/til/union.rs b/src/til/union.rs index ffa9052..13bd82b 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -15,6 +15,7 @@ pub struct Union { pub members: Vec<(Option>, Type)>, pub is_unaligned: bool, + pub is_unknown_8: bool, } impl Union { pub(crate) fn new( @@ -36,6 +37,7 @@ impl Union { alignment: value.alignment, members, is_unaligned: value.is_unaligned, + is_unknown_8: value.is_unknown_8, }) } } @@ -48,6 +50,7 @@ pub(crate) struct UnionRaw { alignment: Option, members: Vec, is_unaligned: bool, + is_unknown_8: bool, } impl UnionRaw { @@ -73,6 +76,7 @@ impl UnionRaw { let mut alignment = None; let mut is_unaligned = false; + let mut is_unknown_8 = false; if let Some(TypeAttribute { tattr, extended: _extended, @@ -81,7 +85,10 @@ impl UnionRaw { use crate::til::flag::tattr::*; use crate::til::flag::tattr_udt::*; - alignment = NonZeroU8::new((tattr & MAX_DECL_ALIGN) as u8); + let alignment_raw = (tattr & MAX_DECL_ALIGN) as u8; + is_unknown_8 = alignment_raw & 0x8 != 0; + alignment = ((alignment_raw & 0x7) != 0) + .then(|| NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap()); is_unaligned = tattr & TAUDT_UNALIGNED != 0; const _ALL_FLAGS: u16 = MAX_DECL_ALIGN | TAUDT_UNALIGNED; @@ -105,6 +112,7 @@ impl UnionRaw { alignment, members, is_unaligned, + is_unknown_8, })) } } From ba9cf317151fd7d5ad229144202493400c412a8a Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 10 Jan 2025 15:02:03 -0300 Subject: [PATCH 45/53] improve til type size calculation --- src/til/size_calculator.rs | 24 +++++++++++++++--------- 1 file changed, 15 insertions(+), 9 deletions(-) diff --git a/src/til/size_calculator.rs b/src/til/size_calculator.rs index 1e4913a..a64f185 100644 --- a/src/til/size_calculator.rs +++ b/src/til/size_calculator.rs @@ -93,12 +93,13 @@ impl<'a> TILTypeSizeSolver<'a> { let align: u64 = 1; let mut members = &til_struct.members[..]; loop { - let first_member = members.first(); - let field_size = match first_member.map(|x| &x.member_type.type_variant) { + let Some(first_member) = members.first() else { // no more members - None => break, + break; + }; + let field_size = match &first_member.member_type.type_variant { // if bit-field, condensate one or more to create a byte-field - Some(TypeVariant::Bitfield(bitfield)) => { + TypeVariant::Bitfield(bitfield) => { members = &members[1..]; // NOTE it skips 0..n members condensate_bitfields_from_struct(*bitfield, &mut members) @@ -106,7 +107,7 @@ impl<'a> TILTypeSizeSolver<'a> { .into() } // get the inner type size - Some(_) => { + _ => { let first = &members[0]; members = &members[1..]; // next member @@ -114,10 +115,15 @@ impl<'a> TILTypeSizeSolver<'a> { } }; if !til_struct.is_unaligned { - let align = first_member - .and_then(|first| self.alignemnt(&first.member_type, field_size)) - .unwrap_or(align) - .max(1); + let align = match ( + first_member.alignment.map(|x| x.get().into()), + self.alignemnt(&first_member.member_type, field_size), + ) { + (Some(a), Some(b)) => a.max(b), + (Some(a), None) | (None, Some(a)) => a, + (None, None) => align, + }; + let align = align.max(1); let align_diff = sum % align; if align_diff != 0 { sum += align - align_diff; From ec1e84b9a31926a199aa3e4c6e7ba88568159c6e Mon Sep 17 00:00:00 2001 From: rbran Date: Fri, 10 Jan 2025 15:14:55 -0300 Subject: [PATCH 46/53] add tilib cppobj print --- src/tools/tilib.rs | 15 ++++++++++++++- 1 file changed, 14 insertions(+), 1 deletion(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 162a688..a06b801 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -711,8 +711,21 @@ fn print_til_type_struct( write!(fmt, " ")?; } } + let mut members = &til_struct.members[..]; + if til_struct.is_cppobj { + match members.first() { + Some(baseclass) if baseclass.is_baseclass /*&& x.name.is_none()*/=> { + members = &members[1..]; + write!(fmt, ": ")?; + print_til_type(fmt, section, None, &baseclass.member_type, true, true, false)?; + write!(fmt, " ")?; + } + _ => {}, + } + } + write!(fmt, "{{")?; - for member in &til_struct.members { + for member in members { let member_name = member.name.as_deref(); print_til_type_complex_member( fmt, From 8f8739a15bfd7a98e34a0562804e796690f228de Mon Sep 17 00:00:00 2001 From: rbran Date: Sat, 11 Jan 2025 13:08:27 -0300 Subject: [PATCH 47/53] change max line width to 80 chars To maximize compatibility with IBM putched cards, configure rust-fmt to only allow 80 characters each line. --- .rustfmt.toml | 1 + src/id0.rs | 46 +++++-- src/id0/address_info.rs | 22 +++- src/id0/btree.rs | 159 ++++++++++++++++------- src/id0/dirtree.rs | 59 ++++++--- src/id0/root_info.rs | 12 +- src/id0/segment.rs | 7 +- src/id1.rs | 108 +++++++++++----- src/ida_reader.rs | 15 ++- src/lib.rs | 114 +++++++++++----- src/nam.rs | 30 +++-- src/til.rs | 144 ++++++++++++++------- src/til/array.rs | 8 +- src/til/bitfield.rs | 10 +- src/til/flag.rs | 13 +- src/til/function.rs | 38 ++++-- src/til/pointer.rs | 11 +- src/til/section.rs | 92 +++++++++---- src/til/size_calculator.rs | 84 +++++++----- src/til/struct.rs | 49 +++++-- src/til/union.rs | 10 +- src/tools/decompress_til.rs | 12 +- src/tools/dump_addr_info.rs | 13 +- src/tools/dump_dirtree.rs | 5 +- src/tools/dump_dirtree_funcs.rs | 8 +- src/tools/dump_dirtree_types.rs | 16 ++- src/tools/dump_functions.rs | 4 +- src/tools/dump_segments.rs | 8 +- src/tools/dump_til.rs | 14 +- src/tools/tilib.rs | 221 ++++++++++++++++++++++++-------- src/tools/tools.rs | 22 +++- 31 files changed, 966 insertions(+), 389 deletions(-) create mode 100644 .rustfmt.toml diff --git a/.rustfmt.toml b/.rustfmt.toml new file mode 100644 index 0000000..df99c69 --- /dev/null +++ b/.rustfmt.toml @@ -0,0 +1 @@ +max_width = 80 diff --git a/src/id0.rs b/src/id0.rs index 4fdd705..10ab02f 100644 --- a/src/id0.rs +++ b/src/id0.rs @@ -26,7 +26,12 @@ pub struct IDBFileRegions { } impl IDBFileRegions { - fn read(_key: &[u8], data: &[u8], version: u16, is_64: bool) -> Result { + fn read( + _key: &[u8], + data: &[u8], + version: u16, + is_64: bool, + ) -> Result { let mut input = IdaUnpacker::new(data, is_64); // TODO detect versions with more accuracy let (start, end, eva) = match version { @@ -38,9 +43,9 @@ impl IDBFileRegions { } 700.. => { let start = input.unpack_usize()?; - let end = start - .checked_add(input.unpack_usize()?) - .ok_or_else(|| anyhow!("Overflow address in File Regions"))?; + let end = start.checked_add(input.unpack_usize()?).ok_or_else( + || anyhow!("Overflow address in File Regions"), + )?; let rva = input.unpack_usize()?; // TODO some may include an extra 0 byte at the end? if let Ok(_unknown) = input.unpack_usize() { @@ -73,9 +78,13 @@ impl<'a> FunctionsAndComments<'a> { ensure!(parse_maybe_cstr(value) == Some(&b"$ funcs"[..])); Ok(Self::Name) } - b'S' => IDBFunction::read(sub_key, value, is_64).map(Self::Function), + b'S' => { + IDBFunction::read(sub_key, value, is_64).map(Self::Function) + } // some kind of style setting, maybe setting font and background color - b'R' | b'C' if value.starts_with(&[4, 3, 2, 1]) => Ok(Self::Unknown { key, value }), + b'R' | b'C' if value.starts_with(&[4, 3, 2, 1]) => { + Ok(Self::Unknown { key, value }) + } b'C' => { let address = parse_number(sub_key, true, is_64) .ok_or_else(|| anyhow!("Invalid Comment address"))?; @@ -87,8 +96,10 @@ impl<'a> FunctionsAndComments<'a> { .ok_or_else(|| anyhow!("Invalid Comment string")) } b'R' => { - let address = parse_number(sub_key, true, is_64) - .ok_or_else(|| anyhow!("Invalid Repetable Comment address"))?; + let address = + parse_number(sub_key, true, is_64).ok_or_else(|| { + anyhow!("Invalid Repetable Comment address") + })?; parse_maybe_cstr(value) .map(|value| Self::Comment { address, @@ -145,7 +156,9 @@ impl IDBFunction { }) } - fn read_extra_regular(mut input: impl IdaUnpack) -> Result { + fn read_extra_regular( + mut input: impl IdaUnpack, + ) -> Result { // TODO Undertand the sub operation at InnerRef 5c1b89aa-5277-4c98-98f6-cec08e1946ec 0x28f98f let frame = input.unpack_usize_ext_max()?; let _unknown4 = input.unpack_dw()?; @@ -155,7 +168,10 @@ impl IDBFunction { Ok(IDBFunctionExtra::NonTail { frame }) } - fn read_extra_tail(mut input: impl IdaUnpack, address_start: u64) -> Result { + fn read_extra_tail( + mut input: impl IdaUnpack, + address_start: u64, + ) -> Result { // offset of the function owner in relation to the function start let owner_offset = input.unpack_usize()? as i64; let owner = match address_start.checked_add_signed(owner_offset) { @@ -240,12 +256,18 @@ pub struct EntryPoint { pub entry_type: Option, } -pub(crate) fn parse_number(data: &[u8], big_endian: bool, is_64: bool) -> Option { +pub(crate) fn parse_number( + data: &[u8], + big_endian: bool, + is_64: bool, +) -> Option { Some(match (data.len(), is_64, big_endian) { (8, true, true) => u64::from_be_bytes(data.try_into().unwrap()), (8, true, false) => u64::from_le_bytes(data.try_into().unwrap()), (4, false, true) => u32::from_be_bytes(data.try_into().unwrap()).into(), - (4, false, false) => u32::from_le_bytes(data.try_into().unwrap()).into(), + (4, false, false) => { + u32::from_le_bytes(data.try_into().unwrap()).into() + } _ => return None, }) } diff --git a/src/id0/address_info.rs b/src/id0/address_info.rs index 114181a..85b0878 100644 --- a/src/id0/address_info.rs +++ b/src/id0/address_info.rs @@ -32,13 +32,18 @@ impl<'a> Comments<'a> { } } -pub(crate) struct SectionAddressInfoIter<'a, I: Iterator>> { +pub(crate) struct SectionAddressInfoIter< + 'a, + I: Iterator>, +> { all_entries: &'a [ID0Entry], regions: I, current_region: AddressInfoIter<'a>, } -impl<'a, I: Iterator>> SectionAddressInfoIter<'a, I> { +impl<'a, I: Iterator>> + SectionAddressInfoIter<'a, I> +{ pub fn new(all_entries: &'a [ID0Entry], regions: I, is_64: bool) -> Self { Self { all_entries, @@ -64,8 +69,10 @@ impl<'a, I: Iterator> + 'a> Iterator Some(Err(err)) => return Some(Err(err)), }; let is_64 = self.current_region.is_64; - let start_key: Vec = crate::id0::key_from_address(region.start, is_64).collect(); - let end_key: Vec = crate::id0::key_from_address(region.end, is_64).collect(); + let start_key: Vec = + crate::id0::key_from_address(region.start, is_64).collect(); + let end_key: Vec = + crate::id0::key_from_address(region.end, is_64).collect(); let start = self .all_entries .binary_search_by_key(&&start_key[..], |b| &b.key[..]) @@ -105,9 +112,12 @@ impl<'a> Iterator for AddressInfoIter<'a> { // 1.. because it starts with '.' let addr_len = if self.is_64 { 8 } else { 4 }; let key_start = addr_len + 1; - let address = super::parse_number(¤t.key[1..key_start], true, self.is_64).unwrap(); + let address = + super::parse_number(¤t.key[1..key_start], true, self.is_64) + .unwrap(); let key = ¤t.key[key_start..]; - let Some((sub_type, id_value)) = id_subkey_from_idx(key, self.is_64) else { + let Some((sub_type, id_value)) = id_subkey_from_idx(key, self.is_64) + else { return Some(Err(anyhow!("Missing SubType"))); }; diff --git a/src/id0/btree.rs b/src/id0/btree.rs index d82f7ba..ba08385 100644 --- a/src/id0/btree.rs +++ b/src/id0/btree.rs @@ -42,7 +42,10 @@ struct ID0Header { } impl ID0Header { - pub(crate) fn read(input: &mut impl IdaGenericUnpack, buf: &mut Vec) -> Result { + pub(crate) fn read( + input: &mut impl IdaGenericUnpack, + buf: &mut Vec, + ) -> Result { buf.resize(64, 0); input.read_exact(buf)?; // TODO handle the 15 version of the header: @@ -57,7 +60,8 @@ impl ID0Header { // } let mut buf_current = &buf[..]; - let next_free_offset: u32 = bincode::deserialize_from(&mut buf_current)?; + let next_free_offset: u32 = + bincode::deserialize_from(&mut buf_current)?; let page_size: u16 = bincode::deserialize_from(&mut buf_current)?; let root_page: u32 = bincode::deserialize_from(&mut buf_current)?; let record_count: u32 = bincode::deserialize_from(&mut buf_current)?; @@ -141,7 +145,8 @@ impl ID0Section { }; buf.resize(header.page_size.into(), 0); - let mut pages = HashMap::with_capacity(header.page_count.try_into().unwrap()); + let mut pages = + HashMap::with_capacity(header.page_count.try_into().unwrap()); let mut pending_pages = vec![root_page]; loop { if pending_pages.is_empty() { @@ -154,8 +159,10 @@ impl ID0Section { } // read the full page ensure!((page_idx.get() as usize) < pages_in_section); - let page_offset = page_idx.get() as usize * header.page_size as usize; - let page_raw = &input[page_offset..page_offset + header.page_size as usize]; + let page_offset = + page_idx.get() as usize * header.page_size as usize; + let page_raw = + &input[page_offset..page_offset + header.page_size as usize]; let page = ID0Page::read(page_raw, &header)?; // put in the queue the pages that need parsing, AKA children of this page match &page { @@ -179,7 +186,8 @@ impl ID0Section { ensure!(pages.len() <= header.page_count.try_into().unwrap()); // put it all in order on the vector - let mut entries = Vec::with_capacity(header.record_count.try_into().unwrap()); + let mut entries = + Vec::with_capacity(header.record_count.try_into().unwrap()); Self::tree_to_vec(root_page, &mut pages, &mut entries); // make sure the vector is sorted @@ -223,7 +231,10 @@ impl ID0Section { self.entries.iter() } - pub(crate) fn binary_search(&self, key: impl AsRef<[u8]>) -> Result { + pub(crate) fn binary_search( + &self, + key: impl AsRef<[u8]>, + ) -> Result { let key = key.as_ref(); self.entries.binary_search_by_key(&key, |b| &b.key[..]) } @@ -255,7 +266,10 @@ impl ID0Section { self.entries[start..end].iter() } - pub fn sub_values(&self, key: impl AsRef<[u8]>) -> impl Iterator { + pub fn sub_values( + &self, + key: impl AsRef<[u8]>, + ) -> impl Iterator { let key = key.as_ref(); let start = self.binary_search(key).unwrap_or_else(|start| start); let end = self.binary_search_end(key).unwrap_or_else(|end| end); @@ -264,7 +278,9 @@ impl ID0Section { } /// read the `$ segs` entries of the database - pub fn segments(&self) -> Result> + '_> { + pub fn segments( + &self, + ) -> Result> + '_> { let entry = self .get("N$ segs") .ok_or_else(|| anyhow!("Unable to find entry segs"))?; @@ -275,9 +291,9 @@ impl ID0Section { .copied() .collect(); let names = self.segment_strings()?; - Ok(self - .sub_values(key) - .map(move |e| Segment::read(&e.value, self.is_64, names.as_ref(), self))) + Ok(self.sub_values(key).map(move |e| { + Segment::read(&e.value, self.is_64, names.as_ref(), self) + })) } /// read the `$ segstrings` entries of the database @@ -301,7 +317,8 @@ impl ID0Section { ensure!(start <= end); for i in start..end { let name = value_current.unpack_ds()?; - if let Some(_old) = entries.insert(i.try_into().unwrap(), name) { + if let Some(_old) = entries.insert(i.try_into().unwrap(), name) + { return Err(anyhow!("Duplicated id in segstrings {start}")); } } @@ -332,7 +349,8 @@ impl ID0Section { let name = self .get(key) .ok_or_else(|| anyhow!("Not found name for segment {idx}"))?; - parse_maybe_cstr(&name.value).ok_or_else(|| anyhow!("Invalid segment name {idx}")) + parse_maybe_cstr(&name.value) + .ok_or_else(|| anyhow!("Invalid segment name {idx}")) } /// read the `$ loader name` entries of the database @@ -353,7 +371,9 @@ impl ID0Section { } /// read the `Root Node` entries of the database - pub fn root_info(&self) -> Result>> { + pub fn root_info( + &self, + ) -> Result>> { let entry = self .get("NRoot Node") .ok_or_else(|| anyhow!("Unable to find entry Root Node"))?; @@ -371,7 +391,8 @@ impl ID0Section { match (sub_type, sub_key.len()) { (b'N', 1) => { ensure!( - parse_maybe_cstr(&entry.value) == Some(&b"Root Node"[..]), + parse_maybe_cstr(&entry.value) + == Some(&b"Root Node"[..]), "Invalid Root Node Name" ); return Ok(IDBRootInfo::RootNodeName); @@ -380,7 +401,8 @@ impl ID0Section { (b'V', 1) => return Ok(IDBRootInfo::InputFile(&entry.value)), _ => {} } - let Some(value) = parse_number(&sub_key[1..], true, self.is_64) else { + let Some(value) = parse_number(&sub_key[1..], true, self.is_64) + else { return Ok(IDBRootInfo::Unknown(entry)); }; match (sub_type, value as i64) { @@ -407,7 +429,9 @@ impl ID0Section { .map_err(|_| anyhow!("Value Md5 with invalid len")), (b'S', 1303) => parse_maybe_cstr(&entry.value) .and_then(|version| core::str::from_utf8(version).ok()) - .ok_or_else(|| anyhow!("Unable to parse VersionString string")) + .ok_or_else(|| { + anyhow!("Unable to parse VersionString string") + }) .map(IDBRootInfo::VersionString), (b'S', 1349) => entry .value @@ -441,10 +465,9 @@ impl ID0Section { .chain(sub_key.iter()) .copied() .collect(); - let description = self - .sub_values(key) - .next() - .ok_or_else(|| anyhow!("Unable to find id_params inside Root Node"))?; + let description = self.sub_values(key).next().ok_or_else(|| { + anyhow!("Unable to find id_params inside Root Node") + })?; IDBParam::read(&description.value, self.is_64) } @@ -498,7 +521,9 @@ impl ID0Section { // TODO implement $ hidden_ranges // TODO the address_info for 0xff00_00XX (or 0xff00_0000__0000_00XX for 64bits) seesm to be reserved, what happens if there is data at that page? - fn entry_points_raw(&self) -> Result>> { + fn entry_points_raw( + &self, + ) -> Result>> { let entry = self .get("N$ entry points") .ok_or_else(|| anyhow!("Unable to find functions"))?; @@ -516,7 +541,8 @@ impl ID0Section { /// read the `$ entry points` entries of the database pub fn entry_points(&self) -> Result> { - type RawEntryPoint<'a> = HashMap, Option<&'a str>, Option<&'a str>)>; + type RawEntryPoint<'a> = + HashMap, Option<&'a str>, Option<&'a str>)>; let mut entry_points: RawEntryPoint = HashMap::new(); for entry_point in self.entry_points_raw()? { match entry_point? { @@ -524,34 +550,49 @@ impl ID0Section { | EntryPointRaw::Name | EntryPointRaw::Ordinal { .. } => {} EntryPointRaw::Address { key, address } => { - if let Some(_old) = entry_points.entry(key).or_default().0.replace(address) { - return Err(anyhow!("Duplicated function address for {key}")); + if let Some(_old) = + entry_points.entry(key).or_default().0.replace(address) + { + return Err(anyhow!( + "Duplicated function address for {key}" + )); } } EntryPointRaw::ForwardedSymbol { key, symbol } => { - if let Some(_old) = entry_points.entry(key).or_default().1.replace(symbol) { - return Err(anyhow!("Duplicated function symbol for {key}")); + if let Some(_old) = + entry_points.entry(key).or_default().1.replace(symbol) + { + return Err(anyhow!( + "Duplicated function symbol for {key}" + )); } } EntryPointRaw::FunctionName { key, name } => { - if let Some(_old) = entry_points.entry(key).or_default().2.replace(name) { - return Err(anyhow!("Duplicated function name for {key}")); + if let Some(_old) = + entry_points.entry(key).or_default().2.replace(name) + { + return Err(anyhow!( + "Duplicated function name for {key}" + )); } } } } let mut result: Vec<_> = entry_points .into_iter() - .filter_map( - |(key, (address, symbol, name))| match (address, symbol, name) { + .filter_map(|(key, (address, symbol, name))| { + match (address, symbol, name) { // Function without name or address is possible, this is // probably some label that got deleted - (Some(_), _, None) | (None, _, Some(_)) | (None, _, None) => None, + (Some(_), _, None) + | (None, _, Some(_)) + | (None, _, None) => None, (Some(address), forwarded, Some(name)) => { - let entry = match self.find_entry_point_type(key, address) { - Ok(entry) => entry, - Err(error) => return Some(Err(error)), - }; + let entry = + match self.find_entry_point_type(key, address) { + Ok(entry) => entry, + Err(error) => return Some(Err(error)), + }; Some(Ok(EntryPoint { name: name.to_owned(), address, @@ -559,25 +600,37 @@ impl ID0Section { entry_type: entry, })) } - }, - ) + } + }) .collect::>()?; result.sort_by_key(|entry| entry.address); Ok(result) } - fn find_entry_point_type(&self, key: u64, address: u64) -> Result> { - if let Some(key_entry) = self.find_entry_point_type_value(key, 0x3000)? { + fn find_entry_point_type( + &self, + key: u64, + address: u64, + ) -> Result> { + if let Some(key_entry) = + self.find_entry_point_type_value(key, 0x3000)? + { return Ok(Some(key_entry)); } // TODO some times it uses the address as key, it's based on the version? - if let Some(key_entry) = self.find_entry_point_type_value(address, 0x3000)? { + if let Some(key_entry) = + self.find_entry_point_type_value(address, 0x3000)? + { return Ok(Some(key_entry)); } Ok(None) } - fn find_entry_point_type_value(&self, value: u64, key_find: u64) -> Result> { + fn find_entry_point_type_value( + &self, + value: u64, + key_find: u64, + ) -> Result> { let key: Vec = b"." .iter() .copied() @@ -594,7 +647,8 @@ impl ID0Section { let key = parse_number(key, true, self.is_64).unwrap(); // TODO handle other values for the key if key == key_find { - return til::Type::new_from_id0(&entry.value, vec![]).map(Option::Some); + return til::Type::new_from_id0(&entry.value, vec![]) + .map(Option::Some); } } Ok(None) @@ -631,7 +685,10 @@ impl ID0Section { } /// read the label set at address, if any - pub fn label_at(&self, id0_addr: impl Id0AddressKey) -> Result> { + pub fn label_at( + &self, + id0_addr: impl Id0AddressKey, + ) -> Result> { let key: Vec = key_from_address(id0_addr.as_u64(), self.is_64) .chain(Some(b'N')) .collect(); @@ -643,8 +700,8 @@ impl ID0Section { let key_len = key.len(); let key = &entry.key[key_len..]; ensure!(key.is_empty(), "Label ID0 entry with key"); - let label = - parse_maybe_cstr(&entry.value).ok_or_else(|| anyhow!("Label is not valid CStr"))?; + let label = parse_maybe_cstr(&entry.value) + .ok_or_else(|| anyhow!("Label is not valid CStr"))?; Ok(Some(label)) } @@ -863,7 +920,8 @@ impl ID0Page { let reused_key = last_key .get(..indent.into()) .ok_or_else(|| anyhow!("key indent is too small"))?; - let key: Vec = reused_key.iter().copied().chain(ext_key).collect(); + let key: Vec = + reused_key.iter().copied().chain(ext_key).collect(); // update the last key last_key.clear(); @@ -967,7 +1025,10 @@ impl ID0Page { } } -pub(crate) fn key_from_address(address: u64, is_64: bool) -> impl Iterator { +pub(crate) fn key_from_address( + address: u64, + is_64: bool, +) -> impl Iterator { b".".iter().copied().chain(if is_64 { address.to_be_bytes().to_vec() } else { diff --git a/src/id0/dirtree.rs b/src/id0/dirtree.rs index 174d88d..45f06bf 100644 --- a/src/id0/dirtree.rs +++ b/src/id0/dirtree.rs @@ -16,7 +16,10 @@ impl DirTreeRoot { Self::inner_visit_leafs(&mut handle, &self.entries); } - fn inner_visit_leafs(handle: &mut impl FnMut(&T), entries: &[DirTreeEntry]) { + fn inner_visit_leafs( + handle: &mut impl FnMut(&T), + entries: &[DirTreeEntry], + ) { for entry in entries { match entry { DirTreeEntry::Leaf(entry) => handle(entry), @@ -92,7 +95,10 @@ impl FromDirTreeNumber for Id0TilOrd { /// "\x2e\xff\x00\x00\x31\x53\x00\x02\x00\x00":"\x01\x62\x00\x00\x00\x0d\x90\x20\x80\x88\x08\x10\x80\xe9\x04\x80\xe7\x82\x36\x06\xff\xff\xff\xfc\xd0\xff\xff\xff\xff\x60\x50\x83\x0a\x00\x0d" /// ... /// "N$ dirtree/funcs":"\x31\x00\x00\xff" -pub(crate) fn parse_dirtree<'a, T, I>(entries_iter: I, is_64: bool) -> Result> +pub(crate) fn parse_dirtree<'a, T, I>( + entries_iter: I, + is_64: bool, +) -> Result> where T: FromDirTreeNumber, I: IntoIterator>, @@ -158,7 +164,11 @@ fn dirtree_directory_from_raw( .get_mut(&number) .ok_or_else(|| anyhow!("Invalid dirtree subfolder index"))? .take() - .ok_or_else(|| anyhow!("Same entry in dirtree is owned by multiple parents"))?; + .ok_or_else(|| { + anyhow!( + "Same entry in dirtree is owned by multiple parents" + ) + })?; let DirTreeEntryRaw { name, parent, @@ -183,7 +193,9 @@ struct DirTreeEntryRaw { } impl DirTreeEntryRaw { - fn from_raw(data: &mut I) -> Result { + fn from_raw( + data: &mut I, + ) -> Result { // TODO It's unclear if this value is a version, it seems so match data.read_u8()? { 0 => Self::from_raw_v0(data), @@ -192,7 +204,9 @@ impl DirTreeEntryRaw { } } - fn from_raw_v0(data: &mut I) -> Result { + fn from_raw_v0( + data: &mut I, + ) -> Result { // part 1: header let name = data.read_c_string_raw()?; // TODO maybe just a unpack_dd followed by \x00 @@ -255,7 +269,9 @@ impl DirTreeEntryRaw { /// | entries folder | \x00 | 0..0 are folders | /// | entries values | \x0c | from 0..12 are values | /// - fn from_raw_v1(data: &mut I) -> Result { + fn from_raw_v1( + data: &mut I, + ) -> Result { // part 1: header let name = data.read_c_string_raw()?; // TODO maybe just a unpack_dd followed by \x00 @@ -292,7 +308,8 @@ impl DirTreeEntryRaw { .into()); } }; - let num = usize::try_from(num).map_err(|_| anyhow!("Invalid number of entries"))?; + let num = usize::try_from(num) + .map_err(|_| anyhow!("Invalid number of entries"))?; ensure!( current_entry.len() >= num, "Invalid number of entry of type in dirtree" @@ -354,10 +371,12 @@ where // no more entries return Ok(None); }; - let (idx, sub_idx, entry) = - next_entry.map_err(|_| anyhow!("Missing expected dirtree entry"))?; + let (idx, sub_idx, entry) = next_entry + .map_err(|_| anyhow!("Missing expected dirtree entry"))?; if sub_idx != 0 { - return Err(anyhow!("Non zero sub_idx for dirtree folder entry")); + return Err(anyhow!( + "Non zero sub_idx for dirtree folder entry" + )); } (idx, sub_idx, entry) } @@ -386,12 +405,13 @@ where let Some(next_entry) = self.iter.next() else { return Ok(false); }; - let (next_idx, next_sub_idx, next_entry) = next_entry.map_err(|_| { - std::io::Error::new( - std::io::ErrorKind::UnexpectedEof, - "Missing part of dirtree entry", - ) - })?; + let (next_idx, next_sub_idx, next_entry) = next_entry + .map_err(|_| { + std::io::Error::new( + std::io::ErrorKind::UnexpectedEof, + "Missing part of dirtree entry", + ) + })?; if next_idx != *idx { // found a EoF for this entry if next_sub_idx != 0 { @@ -471,7 +491,9 @@ where fn fill_buf(&mut self) -> std::io::Result<&[u8]> { match self.state { DirtreeEntryState::Next { .. } => Ok(&[]), - DirtreeEntryState::Reading { entry, .. } if !entry.is_empty() => Ok(entry), + DirtreeEntryState::Reading { entry, .. } if !entry.is_empty() => { + Ok(entry) + } DirtreeEntryState::Reading { .. } => { if !self.next_sub_entry()? { return Ok(&[]); @@ -503,7 +525,8 @@ fn parse_entries( None => rel_value, // other are relative from the previous Some(last_value_old) => { - let mut value = last_value_old.wrapping_add_signed(rel_value as i64); + let mut value = + last_value_old.wrapping_add_signed(rel_value as i64); // NOTE that in 32bits it wrapps using the u32 limit if !data.is_64() { value &= u32::MAX as u64; diff --git a/src/id0/root_info.rs b/src/id0/root_info.rs index 08e40e8..9fcba13 100644 --- a/src/id0/root_info.rs +++ b/src/id0/root_info.rs @@ -211,8 +211,8 @@ impl IDBParam { let mut cpu = vec![0; cpu_len]; input.read_exact(&mut cpu)?; // remove any \x00 that marks the end of the str - let cpu_str_part = - parse_maybe_cstr(&cpu[..]).ok_or_else(|| anyhow!("Invalid RootInfo CStr cpu name"))?; + let cpu_str_part = parse_maybe_cstr(&cpu[..]) + .ok_or_else(|| anyhow!("Invalid RootInfo CStr cpu name"))?; cpu.truncate(cpu_str_part.len()); // TODO tight those ranges up @@ -223,7 +223,10 @@ impl IDBParam { match version { // TODO old version may contain extra data at the end with unknown purpose ..=699 => {} - 700.. => ensure!(input.inner().is_empty(), "Data left after the IDBParam",), + 700.. => ensure!( + input.inner().is_empty(), + "Data left after the IDBParam", + ), } Ok(param) } @@ -449,7 +452,8 @@ impl IDBParam { } let nametype = input.read_u8()?; - let nametype = NameType::new(nametype).ok_or_else(|| anyhow!("Invalid NameType value"))?; + let nametype = NameType::new(nametype) + .ok_or_else(|| anyhow!("Invalid NameType value"))?; let short_demnames = input.unpack_dd()?; let long_demnames = input.unpack_dd()?; let demnames = DemName::new(input.read_u8()?)?; diff --git a/src/id0/segment.rs b/src/id0/segment.rs index 056c402..edcd823 100644 --- a/src/id0/segment.rs +++ b/src/id0/segment.rs @@ -59,10 +59,9 @@ impl Segment { .map(|name_id| { // TODO I think this is dependent on the version, and not on availability if let Some(names) = names { - names - .get(&name_id) - .map(Vec::to_owned) - .ok_or_else(|| anyhow!("Not found name for segment {name_id}")) + names.get(&name_id).map(Vec::to_owned).ok_or_else(|| { + anyhow!("Not found name for segment {name_id}") + }) } else { // if there is no names, AKA `$ segstrings`, search for the key directly id0.name_by_index(name_id.get().into()).map(<[u8]>::to_vec) diff --git a/src/id1.rs b/src/id1.rs index 2ec9fe5..2693077 100644 --- a/src/id1.rs +++ b/src/id1.rs @@ -33,7 +33,10 @@ impl ID1Section { } } - fn read_inner(input: &mut impl IdaGenericUnpack, header: &IDBHeader) -> Result { + fn read_inner( + input: &mut impl IdaGenericUnpack, + header: &IDBHeader, + ) -> Result { // TODO pages are always 0x2000? const PAGE_SIZE: usize = 0x2000; let mut buf = vec![0; PAGE_SIZE]; @@ -41,8 +44,13 @@ impl ID1Section { let mut header_page = &buf[..]; let version = VaVersion::read(&mut header_page)?; let (npages, seglist_raw) = match version { - VaVersion::Va0 | VaVersion::Va1 | VaVersion::Va2 | VaVersion::Va3 | VaVersion::Va4 => { - let nsegments: u16 = bincode::deserialize_from(&mut header_page)?; + VaVersion::Va0 + | VaVersion::Va1 + | VaVersion::Va2 + | VaVersion::Va3 + | VaVersion::Va4 => { + let nsegments: u16 = + bincode::deserialize_from(&mut header_page)?; let npages: u16 = bincode::deserialize_from(&mut header_page)?; ensure!( npages > 0, @@ -52,13 +60,19 @@ impl ID1Section { // TODO the reference code uses the magic version, should it use // the version itself instead? - let seglist: Vec = if header.magic_version.is_64() { + let seglist: Vec = if header + .magic_version + .is_64() + { (0..nsegments) .map(|_| { - let start: u64 = bincode::deserialize_from(&mut header_page)?; - let end: u64 = bincode::deserialize_from(&mut header_page)?; + let start: u64 = + bincode::deserialize_from(&mut header_page)?; + let end: u64 = + bincode::deserialize_from(&mut header_page)?; ensure!(start <= end); - let offset: u64 = bincode::deserialize_from(&mut header_page)?; + let offset: u64 = + bincode::deserialize_from(&mut header_page)?; Ok(SegInfoVaNRaw { address: start..end, offset, @@ -68,10 +82,13 @@ impl ID1Section { } else { (0..nsegments) .map(|_| { - let start: u32 = bincode::deserialize_from(&mut header_page)?; - let end: u32 = bincode::deserialize_from(&mut header_page)?; + let start: u32 = + bincode::deserialize_from(&mut header_page)?; + let end: u32 = + bincode::deserialize_from(&mut header_page)?; ensure!(start <= end); - let offset: u32 = bincode::deserialize_from(&mut header_page)?; + let offset: u32 = + bincode::deserialize_from(&mut header_page)?; Ok(SegInfoVaNRaw { address: start.into()..end.into(), offset: offset.into(), @@ -82,10 +99,13 @@ impl ID1Section { (u32::from(npages), SegInfoRaw::VaN(seglist)) } VaVersion::VaX => { - let unknown_always3: u32 = bincode::deserialize_from(&mut header_page)?; + let unknown_always3: u32 = + bincode::deserialize_from(&mut header_page)?; ensure!(unknown_always3 == 3); - let nsegments: u32 = bincode::deserialize_from(&mut header_page)?; - let unknown_always2048: u32 = bincode::deserialize_from(&mut header_page)?; + let nsegments: u32 = + bincode::deserialize_from(&mut header_page)?; + let unknown_always2048: u32 = + bincode::deserialize_from(&mut header_page)?; ensure!(unknown_always2048 == 2048); let npages: u32 = bincode::deserialize_from(&mut header_page)?; @@ -95,8 +115,12 @@ impl ID1Section { .map(|_| { let (start, end) = match header.magic_version { crate::IDBMagic::IDA0 | crate::IDBMagic::IDA1 => { - let startea: u32 = bincode::deserialize_from(&mut header_page)?; - let endea: u32 = bincode::deserialize_from(&mut header_page)?; + let startea: u32 = bincode::deserialize_from( + &mut header_page, + )?; + let endea: u32 = bincode::deserialize_from( + &mut header_page, + )?; (startea.into(), endea.into()) } crate::IDBMagic::IDA2 => ( @@ -116,7 +140,9 @@ impl ID1Section { // sort segments by address let mut overlay_check = match &seglist_raw { - SegInfoRaw::VaN(segs) => segs.iter().map(|s| s.address.clone()).collect(), + SegInfoRaw::VaN(segs) => { + segs.iter().map(|s| s.address.clone()).collect() + } SegInfoRaw::VaX(segs) => segs.clone(), }; overlay_check.sort_unstable_by_key(|s| s.start); @@ -129,8 +155,10 @@ impl ID1Section { ensure!(!overlap); // make sure the data fits the available pages - let required_size: u64 = overlay_check.iter().map(|s| (s.end - s.start) * 4).sum(); - let required_pages = required_size.div_ceil(u64::try_from(PAGE_SIZE).unwrap()); + let required_size: u64 = + overlay_check.iter().map(|s| (s.end - s.start) * 4).sum(); + let required_pages = + required_size.div_ceil(u64::try_from(PAGE_SIZE).unwrap()); // TODO if the extra data at the end of the section is identified, review replacing <= with == // -1 because the first page is always the header ensure!(required_pages <= u64::from(npages - 1)); @@ -145,12 +173,17 @@ impl ID1Section { .map(|seg| { // skip any gaps match seg.offset.cmp(¤t_offset) { - std::cmp::Ordering::Less => return Err(anyhow!("invalid offset")), + std::cmp::Ordering::Less => { + return Err(anyhow!("invalid offset")) + } std::cmp::Ordering::Greater => { // TODO can be any deleted sector contains randon data? // skip intermidiate bytes, also ensuring they are all zeros ensure_all_bytes_are_zero( - std::io::Read::take(&mut *input, seg.offset - current_offset), + std::io::Read::take( + &mut *input, + seg.offset - current_offset, + ), &mut buf, )?; current_offset = seg.offset; @@ -158,7 +191,8 @@ impl ID1Section { std::cmp::Ordering::Equal => {} } let len = seg.address.end - seg.address.start; - let (data, _flags) = split_flags_data(&mut *input, len)?; + let (data, _flags) = + split_flags_data(&mut *input, len)?; current_offset += len * 4; Ok(SegInfo { offset: seg.address.start, @@ -172,8 +206,10 @@ impl ID1Section { // the data for the segments are stored sequentialy in disk segs.into_iter() .map(|address| { - let (data, _flags) = - split_flags_data(&mut *input, address.end - address.start)?; + let (data, _flags) = split_flags_data( + &mut *input, + address.end - address.start, + )?; Ok(SegInfo { offset: address.start, data, @@ -206,7 +242,10 @@ struct SegInfoVaNRaw { offset: u64, } -fn ensure_all_bytes_are_zero(mut input: impl IdaGenericUnpack, buf: &mut [u8]) -> Result<()> { +fn ensure_all_bytes_are_zero( + mut input: impl IdaGenericUnpack, + buf: &mut [u8], +) -> Result<()> { loop { match input.read(buf) { // found EoF @@ -214,14 +253,18 @@ fn ensure_all_bytes_are_zero(mut input: impl IdaGenericUnpack, buf: &mut [u8]) - // read something Ok(n) => ensure!(&buf[..n].iter().all(|b| *b == 0)), // ignore interrupts - Err(ref e) if matches!(e.kind(), std::io::ErrorKind::Interrupted) => {} + Err(ref e) + if matches!(e.kind(), std::io::ErrorKind::Interrupted) => {} Err(e) => return Err(e.into()), }; } Ok(()) } -fn ignore_bytes(mut input: impl IdaGenericUnpack, buf: &mut [u8]) -> Result<()> { +fn ignore_bytes( + mut input: impl IdaGenericUnpack, + buf: &mut [u8], +) -> Result<()> { loop { match input.read(buf) { // found EoF @@ -229,19 +272,26 @@ fn ignore_bytes(mut input: impl IdaGenericUnpack, buf: &mut [u8]) -> Result<()> // read something Ok(_n) => {} // ignore interrupts - Err(ref e) if matches!(e.kind(), std::io::ErrorKind::Interrupted) => {} + Err(ref e) + if matches!(e.kind(), std::io::ErrorKind::Interrupted) => {} Err(e) => return Err(e.into()), }; } Ok(()) } -fn split_flags_data(mut input: impl IdaGenericUnpack, len: u64) -> Result<(Vec, Vec)> { +fn split_flags_data( + mut input: impl IdaGenericUnpack, + len: u64, +) -> Result<(Vec, Vec)> { let len = usize::try_from(len).unwrap(); let mut flags = vec![0u32; len]; // SAFETY: don't worry &mut[u32] is compatible with &mut[u8] with len * 4 input.read_exact(unsafe { - &mut *core::slice::from_raw_parts_mut(flags.as_mut_ptr() as *mut u8, len * 4) + &mut *core::slice::from_raw_parts_mut( + flags.as_mut_ptr() as *mut u8, + len * 4, + ) })?; // extract the bytes into other vector and leave the flags there let data = flags diff --git a/src/ida_reader.rs b/src/ida_reader.rs index 52b110c..71d553e 100644 --- a/src/ida_reader.rs +++ b/src/ida_reader.rs @@ -93,7 +93,10 @@ impl Read for IdaUnpacker { self.input.read(buf) } - fn read_vectored(&mut self, bufs: &mut [std::io::IoSliceMut<'_>]) -> std::io::Result { + fn read_vectored( + &mut self, + bufs: &mut [std::io::IoSliceMut<'_>], + ) -> std::io::Result { self.input.read_vectored(bufs) } @@ -119,7 +122,11 @@ impl BufRead for IdaUnpacker { self.input.consume(amt); } - fn read_until(&mut self, byte: u8, buf: &mut Vec) -> std::io::Result { + fn read_until( + &mut self, + byte: u8, + buf: &mut Vec, + ) -> std::io::Result { self.input.read_until(byte, buf) } @@ -148,7 +155,9 @@ pub trait IdaGenericBufUnpack: IdaGenericUnpack + BufRead { // skip the ordinal number match (format, (flags >> 31) != 0) { // formats below 0x12 doesn't have 64 bits ord - (0..=0x11, _) | (_, false) => data.extend(self.read_u32()?.to_le_bytes()), + (0..=0x11, _) | (_, false) => { + data.extend(self.read_u32()?.to_le_bytes()) + } (_, true) => data.extend(self.read_u64()?.to_le_bytes()), } diff --git a/src/lib.rs b/src/lib.rs index a2e18fb..cc92987 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -81,15 +81,30 @@ impl IDBParser { } pub fn read_id0_section(&mut self, id0: ID0Offset) -> Result { - read_section(&mut self.input, &self.header, id0.0.get(), ID0Section::read) + read_section( + &mut self.input, + &self.header, + id0.0.get(), + ID0Section::read, + ) } pub fn read_id1_section(&mut self, id1: ID1Offset) -> Result { - read_section(&mut self.input, &self.header, id1.0.get(), ID1Section::read) + read_section( + &mut self.input, + &self.header, + id1.0.get(), + ID1Section::read, + ) } pub fn read_nam_section(&mut self, nam: NamOffset) -> Result { - read_section(&mut self.input, &self.header, nam.0.get(), NamSection::read) + read_section( + &mut self.input, + &self.header, + nam.0.get(), + NamSection::read, + ) } pub fn read_til_section(&mut self, til: TILOffset) -> Result { @@ -107,9 +122,11 @@ impl IDBParser { output: &mut impl std::io::Write, ) -> Result<()> { self.input.seek(SeekFrom::Start(offset.idb_offset()))?; - let section_header = IDBSectionHeader::read(&self.header, &mut self.input)?; + let section_header = + IDBSectionHeader::read(&self.header, &mut self.input)?; // makes sure the reader doesn't go out-of-bounds - let mut input = std::io::Read::take(&mut self.input, section_header.len); + let mut input = + std::io::Read::take(&mut self.input, section_header.len); match section_header.compress { IDBSectionCompression::Zlib => { let mut input = flate2::bufread::ZlibDecoder::new(input); @@ -128,9 +145,11 @@ impl IDBParser { output: &mut impl std::io::Write, ) -> Result<()> { self.input.seek(SeekFrom::Start(til.0.get()))?; - let section_header = IDBSectionHeader::read(&self.header, &mut self.input)?; + let section_header = + IDBSectionHeader::read(&self.header, &mut self.input)?; // makes sure the reader doesn't go out-of-bounds - let mut input = std::io::Read::take(&mut self.input, section_header.len); + let mut input = + std::io::Read::take(&mut self.input, section_header.len); TILSection::decompress(&mut input, output, section_header.compress) } } @@ -143,7 +162,11 @@ fn read_section<'a, I, T, F>( ) -> Result where I: IdbReader, - F: FnMut(&mut std::io::Take<&'a mut I>, &IDBHeader, IDBSectionCompression) -> Result, + F: FnMut( + &mut std::io::Take<&'a mut I>, + &IDBHeader, + IDBSectionCompression, + ) -> Result, { input.seek(SeekFrom::Start(offset))?; let section_header = IDBSectionHeader::read(header, &mut *input)?; @@ -384,10 +407,14 @@ impl IDBHeader { _unk0_v7c: u32, } let v5_raw: V5Raw = bincode::deserialize_from(input)?; - let id0_offset = - u64::from_le(u64::from(header_raw.offsets[1]) << 32 | u64::from(header_raw.offsets[0])); - let id1_offset = - u64::from_le(u64::from(header_raw.offsets[3]) << 32 | u64::from(header_raw.offsets[2])); + let id0_offset = u64::from_le( + u64::from(header_raw.offsets[1]) << 32 + | u64::from(header_raw.offsets[0]), + ); + let id1_offset = u64::from_le( + u64::from(header_raw.offsets[3]) << 32 + | u64::from(header_raw.offsets[2]), + ); // TODO Final checksum is always zero on v5? #[cfg(feature = "restrictive")] @@ -433,10 +460,14 @@ impl IDBHeader { _unk0_v7c: u32, } let v6_raw: V6Raw = bincode::deserialize_from(input)?; - let id0_offset = - u64::from_le(u64::from(header_raw.offsets[1]) << 32 | u64::from(header_raw.offsets[0])); - let id1_offset = - u64::from_le(u64::from(header_raw.offsets[3]) << 32 | u64::from(header_raw.offsets[2])); + let id0_offset = u64::from_le( + u64::from(header_raw.offsets[1]) << 32 + | u64::from(header_raw.offsets[0]), + ); + let id1_offset = u64::from_le( + u64::from(header_raw.offsets[3]) << 32 + | u64::from(header_raw.offsets[2]), + ); #[cfg(feature = "restrictive")] { @@ -465,7 +496,10 @@ impl IDBHeader { } impl IDBSectionHeader { - pub fn read(header: &IDBHeader, input: impl IdaGenericUnpack) -> Result { + pub fn read( + header: &IDBHeader, + input: impl IdaGenericUnpack, + ) -> Result { match header.version { IDBVersion::V1 | IDBVersion::V4 => { #[derive(Debug, Deserialize)] @@ -527,7 +561,10 @@ impl VaVersion { } } -fn write_string_len_u8(mut output: O, value: &[u8]) -> Result<()> { +fn write_string_len_u8( + mut output: O, + value: &[u8], +) -> Result<()> { output.write_all(&[u8::try_from(value.len()).unwrap()])?; Ok(output.write_all(value)?) } @@ -548,8 +585,8 @@ mod test { 0xaf, 0x81, 0x42, 0x01, 0x53, // TODO 0x01, // void ret 0x03, //n args - 0x3d, 0x08, 0x48, 0x4d, 0x4f, 0x44, 0x55, 0x4c, 0x45, 0x3d, 0x06, 0x44, 0x57, 0x4f, - 0x52, 0x44, 0x00, + 0x3d, 0x08, 0x48, 0x4d, 0x4f, 0x44, 0x55, 0x4c, 0x45, 0x3d, 0x06, + 0x44, 0x57, 0x4f, 0x52, 0x44, 0x00, ]; let _til = til::Type::new_from_id0(&function, vec![]).unwrap(); } @@ -608,13 +645,13 @@ mod test { 0x0a, // arg1 type pointer 0xfe, 0x10, // TypeAttribute val 0x02, // dt len 1 - 0x0d, 0x5f, 0x5f, 0x6f, 0x72, 0x67, 0x5f, 0x61, 0x72, 0x72, 0x64, 0x69, - 0x6d, // TODO some _string: "__org_arrdim" + 0x0d, 0x5f, 0x5f, 0x6f, 0x72, 0x67, 0x5f, 0x61, 0x72, 0x72, 0x64, + 0x69, 0x6d, // TODO some _string: "__org_arrdim" 0x03, 0xac, 0x01, // TODO _other_thing 0x0d, // arg1 pointer type struct 0x01, // struct ref - 0x0e, 0x5f, 0x5f, 0x6a, 0x6d, 0x70, 0x5f, 0x62, 0x75, 0x66, 0x5f, 0x74, 0x61, - 0x67, // "__jmp_buf_tag" + 0x0e, 0x5f, 0x5f, 0x6a, 0x6d, 0x70, 0x5f, 0x62, 0x75, 0x66, 0x5f, + 0x74, 0x61, 0x67, // "__jmp_buf_tag" 0x00, // end of type ]; let _til = til::Type::new_from_id0(&function, vec![]).unwrap(); @@ -648,14 +685,15 @@ mod test { // arg4 ... 0x0a, // pointer 0x7d, // const typedef - 0x08, 0x41, 0x45, 0x53, 0x5f, 0x4b, 0x45, 0x59, // ordinal "AES_KEY" + 0x08, 0x41, 0x45, 0x53, 0x5f, 0x4b, 0x45, + 0x59, // ordinal "AES_KEY" // arg5 0xff, 0x48, // some flag in function arg 0x0a, // pointer 0xfe, 0x10, // TypeAttribute val 0x02, // TypeAttribute loop once - 0x0d, 0x5f, 0x5f, 0x6f, 0x72, 0x67, 0x5f, 0x61, 0x72, 0x72, 0x64, 0x69, - 0x6d, // string "__org_arrdim" + 0x0d, 0x5f, 0x5f, 0x6f, 0x72, 0x67, 0x5f, 0x61, 0x72, 0x72, 0x64, + 0x69, 0x6d, // string "__org_arrdim" 0x03, 0xac, 0x10, // ???? some other TypeAttribute field 0x22, // type unsigned __int8 // arg6 @@ -663,8 +701,8 @@ mod test { 0x0a, // pointer 0xfe, 0x10, // TypeAttribute val 0x02, // TypeAttribute loop once - 0x0d, 0x5f, 0x5f, 0x6f, 0x72, 0x67, 0x5f, 0x61, 0x72, 0x72, 0x64, 0x69, - 0x6d, // string "__org_arrdim" + 0x0d, 0x5f, 0x5f, 0x6f, 0x72, 0x67, 0x5f, 0x61, 0x72, 0x72, 0x64, + 0x69, 0x6d, // string "__org_arrdim" 0x03, 0xac, 0x10, // ???? some other TypeAttribute field 0x22, // type unsigned __int8 // arg7 ... @@ -748,7 +786,11 @@ mod test { #[test] fn parse_idbs() { - let files = find_all("resources/idbs".as_ref(), &["idb".as_ref(), "i64".as_ref()]).unwrap(); + let files = find_all( + "resources/idbs".as_ref(), + &["idb".as_ref(), "i64".as_ref()], + ) + .unwrap(); for filename in files { parse_idb(filename) } @@ -781,7 +823,8 @@ mod test { }; let _: Vec<_> = id0.segments().unwrap().map(Result::unwrap).collect(); - let _: Vec<_> = id0.loader_name().unwrap().map(Result::unwrap).collect(); + let _: Vec<_> = + id0.loader_name().unwrap().map(Result::unwrap).collect(); let _: Vec<_> = id0.root_info().unwrap().map(Result::unwrap).collect(); let _: Vec<_> = id0 .file_regions(version) @@ -822,7 +865,8 @@ mod test { #[test] fn parse_tils() { - let files = find_all("resources/tils".as_ref(), &["til".as_ref()]).unwrap(); + let files = + find_all("resources/tils".as_ref(), &["til".as_ref()]).unwrap(); let _results = files .into_iter() .map(|file| { @@ -845,7 +889,11 @@ mod test { } fn find_all(path: &Path, exts: &[&OsStr]) -> Result> { - fn inner_find_all(path: &Path, exts: &[&OsStr], buf: &mut Vec) -> Result<()> { + fn inner_find_all( + path: &Path, + exts: &[&OsStr], + buf: &mut Vec, + ) -> Result<()> { for entry in std::fs::read_dir(path)?.map(Result::unwrap) { let entry_type = entry.metadata()?.file_type(); if entry_type.is_dir() { diff --git a/src/nam.rs b/src/nam.rs index 83d226d..6f11574 100644 --- a/src/nam.rs +++ b/src/nam.rs @@ -38,13 +38,18 @@ impl NamSection { let version = VaVersion::read(&mut header_page)?; let (npages, nnames, pagesize) = match version { - VaVersion::Va0 | VaVersion::Va1 | VaVersion::Va2 | VaVersion::Va3 | VaVersion::Va4 => { + VaVersion::Va0 + | VaVersion::Va1 + | VaVersion::Va2 + | VaVersion::Va3 + | VaVersion::Va4 => { let always1: u16 = bincode::deserialize_from(&mut header_page)?; ensure!(always1 == 1); let npages: u64 = if header.magic_version.is_64() { bincode::deserialize_from(&mut header_page)? } else { - bincode::deserialize_from::<_, u32>(&mut header_page)?.into() + bincode::deserialize_from::<_, u32>(&mut header_page)? + .into() }; let always0: u16 = bincode::deserialize_from(&mut header_page)?; ensure!(always0 == 0); @@ -52,24 +57,29 @@ impl NamSection { // TODO nnames / 2? Why? bincode::deserialize_from::<_, u64>(&mut header_page)? / 2 } else { - bincode::deserialize_from::<_, u32>(&mut header_page)?.into() + bincode::deserialize_from::<_, u32>(&mut header_page)? + .into() }; - let pagesize: u32 = bincode::deserialize_from(&mut header_page)?; + let pagesize: u32 = + bincode::deserialize_from(&mut header_page)?; ensure!(pagesize >= 64); (npages, nnames, pagesize) } VaVersion::VaX => { let always3: u32 = bincode::deserialize_from(&mut header_page)?; ensure!(always3 == 3); - let one_or_zero: u32 = bincode::deserialize_from(&mut header_page)?; + let one_or_zero: u32 = + bincode::deserialize_from(&mut header_page)?; ensure!([0, 1].contains(&one_or_zero)); // TODO always2048 have some relation to pagesize? - let always2048: u32 = bincode::deserialize_from(&mut header_page)?; + let always2048: u32 = + bincode::deserialize_from(&mut header_page)?; ensure!(always2048 == 2048); let npages: u64 = if header.magic_version.is_64() { bincode::deserialize_from(&mut header_page)? } else { - bincode::deserialize_from::<_, u32>(&mut header_page)?.into() + bincode::deserialize_from::<_, u32>(&mut header_page)? + .into() }; let always0: u32 = bincode::deserialize_from(&mut header_page)?; ensure!(always0 == 0); @@ -77,7 +87,8 @@ impl NamSection { // TODO nnames / 2? Why? bincode::deserialize_from::<_, u64>(&mut header_page)? / 2 } else { - bincode::deserialize_from::<_, u32>(&mut header_page)?.into() + bincode::deserialize_from::<_, u32>(&mut header_page)? + .into() }; (npages, nnames, DEFAULT_PAGE_SIZE.try_into().unwrap()) } @@ -115,7 +126,8 @@ impl NamSection { let name = if header.magic_version.is_64() { bincode::deserialize_from::<_, u64>(&mut input) } else { - bincode::deserialize_from::<_, u32>(&mut input).map(u64::from) + bincode::deserialize_from::<_, u32>(&mut input) + .map(u64::from) }; let Ok(name) = name else { break; diff --git a/src/til.rs b/src/til.rs index 4696d9c..d426018 100644 --- a/src/til.rs +++ b/src/til.rs @@ -74,22 +74,26 @@ impl TILTypeInfo { (0..=0x11, _) | (_, false) => cursor.read_u32()?.into(), (_, true) => cursor.read_u64()?, }; - let tinfo_raw = TypeRaw::read(&mut *cursor, til).with_context(|| { - format!( - "parsing `TILTypeInfo::tiinfo` for type \"{}\"", - String::from_utf8_lossy(&name) - ) - })?; + let tinfo_raw = + TypeRaw::read(&mut *cursor, til).with_context(|| { + format!( + "parsing `TILTypeInfo::tiinfo` for type \"{}\"", + String::from_utf8_lossy(&name) + ) + })?; let _info = cursor.read_c_string_raw()?; let cmt = cursor.read_c_string_raw()?; let fields = cursor.read_c_string_vec()?; let fieldcmts = cursor.read_c_string_raw()?; let sclass: u8 = cursor.read_u8()?; - let mut fields_iter = - fields - .into_iter() - .map(|field| if field.is_empty() { None } else { Some(field) }); + let mut fields_iter = fields.into_iter().map(|field| { + if field.is_empty() { + None + } else { + Some(field) + } + }); let tinfo = Type::new(til, tinfo_raw, &mut fields_iter)?; #[cfg(feature = "restrictive")] ensure!( @@ -143,15 +147,27 @@ impl Type { TypeVariantRaw::Basic(x) => TypeVariant::Basic(x), TypeVariantRaw::Bitfield(x) => TypeVariant::Bitfield(x), TypeVariantRaw::Typedef(x) => TypeVariant::Typedef(x), - TypeVariantRaw::Pointer(x) => Pointer::new(til, x, fields).map(TypeVariant::Pointer)?, + TypeVariantRaw::Pointer(x) => { + Pointer::new(til, x, fields).map(TypeVariant::Pointer)? + } TypeVariantRaw::Function(x) => { Function::new(til, x, fields).map(TypeVariant::Function)? } - TypeVariantRaw::Array(x) => Array::new(til, x, fields).map(TypeVariant::Array)?, - TypeVariantRaw::Struct(x) => Struct::new(til, x, fields).map(TypeVariant::Struct)?, - TypeVariantRaw::Union(x) => Union::new(til, x, fields).map(TypeVariant::Union)?, - TypeVariantRaw::Enum(x) => Enum::new(til, x, fields).map(TypeVariant::Enum)?, - TypeVariantRaw::StructRef(typedef) => TypeVariant::StructRef(typedef), + TypeVariantRaw::Array(x) => { + Array::new(til, x, fields).map(TypeVariant::Array)? + } + TypeVariantRaw::Struct(x) => { + Struct::new(til, x, fields).map(TypeVariant::Struct)? + } + TypeVariantRaw::Union(x) => { + Union::new(til, x, fields).map(TypeVariant::Union)? + } + TypeVariantRaw::Enum(x) => { + Enum::new(til, x, fields).map(TypeVariant::Enum)? + } + TypeVariantRaw::StructRef(typedef) => { + TypeVariant::StructRef(typedef) + } TypeVariantRaw::UnionRef(typedef) => TypeVariant::UnionRef(typedef), TypeVariantRaw::EnumRef(typedef) => TypeVariant::EnumRef(typedef), }; @@ -162,7 +178,10 @@ impl Type { }) } // TODO find the best way to handle type parsing from id0 - pub(crate) fn new_from_id0(data: &[u8], fields: Vec>) -> Result { + pub(crate) fn new_from_id0( + data: &[u8], + fields: Vec>, + ) -> Result { // TODO it's unclear what header information id0 types use to parse tils // maybe it just use the til sector header, or more likelly it's from // IDBParam in the `Root Node` @@ -195,10 +214,13 @@ impl Type { )); } } - let mut fields_iter = - fields - .into_iter() - .map(|field| if field.is_empty() { None } else { Some(field) }); + let mut fields_iter = fields.into_iter().map(|field| { + if field.is_empty() { + None + } else { + Some(field) + } + }); let result = Self::new(&header, type_raw, &mut fields_iter)?; #[cfg(feature = "restrictive")] ensure!( @@ -233,7 +255,10 @@ pub(crate) enum TypeVariantRaw { } impl TypeRaw { - pub fn read(input: &mut impl IdaGenericBufUnpack, til: &TILSectionHeader) -> Result { + pub fn read( + input: &mut impl IdaGenericBufUnpack, + til: &TILSectionHeader, + ) -> Result { let metadata: u8 = input.read_u8()?; let type_base = metadata & flag::tf_mask::TYPE_BASE_MASK; let type_flags = metadata & flag::tf_mask::TYPE_FLAGS_MASK; @@ -247,32 +272,42 @@ impl TypeRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x480335 // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x472e13 print_til_type let variant = match (type_base, type_flags) { - (..=flag::tf_last_basic::BT_LAST_BASIC, _) => Basic::new(til, type_base, type_flags) - .context("Type::Basic") - .map(TypeVariantRaw::Basic)?, + (..=flag::tf_last_basic::BT_LAST_BASIC, _) => { + Basic::new(til, type_base, type_flags) + .context("Type::Basic") + .map(TypeVariantRaw::Basic)? + } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4804d7 - (flag::tf_ptr::BT_PTR, _) => PointerRaw::read(input, til, type_flags) - .context("Type::Pointer") - .map(TypeVariantRaw::Pointer)?, + (flag::tf_ptr::BT_PTR, _) => { + PointerRaw::read(input, til, type_flags) + .context("Type::Pointer") + .map(TypeVariantRaw::Pointer)? + } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48075a - (flag::tf_array::BT_ARRAY, _) => ArrayRaw::read(input, til, type_flags) - .context("Type::Array") - .map(TypeVariantRaw::Array)?, + (flag::tf_array::BT_ARRAY, _) => { + ArrayRaw::read(input, til, type_flags) + .context("Type::Array") + .map(TypeVariantRaw::Array)? + } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x48055d - (flag::tf_func::BT_FUNC, _) => FunctionRaw::read(input, til, type_flags) - .context("Type::Function") - .map(TypeVariantRaw::Function)?, + (flag::tf_func::BT_FUNC, _) => { + FunctionRaw::read(input, til, type_flags) + .context("Type::Function") + .map(TypeVariantRaw::Function)? + } (flag::tf_complex::BT_BITFIELD, _) => TypeVariantRaw::Bitfield( Bitfield::read(input, type_flags).context("Type::Bitfield")?, ), // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x480369 - (flag::tf_complex::BT_COMPLEX, flag::tf_complex::BTMT_TYPEDEF) => Typedef::read(input) - .context("Type::Typedef") - .map(TypeVariantRaw::Typedef)?, + (flag::tf_complex::BT_COMPLEX, flag::tf_complex::BTMT_TYPEDEF) => { + Typedef::read(input) + .context("Type::Typedef") + .map(TypeVariantRaw::Typedef)? + } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x480378 @@ -296,7 +331,9 @@ impl TypeRaw { (flag::tf_complex::BT_COMPLEX, _) => unreachable!(), // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x47395d print_til_type - (flag::BT_RESERVED, _) => return Err(anyhow!("Wrong/Unknown type: {metadata:02x}")), + (flag::BT_RESERVED, _) => { + return Err(anyhow!("Wrong/Unknown type: {metadata:02x}")) + } (flag::BT_RESERVED.., _) => unreachable!(), }; @@ -307,7 +344,10 @@ impl TypeRaw { }) } - pub fn read_ref(input: &mut impl IdaGenericUnpack, header: &TILSectionHeader) -> Result { + pub fn read_ref( + input: &mut impl IdaGenericUnpack, + header: &TILSectionHeader, + ) -> Result { let mut bytes = input.unpack_dt_bytes()?; if !bytes.starts_with(b"=") { @@ -375,7 +415,9 @@ impl Basic { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x480874 BT_UNK => { let bytes = match btmt { - BTMT_SIZE0 => return Err(anyhow!("forbidden use of BT_UNK")), + BTMT_SIZE0 => { + return Err(anyhow!("forbidden use of BT_UNK")) + } BTMT_SIZE12 => 2, // BT_UNK_WORD BTMT_SIZE48 => 8, // BT_UNK_QWORD BTMT_SIZE128 => 0, // BT_UNKNOWN @@ -409,7 +451,10 @@ impl Basic { return match bt_int { BT_INT8 => Ok(Self::Char), BT_INT => Ok(Self::SegReg), // BT_SEGREG - _ => Err(anyhow!("Reserved use of tf_int::BTMT_CHAR {:x}", btmt)), + _ => Err(anyhow!( + "Reserved use of tf_int::BTMT_CHAR {:x}", + btmt + )), }; } _ => unreachable!(), @@ -478,11 +523,15 @@ impl Typedef { let mut tmp = data; let de = tmp.read_de()?; if !tmp.is_empty() { - return Err(anyhow!("Typedef Ordinal with more data then expected")); + return Err(anyhow!( + "Typedef Ordinal with more data then expected" + )); } Ok(Typedef::Ordinal(de)) } - _ => Ok(Typedef::Name(if buf.is_empty() { None } else { Some(buf) })), + _ => { + Ok(Typedef::Name(if buf.is_empty() { None } else { Some(buf) })) + } } } } @@ -518,7 +567,10 @@ impl TILMacro { let param_num = have_param.then_some((flag & 0xFF) as u8); if !have_param { #[cfg(feature = "restrictive")] - ensure!(flag & 0xFF == 0, "Unknown/Invalid value for TILMacro flag"); + ensure!( + flag & 0xFF == 0, + "Unknown/Invalid value for TILMacro flag" + ); } // TODO find the InnerRef for this let value = input.read_c_string_raw()?; @@ -539,7 +591,9 @@ impl TILMacro { } match (max_param, param_idx) { (None, _) => max_param = Some(param_idx), - (Some(max), param_idx) if param_idx > max => max_param = Some(param_idx), + (Some(max), param_idx) if param_idx > max => { + max_param = Some(param_idx) + } (Some(_), _) => {} } Some(TILMacroValue::Param(param_idx)) diff --git a/src/til/array.rs b/src/til/array.rs index 2ed4262..57bebd4 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -21,7 +21,8 @@ impl Array { alignment: value.alignment, base: value.base, nelem: value.nelem, - elem_type: Type::new(til, *value.elem_type, fields).map(Box::new)?, + elem_type: Type::new(til, *value.elem_type, fields) + .map(Box::new)?, }) } } @@ -64,8 +65,9 @@ impl ArrayRaw { let _is_unknown_8 = alignment_raw & 0x8 != 0; #[cfg(feature = "restrictive")] anyhow::ensure!(!_is_unknown_8, "Unknown flat 8 set on Array"); - alignment = ((alignment_raw & 0x7) != 0) - .then(|| NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap()); + alignment = ((alignment_raw & 0x7) != 0).then(|| { + NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap() + }); #[cfg(feature = "restrictive")] anyhow::ensure!( tattr & !MAX_DECL_ALIGN == 0, diff --git a/src/til/bitfield.rs b/src/til/bitfield.rs index a289307..4507d08 100644 --- a/src/til/bitfield.rs +++ b/src/til/bitfield.rs @@ -27,7 +27,10 @@ pub struct Bitfield { } impl Bitfield { - pub(crate) fn read(input: &mut impl IdaGenericBufUnpack, metadata: u8) -> Result { + pub(crate) fn read( + input: &mut impl IdaGenericBufUnpack, + metadata: u8, + ) -> Result { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x472f3c print_til_type let nbytes = match metadata { super::flag::tf_complex::BTMT_BFLDI8 => 1, @@ -46,7 +49,10 @@ impl Bitfield { extended: _extended, }) => { #[cfg(feature = "restrictive")] - anyhow::ensure!(_tattr == 0, "Unknown TypeAttribute {_tattr:x}"); + anyhow::ensure!( + _tattr == 0, + "Unknown TypeAttribute {_tattr:x}" + ); #[cfg(feature = "restrictive")] anyhow::ensure!( _extended.is_none(), diff --git a/src/til/flag.rs b/src/til/flag.rs index 21ed69f..05405e0 100644 --- a/src/til/flag.rs +++ b/src/til/flag.rs @@ -391,7 +391,9 @@ pub mod tf_conv_unk { /// Convenience definitions: shortcuts pub mod tf_shortcuts { - use super::{tf_bool, tf_complex, tf_conv_unk, tf_float, tf_int, tf_unk, TypeT}; + use super::{ + tf_bool, tf_complex, tf_conv_unk, tf_float, tf_int, tf_unk, TypeT, + }; /// byte pub const BTF_BYTE: TypeT = tf_conv_unk::BT_UNK_BYTE; /// unknown @@ -448,13 +450,16 @@ pub mod tf_shortcuts { pub const BTF_TBYTE: TypeT = tf_float::BT_FLOAT | tf_float::BTMT_SPECFLT; /// struct - pub const BTF_STRUCT: TypeT = tf_complex::BT_COMPLEX | tf_complex::BTMT_STRUCT; + pub const BTF_STRUCT: TypeT = + tf_complex::BT_COMPLEX | tf_complex::BTMT_STRUCT; /// union - pub const BTF_UNION: TypeT = tf_complex::BT_COMPLEX | tf_complex::BTMT_UNION; + pub const BTF_UNION: TypeT = + tf_complex::BT_COMPLEX | tf_complex::BTMT_UNION; /// enum pub const BTF_ENUM: TypeT = tf_complex::BT_COMPLEX | tf_complex::BTMT_ENUM; /// typedef - pub const BTF_TYPEDEF: TypeT = tf_complex::BT_COMPLEX | tf_complex::BTMT_TYPEDEF; + pub const BTF_TYPEDEF: TypeT = + tf_complex::BT_COMPLEX | tf_complex::BTMT_TYPEDEF; } /// Type attributes diff --git a/src/til/function.rs b/src/til/function.rs index 925b6b1..7fe76ec 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -153,7 +153,11 @@ impl FunctionRaw { let is_static = flags_lower & BFA_STATIC != 0; let is_virtual = flags_lower & BFA_VIRTUAL != 0; #[cfg(feature = "restrictive")] - ensure!(flags_lower & !(BFA_NORET | BFA_PURE | BFA_HIGH | BFA_STATIC | BFA_VIRTUAL) == 0); + ensure!( + flags_lower + & !(BFA_NORET | BFA_PURE | BFA_HIGH | BFA_STATIC | BFA_VIRTUAL) + == 0 + ); // TODO find those flags const BFA_CONST: u8 = 0x4; @@ -164,13 +168,17 @@ impl FunctionRaw { let is_constructor = flags_upper & BFA_CONSTRUCTOR != 0; let is_destructor = flags_upper & BFA_DESTRUCTOR != 0; #[cfg(feature = "restrictive")] - ensure!(flags_upper & !(BFA_CONST | BFA_CONSTRUCTOR | BFA_DESTRUCTOR) == 0); + ensure!( + flags_upper & !(BFA_CONST | BFA_CONSTRUCTOR | BFA_DESTRUCTOR) == 0 + ); - let ret = TypeRaw::read(&mut *input, header).context("Return Argument")?; + let ret = + TypeRaw::read(&mut *input, header).context("Return Argument")?; // TODO double check documentation for [flag::tf_func::BT_FUN] - let is_special_pe = cc.map(CallingConvention::is_special_pe).unwrap_or(false); - let have_retloc = - is_special_pe && !matches!(&ret.variant, TypeVariantRaw::Basic(Basic::Void)); + let is_special_pe = + cc.map(CallingConvention::is_special_pe).unwrap_or(false); + let have_retloc = is_special_pe + && !matches!(&ret.variant, TypeVariantRaw::Basic(Basic::Void)); let retloc = have_retloc .then(|| ArgLoc::read(&mut *input)) .transpose() @@ -278,7 +286,9 @@ impl ArgLoc { Ok(Self::Static(sval)) } #[cfg(feature = "restrictive")] - ALOC_CUSTOM.. => Err(anyhow!("Custom implementation for ArgLoc")), + ALOC_CUSTOM.. => { + Err(anyhow!("Custom implementation for ArgLoc")) + } #[cfg(not(feature = "restrictive"))] ALOC_CUSTOM.. => Ok(Self::None), } @@ -323,9 +333,15 @@ impl CallingConvention { Ok(Some(match cm & CM_CC_MASK { // !ERR(spoil)! - CM_CC_SPOILED => return Err(anyhow!("Unexpected Spoiled Function Calling Convention")), + CM_CC_SPOILED => { + return Err(anyhow!( + "Unexpected Spoiled Function Calling Convention" + )) + } // this is an invalid value - CM_CC_INVALID => return Err(anyhow!("Invalid Function Calling Convention")), + CM_CC_INVALID => { + return Err(anyhow!("Invalid Function Calling Convention")) + } CM_CC_UNKNOWN => return Ok(None), CM_CC_VOIDARG => Self::Voidarg, CM_CC_CDECL => Self::Cdecl, @@ -457,7 +473,9 @@ pub enum CallMethod { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x476e60 /// [BT_FUNC](https://hex-rays.com/products/ida/support/sdkdoc/group__tf__func.html#ga7b7fee21f21237beb6d91e854410e0fa) -fn read_cc(input: &mut impl IdaGenericBufUnpack) -> Result<(u8, u16, Vec<(u16, u8)>)> { +fn read_cc( + input: &mut impl IdaGenericBufUnpack, +) -> Result<(u8, u16, Vec<(u16, u8)>)> { let mut cc = input.read_u8()?; // TODO find the flag for that if cc & 0xF0 != 0xA0 { diff --git a/src/til/pointer.rs b/src/til/pointer.rs index 56d9a68..4d69122 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -23,7 +23,8 @@ impl Pointer { .map(|(t, v)| -> Result<_> { Ok(( // TODO if this type allow non typedef, this may consume fields - Type::new(til, *t, &mut vec![].into_iter()).map(Box::new)?, + Type::new(til, *t, &mut vec![].into_iter()) + .map(Box::new)?, v, )) }) @@ -116,7 +117,8 @@ impl PointerRaw { let ptr_type = tattr & TAPTR_RESTRICT; #[cfg(feature = "restrictive")] anyhow::ensure!( - tattr & !(TAPTR_SHIFTED | TAPTR_RESTRICT | MAX_DECL_ALIGN) == 0, + tattr & !(TAPTR_SHIFTED | TAPTR_RESTRICT | MAX_DECL_ALIGN) + == 0, "Invalid Pointer taenum_bits {tattr:x}" ); if let Some(_extended) = _extended { @@ -170,7 +172,10 @@ pub(crate) enum PointerTypeRaw { } impl PointerTypeRaw { - fn read(input: &mut impl IdaGenericBufUnpack, header: &TILSectionHeader) -> Result { + fn read( + input: &mut impl IdaGenericBufUnpack, + header: &TILSectionHeader, + ) -> Result { let closure_type = input.read_u8()?; if closure_type == 0xFF { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x473b5a diff --git a/src/til/section.rs b/src/til/section.rs index 4aa4d23..2383c9d 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -99,7 +99,8 @@ impl TILSection { match compress { IDBSectionCompression::None => Self::read_inner(input), IDBSectionCompression::Zlib => { - let mut input = BufReader::new(flate2::bufread::ZlibDecoder::new(input)); + let mut input = + BufReader::new(flate2::bufread::ZlibDecoder::new(input)); Self::read_inner(&mut input) } } @@ -221,13 +222,17 @@ impl TILSection { Ok((Some(next_ord), Some(ordinals))) } - fn read_header(input: &mut impl IdaGenericUnpack) -> Result { + fn read_header( + input: &mut impl IdaGenericUnpack, + ) -> Result { // TODO this break a few files let signature: [u8; 6] = bincode::deserialize_from(&mut *input)?; ensure!(signature == *TIL_SECTION_MAGIC, "Invalid TIL Signature"); // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x431eb5 let (format, flags) = match input.read_u32()? { - format @ 0x13.. => return Err(anyhow!("Invalid TIL format {format}")), + format @ 0x13.. => { + return Err(anyhow!("Invalid TIL format {format}")) + } // read the flag after the format format @ 0x10..=0x12 => { let flags = TILSectionFlags::new(input.read_u32()?)?; @@ -259,7 +264,8 @@ impl TILSection { .collect::>(); } - let header2: TILSectionHeader2 = bincode::deserialize_from(&mut *input)?; + let header2: TILSectionHeader2 = + bincode::deserialize_from(&mut *input)?; // TODO header2.cm default to 0x13 // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x42ef86 @@ -273,8 +279,10 @@ impl TILSection { let ls = input.read_u8()?; let lls = input.read_u8()?; Ok(TILSectionExtendedSizeofInfo { - size_short: NonZeroU8::new(ss).ok_or_else(|| anyhow!("Invalid short size"))?, - size_long: NonZeroU8::new(ls).ok_or_else(|| anyhow!("Invalid long size"))?, + size_short: NonZeroU8::new(ss) + .ok_or_else(|| anyhow!("Invalid short size"))?, + size_long: NonZeroU8::new(ls) + .ok_or_else(|| anyhow!("Invalid long size"))?, size_long_long: NonZeroU8::new(lls) .ok_or_else(|| anyhow!("Invalid long long size"))?, }) @@ -289,8 +297,8 @@ impl TILSection { .transpose()? .map(|size| size.try_into()) .transpose()?; - let def_align = - (header2.def_align != 0).then(|| NonZeroU8::new(1 << (header2.def_align - 1)).unwrap()); + let def_align = (header2.def_align != 0) + .then(|| NonZeroU8::new(1 << (header2.def_align - 1)).unwrap()); Ok(TILSectionHeader { format: header1.format, @@ -316,10 +324,13 @@ impl TILSection { ) -> Result<()> { match compress { IDBSectionCompression::Zlib => { - let mut input = BufReader::new(flate2::bufread::ZlibDecoder::new(input)); + let mut input = + BufReader::new(flate2::bufread::ZlibDecoder::new(input)); Self::decompress_inner(&mut input, output) } - IDBSectionCompression::None => Self::decompress_inner(input, output), + IDBSectionCompression::None => { + Self::decompress_inner(input, output) + } } } @@ -372,7 +383,10 @@ impl TILSection { } if header.flags.has_size_long_double() { - bincode::serialize_into(&mut *output, &header.size_long_double.unwrap().get())?; + bincode::serialize_into( + &mut *output, + &header.size_long_double.unwrap().get(), + )?; } // if not zipped, just copy the rest of the data, there is no possible zip @@ -533,7 +547,9 @@ pub(crate) struct TILBucketRaw { } impl TILSection { - fn read_bucket_header(input: &mut impl IdaGenericUnpack) -> Result<(u32, u32)> { + fn read_bucket_header( + input: &mut impl IdaGenericUnpack, + ) -> Result<(u32, u32)> { let ndefs = bincode::deserialize_from(&mut *input)?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x42e3e0 //ensure!(ndefs < 0x55555555); @@ -541,7 +557,9 @@ impl TILSection { Ok((ndefs, len)) } - fn read_bucket_zip_header(input: &mut impl IdaGenericUnpack) -> Result<(u32, u32, u32)> { + fn read_bucket_zip_header( + input: &mut impl IdaGenericUnpack, + ) -> Result<(u32, u32, u32)> { let (ndefs, len) = Self::read_bucket_header(&mut *input)?; let compressed_len = bincode::deserialize_from(&mut *input)?; Ok((ndefs, len, compressed_len)) @@ -554,9 +572,19 @@ impl TILSection { ordinal_alias: Option<&[(u32, u32)]>, ) -> Result> { if header.flags.is_zip() { - Self::read_bucket_zip(&mut *input, header, next_ordinal, ordinal_alias) + Self::read_bucket_zip( + &mut *input, + header, + next_ordinal, + ordinal_alias, + ) } else { - Self::read_bucket_normal(&mut *input, header, next_ordinal, ordinal_alias) + Self::read_bucket_normal( + &mut *input, + header, + next_ordinal, + ordinal_alias, + ) } } @@ -567,7 +595,14 @@ impl TILSection { ordinal_alias: Option<&[(u32, u32)]>, ) -> Result> { let (ndefs, len) = Self::read_bucket_header(&mut *input)?; - Self::read_bucket_inner(&mut *input, header, ndefs, len, next_ordinal, ordinal_alias) + Self::read_bucket_inner( + &mut *input, + header, + ndefs, + len, + next_ordinal, + ordinal_alias, + ) } fn read_bucket_zip( @@ -576,10 +611,13 @@ impl TILSection { next_ordinal: Option, ordinal_alias: Option<&[(u32, u32)]>, ) -> Result> { - let (ndefs, len, compressed_len) = Self::read_bucket_zip_header(&mut *input)?; + let (ndefs, len, compressed_len) = + Self::read_bucket_zip_header(&mut *input)?; // make sure the decompressor don't read out-of-bounds let mut compressed_input = input.take(compressed_len.into()); - let mut inflate = BufReader::new(flate2::bufread::ZlibDecoder::new(&mut compressed_input)); + let mut inflate = BufReader::new(flate2::bufread::ZlibDecoder::new( + &mut compressed_input, + )); // make sure only the defined size is decompressed let type_info = Self::read_bucket_inner( &mut inflate, @@ -637,7 +675,9 @@ impl TILSection { } } - fn read_macros_normal(input: &mut impl IdaGenericBufUnpack) -> Result> { + fn read_macros_normal( + input: &mut impl IdaGenericBufUnpack, + ) -> Result> { let (ndefs, len) = Self::read_bucket_header(&mut *input)?; let mut input = input.take(len.into()); let type_info = (0..ndefs) @@ -651,11 +691,16 @@ impl TILSection { Ok(type_info) } - fn read_macros_zip(input: &mut impl IdaGenericBufUnpack) -> Result> { - let (ndefs, len, compressed_len) = Self::read_bucket_zip_header(&mut *input)?; + fn read_macros_zip( + input: &mut impl IdaGenericBufUnpack, + ) -> Result> { + let (ndefs, len, compressed_len) = + Self::read_bucket_zip_header(&mut *input)?; // make sure the decompressor don't read out-of-bounds let mut compressed_input = input.take(compressed_len.into()); - let inflate = BufReader::new(flate2::bufread::ZlibDecoder::new(&mut compressed_input)); + let inflate = BufReader::new(flate2::bufread::ZlibDecoder::new( + &mut compressed_input, + )); // make sure only the defined size is decompressed let mut decompressed_input = inflate.take(len.into()); let type_info = (0..ndefs.try_into().unwrap()) @@ -680,7 +725,8 @@ impl TILSection { input: &mut impl IdaGenericBufUnpack, output: &mut impl std::io::Write, ) -> Result<()> { - let (ndefs, len, compressed_len) = Self::read_bucket_zip_header(&mut *input)?; + let (ndefs, len, compressed_len) = + Self::read_bucket_zip_header(&mut *input)?; bincode::serialize_into(&mut *output, &TILBucketRaw { len, ndefs })?; // write the decompressed data let mut compressed_input = input.take(compressed_len.into()); diff --git a/src/til/size_calculator.rs b/src/til/size_calculator.rs index a64f185..c809d9b 100644 --- a/src/til/size_calculator.rs +++ b/src/til/size_calculator.rs @@ -27,7 +27,11 @@ impl<'a> TILTypeSizeSolver<'a> { // TODO make a type for type_idx and symbol_idx, accept both here /// NOTE that type_idx need to be specified if not a symbol - pub fn type_size_bytes(&mut self, type_idx: Option, ty: &Type) -> Option { + pub fn type_size_bytes( + &mut self, + type_idx: Option, + ty: &Type, + ) -> Option { assert!(self.solving.is_empty()); if let Some(idx) = type_idx { // if cached return it @@ -58,15 +62,27 @@ impl<'a> TILTypeSizeSolver<'a> { TypeVariant::Basic(Basic::SegReg) => 1, TypeVariant::Basic(Basic::Void) => 0, TypeVariant::Basic(Basic::Unknown { bytes }) => (*bytes).into(), - TypeVariant::Basic(Basic::Bool) => self.section.size_bool.get().into(), - TypeVariant::Basic(Basic::Short { .. }) => self.section.sizeof_short().get().into(), - TypeVariant::Basic(Basic::Int { .. }) => self.section.size_int.get().into(), - TypeVariant::Basic(Basic::Long { .. }) => self.section.sizeof_long().get().into(), + TypeVariant::Basic(Basic::Bool) => { + self.section.size_bool.get().into() + } + TypeVariant::Basic(Basic::Short { .. }) => { + self.section.sizeof_short().get().into() + } + TypeVariant::Basic(Basic::Int { .. }) => { + self.section.size_int.get().into() + } + TypeVariant::Basic(Basic::Long { .. }) => { + self.section.sizeof_long().get().into() + } TypeVariant::Basic(Basic::LongLong { .. }) => { self.section.sizeof_long_long().get().into() } - TypeVariant::Basic(Basic::IntSized { bytes, .. }) => bytes.get().into(), - TypeVariant::Basic(Basic::BoolSized { bytes }) => bytes.get().into(), + TypeVariant::Basic(Basic::IntSized { bytes, .. }) => { + bytes.get().into() + } + TypeVariant::Basic(Basic::BoolSized { bytes }) => { + bytes.get().into() + } // TODO what's the long double default size if it's not defined? TypeVariant::Basic(Basic::LongDouble) => self .section @@ -79,7 +95,8 @@ impl<'a> TILTypeSizeSolver<'a> { TypeVariant::Pointer(_) => self.section.addr_size().get().into(), TypeVariant::Function(_) => 0, // function type dont have a size, only a pointer to it TypeVariant::Array(array) => { - let element_len = self.inner_type_size_bytes(&array.elem_type)?; + let element_len = + self.inner_type_size_bytes(&array.elem_type)?; let nelem = array.nelem.map(|x| x.get()).unwrap_or(0) as u64; element_len * nelem } @@ -97,27 +114,34 @@ impl<'a> TILTypeSizeSolver<'a> { // no more members break; }; - let field_size = match &first_member.member_type.type_variant { - // if bit-field, condensate one or more to create a byte-field - TypeVariant::Bitfield(bitfield) => { - members = &members[1..]; - // NOTE it skips 0..n members - condensate_bitfields_from_struct(*bitfield, &mut members) + let field_size = + match &first_member.member_type.type_variant { + // if bit-field, condensate one or more to create a byte-field + TypeVariant::Bitfield(bitfield) => { + members = &members[1..]; + // NOTE it skips 0..n members + condensate_bitfields_from_struct( + *bitfield, + &mut members, + ) .get() .into() - } - // get the inner type size - _ => { - let first = &members[0]; - members = &members[1..]; - // next member - self.inner_type_size_bytes(&first.member_type)? - } - }; + } + // get the inner type size + _ => { + let first = &members[0]; + members = &members[1..]; + // next member + self.inner_type_size_bytes(&first.member_type)? + } + }; if !til_struct.is_unaligned { let align = match ( first_member.alignment.map(|x| x.get().into()), - self.alignemnt(&first_member.member_type, field_size), + self.alignemnt( + &first_member.member_type, + field_size, + ), ) { (Some(a), Some(b)) => a.max(b), (Some(a), None) | (None, Some(a)) => a, @@ -179,9 +203,9 @@ impl<'a> TILTypeSizeSolver<'a> { fn alignemnt(&mut self, til: &Type, til_size: u64) -> Option { match &til.type_variant { // TODO basic types have a inherited alignment? - TypeVariant::Basic(_) | TypeVariant::Enum(_) | TypeVariant::Pointer(_) => { - Some(til_size) - } + TypeVariant::Basic(_) + | TypeVariant::Enum(_) + | TypeVariant::Pointer(_) => Some(til_size), TypeVariant::Array(array) => { let size = self.inner_type_size_bytes(&array.elem_type); self.alignemnt(&array.elem_type, size.unwrap_or(1)) @@ -205,7 +229,8 @@ impl<'a> TILTypeSizeSolver<'a> { Typedef::Name(None) => None, }; ty.and_then(|ty| { - let size = self.inner_type_size_bytes(&ty.tinfo).unwrap_or(1); + let size = + self.inner_type_size_bytes(&ty.tinfo).unwrap_or(1); self.alignemnt(&ty.tinfo, size) }) } @@ -223,7 +248,8 @@ fn condensate_bitfields_from_struct( let mut condensated_bits = first_field.width; loop { - let Some(TypeVariant::Bitfield(member)) = rest.first().map(|x| &x.member_type.type_variant) + let Some(TypeVariant::Bitfield(member)) = + rest.first().map(|x| &x.member_type.type_variant) else { // no more bit-fields to condensate break; diff --git a/src/til/struct.rs b/src/til/struct.rs index 0fad21d..9139998 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -34,7 +34,14 @@ impl Struct { let members = value .members .into_iter() - .map(|member| StructMember::new(til, fields.next().flatten(), member, &mut *fields)) + .map(|member| { + StructMember::new( + til, + fields.next().flatten(), + member, + &mut *fields, + ) + }) .collect::>()?; Ok(Struct { effective_alignment: value.effective_alignment, @@ -89,7 +96,8 @@ impl StructRaw { let mem_cnt = n >> 3; // TODO what is effective_alignment and how it's diferent from Modifier alignment? let alpow = n & 7; - let effective_alignment = (alpow != 0).then(|| NonZeroU8::new(1 << (alpow - 1)).unwrap()); + let effective_alignment = + (alpow != 0).then(|| NonZeroU8::new(1 << (alpow - 1)).unwrap()); // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x459c97 let mut alignment = None; let mut is_unknown_8 = false; @@ -146,8 +154,13 @@ impl StructRaw { let members = (0..mem_cnt) .map(|i| { - StructMemberRaw::read(&mut *input, header, is_method, is_bitset2) - .with_context(|| format!("Member {i}")) + StructMemberRaw::read( + &mut *input, + header, + is_method, + is_bitset2, + ) + .with_context(|| format!("Member {i}")) }) .collect::>()?; @@ -244,12 +257,16 @@ impl StructMemberRaw { let alignment_raw = (tattr & MAX_DECL_ALIGN) as u8; is_unknown_8 = alignment_raw & 0x8 != 0; - alignment = ((alignment_raw & 0x7) != 0) - .then(|| NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap()); + alignment = ((alignment_raw & 0x7) != 0).then(|| { + NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap() + }); is_baseclass = tattr & TAFLD_BASECLASS != 0; is_unaligned = tattr & TAFLD_UNALIGNED != 0; let is_virtbase = tattr & TAFLD_VIRTBASE != 0; - ensure!(!is_virtbase, "UDT Member virtual base is not supported yet"); + ensure!( + !is_virtbase, + "UDT Member virtual base is not supported yet" + ); is_vft = tattr & TAFLD_VFTABLE != 0; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x478203 is_method = tattr & TAFLD_METHOD != 0; @@ -298,7 +315,9 @@ impl StructMemberRaw { let att = input.read_ext_att()?; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x486d0d match att & 0xf { - 0xd..=0xf => Err(anyhow!("Invalid value for member attribute {att:#x}")), + 0xd..=0xf => { + Err(anyhow!("Invalid value for member attribute {att:#x}")) + } 0..=7 => Ok(StructMemberAtt::Var0to7(Self::basic_att(input, att)?)), 8 | 0xb => todo!(), // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x486d3f @@ -329,7 +348,10 @@ impl StructMemberRaw { } } - fn basic_att(input: &mut impl IdaGenericBufUnpack, att: u64) -> Result { + fn basic_att( + input: &mut impl IdaGenericBufUnpack, + att: u64, + ) -> Result { if (att >> 8) & 0x10 != 0 { // TODO this is diferent from the implementation, double check the read_de and this code // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x486df0 @@ -413,7 +435,9 @@ impl StructMemberAtt { val1, val2, val3: u32::MAX, - }) if att & 0x1000 != 0 => ExtAttBasic::from_raw(att & !0x1000, Some((val1, val2))), + }) if att & 0x1000 != 0 => { + ExtAttBasic::from_raw(att & !0x1000, Some((val1, val2))) + } _ => None, } } @@ -513,7 +537,10 @@ impl ExtAttBasic { let is_lzero = value & 0x800 != 0; let tabform = val1.map(|(val1, val2)| { - let val1 = ExtAttBasicTabformVal1::try_from_primitive(val1.try_into().ok()?).ok()?; + let val1 = ExtAttBasicTabformVal1::try_from_primitive( + val1.try_into().ok()?, + ) + .ok()?; Some(ExtAttBasicTabform { val1, val2 }) }); let tabform = match tabform { diff --git a/src/til/union.rs b/src/til/union.rs index 13bd82b..54485d5 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -87,8 +87,9 @@ impl UnionRaw { let alignment_raw = (tattr & MAX_DECL_ALIGN) as u8; is_unknown_8 = alignment_raw & 0x8 != 0; - alignment = ((alignment_raw & 0x7) != 0) - .then(|| NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap()); + alignment = ((alignment_raw & 0x7) != 0).then(|| { + NonZeroU8::new(1 << ((alignment_raw & 0x7) - 1)).unwrap() + }); is_unaligned = tattr & TAUDT_UNALIGNED != 0; const _ALL_FLAGS: u16 = MAX_DECL_ALIGN | TAUDT_UNALIGNED; @@ -105,7 +106,10 @@ impl UnionRaw { } let members = (0..mem_cnt) - .map(|i| TypeRaw::read(&mut *input, header).with_context(|| format!("Member {i}"))) + .map(|i| { + TypeRaw::read(&mut *input, header) + .with_context(|| format!("Member {i}")) + }) .collect::>()?; Ok(TypeVariantRaw::Union(Self { effective_alignment, diff --git a/src/tools/decompress_til.rs b/src/tools/decompress_til.rs index 6fe92b7..355c16b 100644 --- a/src/tools/decompress_til.rs +++ b/src/tools/decompress_til.rs @@ -14,16 +14,20 @@ pub fn decompress_til(args: &Args, til_args: &DecompressTilArgs) -> Result<()> { FileType::Idb => { let input = BufReader::new(File::open(&args.input)?); let mut parser = IDBParser::new(input)?; - let til_offset = parser - .til_section_offset() - .ok_or_else(|| anyhow!("IDB file don't contains a TIL sector"))?; + let til_offset = parser.til_section_offset().ok_or_else(|| { + anyhow!("IDB file don't contains a TIL sector") + })?; // TODO make decompress til public parser.decompress_til_section(til_offset, &mut output) } FileType::Til => { let mut input = BufReader::new(File::open(&args.input)?); // TODO make decompress til public - TILSection::decompress(&mut input, &mut output, idb_rs::IDBSectionCompression::None) + TILSection::decompress( + &mut input, + &mut output, + idb_rs::IDBSectionCompression::None, + ) } } } diff --git a/src/tools/dump_addr_info.rs b/src/tools/dump_addr_info.rs index c73b30a..5905709 100644 --- a/src/tools/dump_addr_info.rs +++ b/src/tools/dump_addr_info.rs @@ -8,8 +8,12 @@ pub fn dump_addr_info(args: &Args) -> Result<()> { // TODO create a function for that in ida_info let version = match id0.ida_info()? { - idb_rs::id0::IDBParam::V1(idb_rs::id0::IDBParam1 { version, .. }) => version, - idb_rs::id0::IDBParam::V2(idb_rs::id0::IDBParam2 { version, .. }) => version, + idb_rs::id0::IDBParam::V1(idb_rs::id0::IDBParam1 { + version, .. + }) => version, + idb_rs::id0::IDBParam::V2(idb_rs::id0::IDBParam2 { + version, .. + }) => version, }; for entry in id0.address_info(version)? { let (addr, info) = entry?; @@ -19,7 +23,10 @@ pub fn dump_addr_info(args: &Args) -> Result<()> { key: [key_type, rest @ ..], value, } if (*key_type as char).is_ascii_graphic() => { - println!("Other('{}':{rest:02x?}:{value:02x?})", *key_type as char); + println!( + "Other('{}':{rest:02x?}:{value:02x?})", + *key_type as char + ); } idb_rs::id0::AddressInfo::Other { key, value } => { println!("Other({key:02x?}:{value:02x?})",); diff --git a/src/tools/dump_dirtree.rs b/src/tools/dump_dirtree.rs index fbe1c23..67e86bc 100644 --- a/src/tools/dump_dirtree.rs +++ b/src/tools/dump_dirtree.rs @@ -1,6 +1,9 @@ use idb_rs::id0::{DirTreeEntry, DirTreeRoot}; -pub fn print_dirtree(mut handle_print: impl FnMut(&T), dirtree: &DirTreeRoot) { +pub fn print_dirtree( + mut handle_print: impl FnMut(&T), + dirtree: &DirTreeRoot, +) { inner_print_dirtree(&mut handle_print, &dirtree.entries, 0); } diff --git a/src/tools/dump_dirtree_funcs.rs b/src/tools/dump_dirtree_funcs.rs index 68611e4..1c53df0 100644 --- a/src/tools/dump_dirtree_funcs.rs +++ b/src/tools/dump_dirtree_funcs.rs @@ -19,7 +19,8 @@ pub fn print_function(id0: &ID0Section, address: Id0Address) -> Result<()> { let mut ty = None; for info in infos { match info? { - idb_rs::id0::AddressInfo::Comment(_) | idb_rs::id0::AddressInfo::Other { .. } => {} + idb_rs::id0::AddressInfo::Comment(_) + | idb_rs::id0::AddressInfo::Other { .. } => {} idb_rs::id0::AddressInfo::Label(label) => { if let Some(_old) = name.replace(label) { panic!("Multiple labels can't be return for address") @@ -27,7 +28,10 @@ pub fn print_function(id0: &ID0Section, address: Id0Address) -> Result<()> { } idb_rs::id0::AddressInfo::TilType(addr_ty) => { ensure!( - matches!(&addr_ty.type_variant, idb_rs::til::TypeVariant::Function(_)), + matches!( + &addr_ty.type_variant, + idb_rs::til::TypeVariant::Function(_) + ), "Type for function at {address:#?} is invalid" ); if let Some(_old) = ty.replace(addr_ty) { diff --git a/src/tools/dump_dirtree_types.rs b/src/tools/dump_dirtree_types.rs index 1671bf8..497140a 100644 --- a/src/tools/dump_dirtree_types.rs +++ b/src/tools/dump_dirtree_types.rs @@ -9,17 +9,19 @@ use idb_rs::{id0::Id0TilOrd, IDBParser}; pub fn dump_dirtree_types(args: &Args) -> Result<()> { // parse the id0 sector/file let (id0, til) = match args.input_type() { - FileType::Til => return Err(anyhow!("TIL don't contains any ID0 data")), + FileType::Til => { + return Err(anyhow!("TIL don't contains any ID0 data")) + } FileType::Idb => { let input = BufReader::new(File::open(&args.input)?); let mut parser = IDBParser::new(input)?; - let id0_offset = parser - .id0_section_offset() - .ok_or_else(|| anyhow!("IDB file don't contains a ID0 sector"))?; + let id0_offset = parser.id0_section_offset().ok_or_else(|| { + anyhow!("IDB file don't contains a ID0 sector") + })?; let id0 = parser.read_id0_section(id0_offset)?; - let til_offset = parser - .til_section_offset() - .ok_or_else(|| anyhow!("IDB file don't contains a TIL sector"))?; + let til_offset = parser.til_section_offset().ok_or_else(|| { + anyhow!("IDB file don't contains a TIL sector") + })?; let til = parser.read_til_section(til_offset)?; (id0, til) } diff --git a/src/tools/dump_functions.rs b/src/tools/dump_functions.rs index e052f1b..72988fc 100644 --- a/src/tools/dump_functions.rs +++ b/src/tools/dump_functions.rs @@ -75,7 +75,9 @@ pub fn dump_functions(args: &Args) -> Result<()> { print!(" {:#x}:", address.as_u64()); print_function(&id0, address)? } - idb_rs::id0::DirTreeEntry::Directory { name: _, entries } => buffer.extend(entries), + idb_rs::id0::DirTreeEntry::Directory { name: _, entries } => { + buffer.extend(entries) + } } } diff --git a/src/tools/dump_segments.rs b/src/tools/dump_segments.rs index 5b2e987..f85ac2d 100644 --- a/src/tools/dump_segments.rs +++ b/src/tools/dump_segments.rs @@ -13,8 +13,12 @@ pub fn dump_segments(args: &Args) -> Result<()> { // TODO create a function for that in ida_info let version = match id0.ida_info()? { - idb_rs::id0::IDBParam::V1(idb_rs::id0::IDBParam1 { version, .. }) => version, - idb_rs::id0::IDBParam::V2(idb_rs::id0::IDBParam2 { version, .. }) => version, + idb_rs::id0::IDBParam::V1(idb_rs::id0::IDBParam1 { + version, .. + }) => version, + idb_rs::id0::IDBParam::V2(idb_rs::id0::IDBParam2 { + version, .. + }) => version, }; println!(); println!("Segments AKA `$ fileregions`: "); diff --git a/src/tools/dump_til.rs b/src/tools/dump_til.rs index 190f96c..9f2a374 100644 --- a/src/tools/dump_til.rs +++ b/src/tools/dump_til.rs @@ -14,9 +14,9 @@ pub fn dump_til(args: &Args) -> Result<()> { FileType::Idb => { let input = BufReader::new(File::open(&args.input)?); let mut parser = IDBParser::new(input)?; - let til_offset = parser - .til_section_offset() - .ok_or_else(|| anyhow!("IDB file don't contains a TIL sector"))?; + let til_offset = parser.til_section_offset().ok_or_else(|| { + anyhow!("IDB file don't contains a TIL sector") + })?; parser.read_til_section(til_offset)? } FileType::Til => { @@ -94,8 +94,12 @@ pub fn dump_til(args: &Args) -> Result<()> { let value: String = value .iter() .map(|c| match c { - idb_rs::til::TILMacroValue::Char(c) => format!("{}", *c as char), - idb_rs::til::TILMacroValue::Param(param) => format!("{{P{}}}", *param), + idb_rs::til::TILMacroValue::Char(c) => { + format!("{}", *c as char) + } + idb_rs::til::TILMacroValue::Param(param) => { + format!("{{P{}}}", *param) + } }) .collect(); println!("------------------------------`{name}`------------------------------"); diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index a06b801..27d40df 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -7,7 +7,9 @@ use idb_rs::til::r#enum::Enum; use idb_rs::til::r#struct::{Struct, StructMemberAtt}; use idb_rs::til::section::TILSection; use idb_rs::til::union::Union; -use idb_rs::til::{Basic, TILTypeInfo, TILTypeSizeSolver, Type, TypeVariant, Typedef}; +use idb_rs::til::{ + Basic, TILTypeInfo, TILTypeSizeSolver, Type, TypeVariant, Typedef, +}; use idb_rs::IDBParser; use std::fs::File; @@ -26,9 +28,9 @@ pub fn tilib_print(args: &Args) -> anyhow::Result<()> { } FileType::Idb => { let mut parser = IDBParser::new(input)?; - let til_offset = parser - .til_section_offset() - .ok_or_else(|| anyhow::anyhow!("IDB file don't contains a TIL sector"))?; + let til_offset = parser.til_section_offset().ok_or_else(|| { + anyhow::anyhow!("IDB file don't contains a TIL sector") + })?; let section = parser.read_til_section(til_offset)?; print_til_section(std::io::stdout(), §ion)?; } @@ -159,7 +161,10 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { Ok(()) } -fn print_section_flags(fmt: &mut impl Write, section: &TILSection) -> Result<()> { +fn print_section_flags( + fmt: &mut impl Write, + section: &TILSection, +) -> Result<()> { write!(fmt, "Flags : {:04X}", section.flags.as_raw())?; if section.flags.is_zip() { write!(fmt, " compressed")?; @@ -212,9 +217,11 @@ fn print_symbols( // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a80 match len.and_then(|b| u32::try_from(b).ok()) { Some(8) => write!(fmt, " {:016X}", symbol.ordinal)?, - Some(bytes @ 0..=7) => { - write!(fmt, " {:08X}", symbol.ordinal & !(u64::MAX << (bytes * 8)))? - } + Some(bytes @ 0..=7) => write!( + fmt, + " {:08X}", + symbol.ordinal & !(u64::MAX << (bytes * 8)) + )?, _ => write!(fmt, " {:08X}", symbol.ordinal)?, } @@ -234,14 +241,23 @@ fn print_symbols( write!(fmt, " {} ", sym_kind)?; // TODO investiage this - let name = if symbol.ordinal == 0 && symbol.name.first() == Some(&b'_') { + let name = if symbol.ordinal == 0 && symbol.name.first() == Some(&b'_') + { // remove the first "_", if any &symbol.name[1..] } else { &symbol.name }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a3a - print_til_type(fmt, section, Some(name), &symbol.tinfo, true, false, true)?; + print_til_type( + fmt, + section, + Some(name), + &symbol.tinfo, + true, + false, + true, + )?; writeln!(fmt, ";")?; } Ok(()) @@ -310,7 +326,12 @@ fn print_types_by_ordinals( if let OrdType::Alias((_alias_ord, type_ord)) = ord_type { write!(fmt, "(aliased to {type_ord}) ")?; } - print_til_type_root(fmt, section, Some(&final_type.name), &final_type.tinfo)?; + print_til_type_root( + fmt, + section, + Some(&final_type.name), + &final_type.tinfo, + )?; writeln!(fmt, ";")?; } Ok(()) @@ -342,7 +363,9 @@ fn print_til_type_root( // TODO: InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4438d1 // TODO: if a is a typedef and ComplexRef or something like it, also print typedef match &til_type.type_variant { - TypeVariant::Struct(_) | TypeVariant::Union(_) | TypeVariant::Enum(_) => {} + TypeVariant::Struct(_) + | TypeVariant::Union(_) + | TypeVariant::Enum(_) => {} TypeVariant::StructRef(Typedef::Name(None)) | TypeVariant::UnionRef(Typedef::Name(None)) | TypeVariant::EnumRef(Typedef::Name(None)) => {} @@ -374,9 +397,9 @@ fn print_til_type( print_pointer_space, print_type_prefix, ), - TypeVariant::Function(function) => { - print_til_type_function(fmt, section, name, til_type, function, false) - } + TypeVariant::Function(function) => print_til_type_function( + fmt, section, name, til_type, function, false, + ), TypeVariant::Array(array) => print_til_type_array( fmt, section, @@ -386,26 +409,45 @@ fn print_til_type( print_pointer_space, print_type_prefix, ), - TypeVariant::Typedef(ref_type) => { - print_til_type_typedef(fmt, section, name, til_type, ref_type, false) - } - TypeVariant::UnionRef(ref_type) => { - print_til_type_complex_ref(fmt, section, name, til_type, ref_type, print_type_prefix) - } - TypeVariant::EnumRef(ref_type) => { - print_til_type_complex_ref(fmt, section, name, til_type, ref_type, print_type_prefix) - } - TypeVariant::StructRef(ref_type) => { - print_til_type_complex_ref(fmt, section, name, til_type, ref_type, print_type_prefix) - } - TypeVariant::Struct(til_struct) => { - print_til_type_struct(fmt, section, name, til_type, til_struct, print_name) + TypeVariant::Typedef(ref_type) => print_til_type_typedef( + fmt, section, name, til_type, ref_type, false, + ), + TypeVariant::UnionRef(ref_type) => print_til_type_complex_ref( + fmt, + section, + name, + til_type, + ref_type, + print_type_prefix, + ), + TypeVariant::EnumRef(ref_type) => print_til_type_complex_ref( + fmt, + section, + name, + til_type, + ref_type, + print_type_prefix, + ), + TypeVariant::StructRef(ref_type) => print_til_type_complex_ref( + fmt, + section, + name, + til_type, + ref_type, + print_type_prefix, + ), + TypeVariant::Struct(til_struct) => print_til_type_struct( + fmt, section, name, til_type, til_struct, print_name, + ), + TypeVariant::Union(til_union) => print_til_type_union( + fmt, section, name, til_type, til_union, print_name, + ), + TypeVariant::Enum(til_enum) => { + print_til_type_enum(fmt, section, name, til_type, til_enum) } - TypeVariant::Union(til_union) => { - print_til_type_union(fmt, section, name, til_type, til_union, print_name) + TypeVariant::Bitfield(bitfield) => { + print_til_type_bitfield(fmt, name, til_type, bitfield) } - TypeVariant::Enum(til_enum) => print_til_type_enum(fmt, section, name, til_type, til_enum), - TypeVariant::Bitfield(bitfield) => print_til_type_bitfield(fmt, name, til_type, bitfield), } } @@ -454,7 +496,9 @@ fn print_til_type_pointer( true, )?; // if the innertype is also a pointer, don't print the space - if print_pointer_space && !matches!(&pointer.typ.type_variant, TypeVariant::Pointer(_)) { + if print_pointer_space + && !matches!(&pointer.typ.type_variant, TypeVariant::Pointer(_)) + { write!(fmt, " ")?; } write!(fmt, "*")?; @@ -466,8 +510,12 @@ fn print_til_type_pointer( } match pointer.modifier { None => {} - Some(idb_rs::til::pointer::PointerModifier::Ptr32) => write!(fmt, "__ptr32 ")?, - Some(idb_rs::til::pointer::PointerModifier::Ptr64) => write!(fmt, "__ptr64 ")?, + Some(idb_rs::til::pointer::PointerModifier::Ptr32) => { + write!(fmt, "__ptr32 ")? + } + Some(idb_rs::til::pointer::PointerModifier::Ptr64) => { + write!(fmt, "__ptr64 ")? + } Some(idb_rs::til::pointer::PointerModifier::Restricted) => { write!(fmt, "__restricted ")? } @@ -552,7 +600,9 @@ fn print_til_type_function( } write!(fmt, "(")?; - for (i, (param_name, param, _argloc)) in til_function.args.iter().enumerate() { + for (i, (param_name, param, _argloc)) in + til_function.args.iter().enumerate() + { if i != 0 { write!(fmt, ", ")?; } @@ -672,7 +722,14 @@ fn print_til_type_complex_ref( fmt.write_all(name)?; } } else { - print_til_type_typedef(fmt, section, name, til_type, typedef, print_prefix)?; + print_til_type_typedef( + fmt, + section, + name, + til_type, + typedef, + print_prefix, + )?; } Ok(()) } @@ -765,7 +822,15 @@ fn print_til_type_union( write!(fmt, "{{")?; for (member_name, member) in &til_union.members { let member_name = member_name.as_deref(); - print_til_type_complex_member(fmt, section, name, member_name, member, true, true)?; + print_til_type_complex_member( + fmt, + section, + name, + member_name, + member, + true, + true, + )?; write!(fmt, ";")?; } write!(fmt, "}}") @@ -794,7 +859,8 @@ fn print_til_type_complex_member( print_name, ); }; - let qualified_parent_name: Vec<_> = parent_name.iter().chain(b"::").copied().collect(); + let qualified_parent_name: Vec<_> = + parent_name.iter().chain(b"::").copied().collect(); // TODO if the field is named, don't embeded it? if name.is_some() { @@ -830,7 +896,9 @@ fn print_til_type_complex_member( }; let inner_type = match typedef { - Typedef::Ordinal(ord) => section.get_ord(Id0TilOrd { ord: (*ord).into() }).unwrap(), + Typedef::Ordinal(ord) => { + section.get_ord(Id0TilOrd { ord: (*ord).into() }).unwrap() + } Typedef::Name(None) => { return print_til_type( fmt, @@ -891,7 +959,10 @@ fn print_til_type_enum( write!(fmt, " ")?; } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4443b0 - if til_enum.storage_size.is_some() || til_enum.is_signed || til_enum.is_unsigned { + if til_enum.storage_size.is_some() + || til_enum.is_signed + || til_enum.is_unsigned + { let bytes = til_enum.storage_size.or(section.size_enum).unwrap(); let signed = if til_enum.is_unsigned { "unsigned " @@ -907,7 +978,9 @@ fn print_til_type_enum( } write!(fmt, " = ")?; match til_enum.output_format { - Char if *value <= 0xFF => write!(fmt, "'{}'", (*value) as u8 as char)?, + Char if *value <= 0xFF => { + write!(fmt, "'{}'", (*value) as u8 as char)? + } Char => write!(fmt, "'\\xu{value:X}'")?, Hex => write!(fmt, "{value:#X}")?, SignedDecimal => write!(fmt, "{}", (*value) as i64)?, @@ -952,13 +1025,19 @@ fn print_til_struct_member_att( match &tinfo.type_variant { TypeVariant::Basic(_) => print_til_struct_member_basic_att(fmt, att)?, TypeVariant::Pointer(pointer) => match &pointer.typ.type_variant { - TypeVariant::Basic(Basic::Char) => print_til_struct_member_string_att(fmt, att)?, + TypeVariant::Basic(Basic::Char) => { + print_til_struct_member_string_att(fmt, att)? + } // TODO is valid for other then void? - TypeVariant::Basic(Basic::Void) => print_til_struct_member_void_pointer_att(fmt, att)?, + TypeVariant::Basic(Basic::Void) => { + print_til_struct_member_void_pointer_att(fmt, att)? + } _ => {} }, TypeVariant::Array(array) => match &array.elem_type.type_variant { - TypeVariant::Basic(Basic::Char) => print_til_struct_member_string_att(fmt, att)?, + TypeVariant::Basic(Basic::Char) => { + print_til_struct_member_string_att(fmt, att)? + } _ => {} }, _ => {} @@ -967,7 +1046,10 @@ fn print_til_struct_member_att( } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x4872f0 -fn print_til_struct_member_string_att(fmt: &mut impl Write, att: &StructMemberAtt) -> Result<()> { +fn print_til_struct_member_string_att( + fmt: &mut impl Write, + att: &StructMemberAtt, +) -> Result<()> { let Some(value) = att.str_type() else { // TODO don't ignore errors return Ok(()); @@ -1014,7 +1096,10 @@ fn print_til_struct_member_void_pointer_att( Ok(()) } -fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt) -> Result<()> { +fn print_til_struct_member_basic_att( + fmt: &mut impl Write, + att: &StructMemberAtt, +) -> Result<()> { // TODO incomplete implementation if let Some((val, is_auto)) = att.basic_offset_type() { write!( @@ -1075,10 +1160,18 @@ fn print_til_struct_member_basic_att(fmt: &mut impl Write, att: &StructMemberAtt Ok(()) } -fn print_til_type_prefix(fmt: &mut impl Write, tinfo: &Type, with_space: bool) -> Result<()> { +fn print_til_type_prefix( + fmt: &mut impl Write, + tinfo: &Type, + with_space: bool, +) -> Result<()> { match &tinfo.type_variant { - TypeVariant::UnionRef(_) | TypeVariant::Union(_) => write!(fmt, "union")?, - TypeVariant::StructRef(_) | TypeVariant::Struct(_) => write!(fmt, "struct")?, + TypeVariant::UnionRef(_) | TypeVariant::Union(_) => { + write!(fmt, "union")? + } + TypeVariant::StructRef(_) | TypeVariant::Struct(_) => { + write!(fmt, "struct")? + } TypeVariant::EnumRef(_) | TypeVariant::Enum(_) => write!(fmt, "enum")?, _ => return Ok(()), } @@ -1088,7 +1181,11 @@ fn print_til_type_prefix(fmt: &mut impl Write, tinfo: &Type, with_space: bool) - Ok(()) } -fn print_til_type_only(fmt: &mut impl Write, section: &TILSection, tinfo: &Type) -> Result<()> { +fn print_til_type_only( + fmt: &mut impl Write, + section: &TILSection, + tinfo: &Type, +) -> Result<()> { match &tinfo.type_variant { TypeVariant::Typedef(Typedef::Name(Some(name))) => { fmt.write_all(name)?; @@ -1194,7 +1291,9 @@ fn is_vft(section: &TILSection, typ: &Type) -> bool { TypeVariant::Struct(ty) => ty.is_vft, TypeVariant::Typedef(typedef) | TypeVariant::StructRef(typedef) => { let inner_type = match typedef { - Typedef::Ordinal(ord) => section.get_ord(Id0TilOrd { ord: (*ord).into() }), + Typedef::Ordinal(ord) => { + section.get_ord(Id0TilOrd { ord: (*ord).into() }) + } Typedef::Name(None) => return false, Typedef::Name(Some(name)) => section.get_name(name), }; @@ -1218,7 +1317,9 @@ fn print_basic_type(fmt: &mut impl Write, til_basic: &Basic) -> Result<()> { match til_basic { Basic::Bool => write!(fmt, "bool")?, Basic::Char => write!(fmt, "char")?, - Basic::Short { is_signed } => write!(fmt, "{}short", signed_name(*is_signed))?, + Basic::Short { is_signed } => { + write!(fmt, "{}short", signed_name(*is_signed))? + } Basic::Void => write!(fmt, "void")?, Basic::SegReg => write!(fmt, "SegReg")?, Basic::Unknown { bytes: 1 } => write!(fmt, "_BYTE")?, @@ -1226,9 +1327,15 @@ fn print_basic_type(fmt: &mut impl Write, til_basic: &Basic) -> Result<()> { Basic::Unknown { bytes: 4 } => write!(fmt, "_DWORD")?, Basic::Unknown { bytes: 8 } => write!(fmt, "_QWORD")?, Basic::Unknown { bytes } => write!(fmt, "unknown{bytes}")?, - Basic::Int { is_signed } => write!(fmt, "{}int", signed_name(*is_signed))?, - Basic::Long { is_signed } => write!(fmt, "{}long", signed_name(*is_signed))?, - Basic::LongLong { is_signed } => write!(fmt, "{}longlong", signed_name(*is_signed))?, + Basic::Int { is_signed } => { + write!(fmt, "{}int", signed_name(*is_signed))? + } + Basic::Long { is_signed } => { + write!(fmt, "{}long", signed_name(*is_signed))? + } + Basic::LongLong { is_signed } => { + write!(fmt, "{}longlong", signed_name(*is_signed))? + } Basic::IntSized { bytes, is_signed } => { if let Some(false) = is_signed { write!(fmt, "unsigned ")?; diff --git a/src/tools/tools.rs b/src/tools/tools.rs index 9028f9b..8a7c08b 100644 --- a/src/tools/tools.rs +++ b/src/tools/tools.rs @@ -148,9 +148,9 @@ fn get_id0_section(args: &Args) -> Result { FileType::Idb => { let input = BufReader::new(File::open(&args.input)?); let mut parser = IDBParser::new(input)?; - let id0_offset = parser - .id0_section_offset() - .ok_or_else(|| anyhow!("IDB file don't contains a TIL sector"))?; + let id0_offset = parser.id0_section_offset().ok_or_else(|| { + anyhow!("IDB file don't contains a TIL sector") + })?; parser.read_id0_section(id0_offset) } } @@ -163,7 +163,9 @@ fn main() -> Result<()> { Operation::DumpTil => dump_til(&args), Operation::DumpID0 => dump_id0(&args), //Operation::SplitIDB(split_idbargs) => split_idb(&args, split_idbargs), - Operation::DecompressTil(decompress_til_args) => decompress_til(&args, decompress_til_args), + Operation::DecompressTil(decompress_til_args) => { + decompress_til(&args, decompress_til_args) + } Operation::DumpFunctions => dump_functions(&args), Operation::DumpSegments => dump_segments(&args), Operation::DumpLoaderNames => dump_loader_name(&args), @@ -176,9 +178,15 @@ fn main() -> Result<()> { Operation::DumpDirtreeNames => dump_dirtree_names(&args), Operation::DumpDirtreeImports => dump_dirtree_imports(&args), Operation::DumpDirtreeBpts => dump_dirtree_bpts(&args), - Operation::DumpDirtreeBookmarksIdaplace => dump_dirtree_bookmarks_idaplace(&args), - Operation::DumpDirtreeBookmarksStructplace => dump_dirtree_bookmarks_structplace(&args), - Operation::DumpDirtreeBookmarksTiplace => dump_dirtree_bookmarks_tiplace(&args), + Operation::DumpDirtreeBookmarksIdaplace => { + dump_dirtree_bookmarks_idaplace(&args) + } + Operation::DumpDirtreeBookmarksStructplace => { + dump_dirtree_bookmarks_structplace(&args) + } + Operation::DumpDirtreeBookmarksTiplace => { + dump_dirtree_bookmarks_tiplace(&args) + } Operation::PrintTilib => tilib_print(&args), } } From 5faae3908546f8f6a92327269b923b98d504c78f Mon Sep 17 00:00:00 2001 From: rbran Date: Sat, 11 Jan 2025 13:29:05 -0300 Subject: [PATCH 48/53] allow a struct to reverse-inherit the cppobj from baseclass --- src/tools/tilib.rs | 23 ++++++++++++++++++----- 1 file changed, 18 insertions(+), 5 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 27d40df..5db7f77 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -742,6 +742,11 @@ fn print_til_type_struct( til_struct: &Struct, print_name: bool, ) -> Result<()> { + // TODO check innerref, maybe baseclass don't need to be the first, nor + // need to only one + let is_cppobj = til_struct.is_cppobj + || matches!(til_struct.members.first(), Some(first) if first.is_baseclass); + write!(fmt, "struct ")?; if til_struct.is_unaligned { if til_struct.is_uknown_8 { @@ -753,7 +758,7 @@ fn print_til_type_struct( if til_struct.is_msstruct { write!(fmt, "__attribute__((msstruct)) ")?; } - if til_struct.is_cppobj { + if is_cppobj { write!(fmt, "__cppobj ")?; } if til_struct.is_vft { @@ -769,15 +774,23 @@ fn print_til_type_struct( } } let mut members = &til_struct.members[..]; - if til_struct.is_cppobj { + if is_cppobj { match members.first() { - Some(baseclass) if baseclass.is_baseclass /*&& x.name.is_none()*/=> { + Some(baseclass) if baseclass.is_baseclass => { members = &members[1..]; write!(fmt, ": ")?; - print_til_type(fmt, section, None, &baseclass.member_type, true, true, false)?; + print_til_type( + fmt, + section, + None, + &baseclass.member_type, + true, + true, + false, + )?; write!(fmt, " ")?; } - _ => {}, + _ => {} } } From 16f615230d2869024dc85e93653fc50e7fa3a032 Mon Sep 17 00:00:00 2001 From: rbran Date: Sat, 11 Jan 2025 13:41:10 -0300 Subject: [PATCH 49/53] fix tilib pointer not inheriting the VFT att --- src/tools/tilib.rs | 37 +++++++++++++++++++++++++++++++++---- 1 file changed, 33 insertions(+), 4 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 5db7f77..ed3dd8b 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -254,6 +254,7 @@ fn print_symbols( section, Some(name), &symbol.tinfo, + false, true, false, true, @@ -372,7 +373,7 @@ fn print_til_type_root( // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x443906 _ => write!(fmt, "typedef ")?, } - print_til_type(fmt, section, name, til_type, true, true, true) + print_til_type(fmt, section, name, til_type, false, true, true, true) } fn print_til_type( @@ -380,6 +381,7 @@ fn print_til_type( section: &TILSection, name: Option<&[u8]>, til_type: &Type, + is_vft: bool, print_pointer_space: bool, print_type_prefix: bool, print_name: bool, @@ -394,6 +396,7 @@ fn print_til_type( name, til_type, pointer, + is_vft, print_pointer_space, print_type_prefix, ), @@ -478,6 +481,7 @@ fn print_til_type_pointer( name: Option<&[u8]>, til_type: &Type, pointer: &Pointer, + is_vft_parent: bool, print_pointer_space: bool, print_type_prefix: bool, ) -> Result<()> { @@ -491,6 +495,7 @@ fn print_til_type_pointer( section, None, &pointer.typ, + is_vft_parent, print_pointer_space, print_type_prefix, true, @@ -530,7 +535,9 @@ fn print_til_type_pointer( } // if the pointed type itself is a VFT then the pointer need to print that - if is_vft(section, &pointer.typ) { + // TODO maybe the above is not ture, it it was inheritec from the + // struct member att + if is_vft_parent || is_vft(section, &pointer.typ) { write!(fmt, " /*VFT*/")?; } } @@ -552,7 +559,16 @@ fn print_til_type_function( write!(fmt, "const ")?; } // return type - print_til_type(fmt, section, None, &til_function.ret, true, true, true)?; + print_til_type( + fmt, + section, + None, + &til_function.ret, + false, + true, + true, + true, + )?; if !matches!(&til_function.ret.type_variant, TypeVariant::Pointer(_)) { write!(fmt, " ")?; } @@ -607,7 +623,9 @@ fn print_til_type_function( write!(fmt, ", ")?; } let param_name = param_name.as_ref().map(Vec::as_slice); - print_til_type(fmt, section, param_name, param, true, false, true)?; + print_til_type( + fmt, section, param_name, param, false, true, false, true, + )?; } match til_function.calling_convention { Some(CallingConvention::Voidarg) => write!(fmt, "void")?, @@ -642,6 +660,7 @@ fn print_til_type_array( section, None, &til_array.elem_type, + false, print_pointer_space, print_type_prefix, true, @@ -784,6 +803,7 @@ fn print_til_type_struct( section, None, &baseclass.member_type, + baseclass.is_vft, true, true, false, @@ -803,6 +823,7 @@ fn print_til_type_struct( name, member_name, &member.member_type, + member.is_vft, true, true, )?; @@ -841,6 +862,7 @@ fn print_til_type_union( name, member_name, member, + false, true, true, )?; @@ -856,6 +878,7 @@ fn print_til_type_complex_member( parent_name: Option<&[u8]>, name: Option<&[u8]>, til: &Type, + is_vft: bool, print_pointer_space: bool, print_name: bool, ) -> Result<()> { @@ -867,6 +890,7 @@ fn print_til_type_complex_member( section, name, til, + is_vft, print_pointer_space, true, print_name, @@ -882,6 +906,7 @@ fn print_til_type_complex_member( section, name, til, + is_vft, print_pointer_space, true, print_name, @@ -901,6 +926,7 @@ fn print_til_type_complex_member( section, name, til, + is_vft, print_pointer_space, true, print_name, @@ -918,6 +944,7 @@ fn print_til_type_complex_member( section, name, til, + is_vft, print_pointer_space, true, print_name, @@ -934,6 +961,7 @@ fn print_til_type_complex_member( section, name, til, + is_vft, print_pointer_space, true, print_name, @@ -945,6 +973,7 @@ fn print_til_type_complex_member( section, Some(&inner_type.name), &inner_type.tinfo, + is_vft, print_pointer_space, true, false, From 5af511736a3157a2e9c421d2f3ef6eb0c14f9ef5 Mon Sep 17 00:00:00 2001 From: rbran Date: Mon, 13 Jan 2025 14:45:47 -0300 Subject: [PATCH 50/53] add til typeref resolution to creation --- src/lib.rs | 2 +- src/til.rs | 259 +++++++++++++---- src/til/array.rs | 16 +- src/til/enum.rs | 3 +- src/til/function.rs | 21 +- src/til/pointer.rs | 36 ++- src/til/section.rs | 580 ++++++++++++++++++++----------------- src/til/size_calculator.rs | 62 ++-- src/til/struct.rs | 17 +- src/til/union.rs | 13 +- src/tools/dump_til.rs | 58 ++-- src/tools/tilib.rs | 255 ++++++++-------- 12 files changed, 793 insertions(+), 529 deletions(-) diff --git a/src/lib.rs b/src/lib.rs index cc92987..8ce6ff8 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -112,7 +112,7 @@ impl IDBParser { &mut self.input, &self.header, til.0.get(), - |input, _, compress| TILSection::read(input, compress), + |input, _header, compressed| TILSection::read(input, compressed), ) } diff --git a/src/til.rs b/src/til.rs index d426018..e0abe7d 100644 --- a/src/til.rs +++ b/src/til.rs @@ -11,8 +11,10 @@ pub mod union; mod size_calculator; +use section::TILSectionHeader; pub use size_calculator::*; +use std::collections::HashMap; use std::num::NonZeroU8; use anyhow::{anyhow, ensure, Context, Result}; @@ -25,21 +27,62 @@ use crate::til::function::{Function, FunctionRaw}; use crate::til::pointer::{Pointer, PointerRaw}; use crate::til::r#enum::{Enum, EnumRaw}; use crate::til::r#struct::{Struct, StructRaw}; -use crate::til::section::TILSectionHeader; use crate::til::union::{Union, UnionRaw}; #[derive(Debug, Clone)] pub struct TILTypeInfo { - _flags: u32, pub name: Vec, pub ordinal: u64, pub tinfo: Type, +} + +impl TILTypeInfo { + pub(crate) fn new( + til: &TILSectionHeader, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, + name: Vec, + ordinal: u64, + tinfo_raw: TypeRaw, + fields: Vec>, + ) -> Result { + let mut fields_iter = fields + .into_iter() + .map(|field| (!field.is_empty()).then_some(field)); + let tinfo = Type::new( + til, + type_by_name, + type_by_ord, + tinfo_raw, + &mut fields_iter, + )?; + #[cfg(feature = "restrictive")] + ensure!( + fields_iter.next().is_none(), + "Extra fields found for til type \"{}\"", + String::from_utf8_lossy(&name) + ); + Ok(Self { + name, + ordinal, + tinfo, + }) + } +} + +#[derive(Debug, Clone)] +pub(crate) struct TILTypeInfoRaw { + _flags: u32, + pub name: Vec, + pub ordinal: u64, + pub tinfo: TypeRaw, _cmt: Vec, _fieldcmts: Vec, + fields: Vec>, _sclass: u8, } -impl TILTypeInfo { +impl TILTypeInfoRaw { pub(crate) fn read( input: &mut impl IdaGenericBufUnpack, til: &TILSectionHeader, @@ -55,7 +98,8 @@ impl TILTypeInfo { input.read_raw_til_type(til.format)? }; let mut cursor = &data[..]; - let result = TILTypeInfo::read_inner(&mut cursor, til)?; + let result = Self::read_inner(&mut cursor, til)?; + #[cfg(feature = "restrictive")] ensure!( cursor.is_empty(), "Unable to parse til type fully, left {} bytes", @@ -74,40 +118,25 @@ impl TILTypeInfo { (0..=0x11, _) | (_, false) => cursor.read_u32()?.into(), (_, true) => cursor.read_u64()?, }; - let tinfo_raw = - TypeRaw::read(&mut *cursor, til).with_context(|| { - format!( - "parsing `TILTypeInfo::tiinfo` for type \"{}\"", - String::from_utf8_lossy(&name) - ) - })?; + let tinfo = TypeRaw::read(&mut *cursor, til).with_context(|| { + format!( + "parsing `TILTypeInfo::tiinfo` for type \"{}\"", + String::from_utf8_lossy(&name) + ) + })?; let _info = cursor.read_c_string_raw()?; let cmt = cursor.read_c_string_raw()?; let fields = cursor.read_c_string_vec()?; let fieldcmts = cursor.read_c_string_raw()?; let sclass: u8 = cursor.read_u8()?; - let mut fields_iter = fields.into_iter().map(|field| { - if field.is_empty() { - None - } else { - Some(field) - } - }); - let tinfo = Type::new(til, tinfo_raw, &mut fields_iter)?; - #[cfg(feature = "restrictive")] - ensure!( - fields_iter.next().is_none(), - "Extra fields found for til type \"{}\"", - String::from_utf8_lossy(&name) - ); - Ok(Self { _flags: flags, name, ordinal, tinfo, _cmt: cmt, + fields, _fieldcmts: fieldcmts, _sclass: sclass, }) @@ -127,49 +156,63 @@ pub enum TypeVariant { Pointer(Pointer), Function(Function), Array(Array), - Typedef(Typedef), + Typeref(Typeref), Struct(Struct), Union(Union), Enum(Enum), - StructRef(Typedef), - UnionRef(Typedef), - EnumRef(Typedef), Bitfield(Bitfield), } impl Type { pub(crate) fn new( til: &TILSectionHeader, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, tinfo_raw: TypeRaw, fields: &mut impl Iterator>>, ) -> Result { let type_variant = match tinfo_raw.variant { TypeVariantRaw::Basic(x) => TypeVariant::Basic(x), TypeVariantRaw::Bitfield(x) => TypeVariant::Bitfield(x), - TypeVariantRaw::Typedef(x) => TypeVariant::Typedef(x), + TypeVariantRaw::Typedef(x) => { + Typeref::new(type_by_name, type_by_ord, x) + .map(TypeVariant::Typeref)? + } TypeVariantRaw::Pointer(x) => { - Pointer::new(til, x, fields).map(TypeVariant::Pointer)? + Pointer::new(til, type_by_name, type_by_ord, x, fields) + .map(TypeVariant::Pointer)? } TypeVariantRaw::Function(x) => { - Function::new(til, x, fields).map(TypeVariant::Function)? + Function::new(til, type_by_name, type_by_ord, x, fields) + .map(TypeVariant::Function)? } TypeVariantRaw::Array(x) => { - Array::new(til, x, fields).map(TypeVariant::Array)? + Array::new(til, type_by_name, type_by_ord, x, fields) + .map(TypeVariant::Array)? } TypeVariantRaw::Struct(x) => { - Struct::new(til, x, fields).map(TypeVariant::Struct)? + Struct::new(til, type_by_name, type_by_ord, x, fields) + .map(TypeVariant::Struct)? } TypeVariantRaw::Union(x) => { - Union::new(til, x, fields).map(TypeVariant::Union)? + Union::new(til, type_by_name, type_by_ord, x, fields) + .map(TypeVariant::Union)? } TypeVariantRaw::Enum(x) => { Enum::new(til, x, fields).map(TypeVariant::Enum)? } - TypeVariantRaw::StructRef(typedef) => { - TypeVariant::StructRef(typedef) + TypeVariantRaw::StructRef(x) => { + Typeref::new_struct(type_by_name, type_by_ord, x) + .map(TypeVariant::Typeref)? + } + TypeVariantRaw::UnionRef(x) => { + Typeref::new_union(type_by_name, type_by_ord, x) + .map(TypeVariant::Typeref)? + } + TypeVariantRaw::EnumRef(x) => { + Typeref::new_enum(type_by_name, type_by_ord, x) + .map(TypeVariant::Typeref)? } - TypeVariantRaw::UnionRef(typedef) => TypeVariant::UnionRef(typedef), - TypeVariantRaw::EnumRef(typedef) => TypeVariant::EnumRef(typedef), }; Ok(Self { is_const: tinfo_raw.is_const, @@ -190,14 +233,18 @@ impl Type { flags: section::TILSectionFlags(0), description: Vec::new(), dependencies: Vec::new(), - compiler_id: 0, - cm: 0, size_enum: None, size_int: 4.try_into().unwrap(), size_bool: 1.try_into().unwrap(), def_align: None, size_long_double: None, extended_sizeof_info: None, + cc: None, + cn: None, + type_ordinal_alias: None, + is_universal: true, + compiler_id: crate::id0::Compiler::Unknown, + cm: None, }; let mut reader = data; let type_raw = TypeRaw::read(&mut reader, &header)?; @@ -221,7 +268,13 @@ impl Type { Some(field) } }); - let result = Self::new(&header, type_raw, &mut fields_iter)?; + let result = Self::new( + &header, + &HashMap::new(), + &HashMap::new(), + type_raw, + &mut fields_iter, + )?; #[cfg(feature = "restrictive")] ensure!( fields_iter.next().is_none(), @@ -244,13 +297,13 @@ pub(crate) enum TypeVariantRaw { Pointer(PointerRaw), Function(FunctionRaw), Array(ArrayRaw), - Typedef(Typedef), + Typedef(TypedefRaw), Struct(StructRaw), Union(UnionRaw), Enum(EnumRaw), - StructRef(Typedef), - UnionRef(Typedef), - EnumRef(Typedef), + StructRef(TypedefRaw), + UnionRef(TypedefRaw), + EnumRef(TypedefRaw), Bitfield(Bitfield), } @@ -304,7 +357,7 @@ impl TypeRaw { // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x480369 (flag::tf_complex::BT_COMPLEX, flag::tf_complex::BTMT_TYPEDEF) => { - Typedef::read(input) + TypedefRaw::read(input) .context("Type::Typedef") .map(TypeVariantRaw::Typedef)? } @@ -357,9 +410,8 @@ impl TypeRaw { let mut bytes = &bytes[..]; let result = TypeRaw::read(&mut bytes, header)?; - if !bytes.is_empty() { - return Err(anyhow!("Unable to fully parser Type ref")); - } + #[cfg(feature = "restrictive")] + ensure!(bytes.is_empty(), "Unable to fully parser Type ref"); Ok(result) } } @@ -509,13 +561,12 @@ impl Basic { } #[derive(Clone, Debug)] -pub enum Typedef { - // TODO make this a `Id0TilOrd` +pub enum TypedefRaw { Ordinal(u32), Name(Option>), } -impl Typedef { +impl TypedefRaw { fn read(input: &mut impl IdaGenericUnpack) -> Result { let buf = input.unpack_dt_bytes()?; match &buf[..] { @@ -527,12 +578,106 @@ impl Typedef { "Typedef Ordinal with more data then expected" )); } - Ok(Typedef::Ordinal(de)) + Ok(Self::Ordinal(de)) + } + _ => Ok(Self::Name(if buf.is_empty() { None } else { Some(buf) })), + } + } +} + +#[derive(Clone, Debug)] +pub enum Typeref { + Ref(usize), + UnresolvedName { + name: Option>, + ref_type: Option, + }, + UnresolvedOrd { + ord: u32, + ref_type: Option, + }, +} + +#[derive(Clone, Copy, Debug, PartialEq, Eq)] +pub enum TyperefType { + Struct, + Union, + Enum, +} + +impl Typeref { + pub(crate) fn new( + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, + tyref: TypedefRaw, + ) -> Result { + let pos = match tyref { + // TODO check is ord is set on the header + TypedefRaw::Ordinal(ord) => { + let Some(pos) = type_by_ord.get(&(ord.into())) else { + return Ok(Self::UnresolvedOrd { + ord, + ref_type: None, + }); + }; + pos } - _ => { - Ok(Typedef::Name(if buf.is_empty() { None } else { Some(buf) })) + TypedefRaw::Name(None) => { + return Ok(Self::UnresolvedName { + name: None, + ref_type: None, + }) + } + TypedefRaw::Name(Some(name)) => { + let Some(pos) = type_by_name.get(&name[..]) else { + return Ok(Self::UnresolvedName { + name: Some(name), + ref_type: None, + }); + }; + pos } + }; + Ok(Self::Ref(*pos)) + } + + fn new_struct( + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, + x: TypedefRaw, + ) -> Result { + let mut result = Self::new(type_by_name, type_by_ord, x)?; + if let Typeref::UnresolvedName { name: _, ref_type } = &mut result { + *ref_type = Some(TyperefType::Struct) + } + // TODO check the inner type is in fact a struct + Ok(result) + } + + fn new_union( + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, + x: TypedefRaw, + ) -> Result { + let mut result = Self::new(type_by_name, type_by_ord, x)?; + if let Typeref::UnresolvedName { name: _, ref_type } = &mut result { + *ref_type = Some(TyperefType::Union) + } + // TODO check the inner type is in fact a union + Ok(result) + } + + fn new_enum( + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, + x: TypedefRaw, + ) -> Result { + let mut result = Self::new(type_by_name, type_by_ord, x)?; + if let Typeref::UnresolvedName { name: _, ref_type } = &mut result { + *ref_type = Some(TyperefType::Enum) } + // TODO check the inner type is in fact a enum + Ok(result) } } diff --git a/src/til/array.rs b/src/til/array.rs index 57bebd4..2c31434 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -1,9 +1,11 @@ +use std::collections::HashMap; use std::num::{NonZeroU16, NonZeroU8}; use crate::ida_reader::IdaGenericBufUnpack; -use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeAttribute, TypeRaw}; +use super::section::TILSectionHeader; + #[derive(Clone, Debug)] pub struct Array { pub alignment: Option, @@ -14,6 +16,8 @@ pub struct Array { impl Array { pub(crate) fn new( til: &TILSectionHeader, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, value: ArrayRaw, fields: &mut impl Iterator>>, ) -> anyhow::Result { @@ -21,8 +25,14 @@ impl Array { alignment: value.alignment, base: value.base, nelem: value.nelem, - elem_type: Type::new(til, *value.elem_type, fields) - .map(Box::new)?, + elem_type: Type::new( + til, + type_by_name, + type_by_ord, + *value.elem_type, + fields, + ) + .map(Box::new)?, }) } } diff --git a/src/til/enum.rs b/src/til/enum.rs index 4e7fd0c..e864212 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -1,10 +1,11 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; -use crate::til::section::TILSectionHeader; use crate::til::{flag, TypeAttribute, TypeRaw, TypeVariantRaw}; use anyhow::{anyhow, ensure}; +use super::section::TILSectionHeader; + #[derive(Clone, Debug)] pub struct Enum { pub is_signed: bool, diff --git a/src/til/function.rs b/src/til/function.rs index 7fe76ec..e0a21b2 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -1,10 +1,11 @@ +use std::collections::HashMap; use std::num::NonZeroU8; use crate::ida_reader::{IdaGenericBufUnpack, IdaGenericUnpack}; -use crate::til::section::TILSectionHeader; use crate::til::{Basic, Type, TypeRaw}; use anyhow::{anyhow, ensure, Context, Result}; +use super::section::TILSectionHeader; use super::TypeVariantRaw; #[derive(Debug, Clone)] @@ -28,14 +29,28 @@ pub struct Function { impl Function { pub(crate) fn new( til: &TILSectionHeader, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, value: FunctionRaw, fields: &mut impl Iterator>>, ) -> Result { - let ret = Type::new(til, *value.ret, &mut *fields)?; + let ret = Type::new( + til, + type_by_name, + type_by_ord, + *value.ret, + &mut *fields, + )?; let mut args = Vec::with_capacity(value.args.len()); for (arg_type, arg_loc) in value.args { let field_name = fields.next().flatten(); - let new_member = Type::new(til, arg_type, &mut *fields)?; + let new_member = Type::new( + til, + type_by_name, + type_by_ord, + arg_type, + &mut *fields, + )?; args.push((field_name, new_member, arg_loc)); } Ok(Self { diff --git a/src/til/pointer.rs b/src/til/pointer.rs index 4d69122..8b52c44 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -1,9 +1,12 @@ +use std::collections::HashMap; + use anyhow::Result; use crate::ida_reader::IdaGenericBufUnpack; -use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeAttribute, TypeRaw}; +use super::section::TILSectionHeader; + #[derive(Debug, Clone)] pub struct Pointer { pub closure: PointerType, @@ -15,6 +18,8 @@ pub struct Pointer { impl Pointer { pub(crate) fn new( til: &TILSectionHeader, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, raw: PointerRaw, fields: &mut impl Iterator>>, ) -> Result { @@ -23,16 +28,28 @@ impl Pointer { .map(|(t, v)| -> Result<_> { Ok(( // TODO if this type allow non typedef, this may consume fields - Type::new(til, *t, &mut vec![].into_iter()) - .map(Box::new)?, + Type::new( + til, + type_by_name, + type_by_ord, + *t, + &mut vec![].into_iter(), + ) + .map(Box::new)?, v, )) }) .transpose()?; - let typ = Type::new(til, *raw.typ, fields).map(Box::new)?; + let typ = Type::new(til, type_by_name, type_by_ord, *raw.typ, fields) + .map(Box::new)?; Ok(Self { // TODO forward fields to closure? - closure: PointerType::new(til, raw.closure)?, + closure: PointerType::new( + til, + type_by_name, + type_by_ord, + raw.closure, + )?, modifier: raw.modifier, shifted, typ, @@ -50,12 +67,17 @@ pub enum PointerType { } impl PointerType { - fn new(til: &TILSectionHeader, raw: PointerTypeRaw) -> Result { + fn new( + til: &TILSectionHeader, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, + raw: PointerTypeRaw, + ) -> Result { match raw { PointerTypeRaw::Closure(c) => { // TODO subtype get the fields? let mut sub_fields = vec![].into_iter(); - Type::new(til, *c, &mut sub_fields) + Type::new(til, type_by_name, type_by_ord, *c, &mut sub_fields) .map(Box::new) .map(Self::Closure) } diff --git a/src/til/section.rs b/src/til/section.rs index 2383c9d..2239c62 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -1,6 +1,6 @@ use crate::id0::{Compiler, Id0TilOrd}; use crate::ida_reader::{IdaGenericBufUnpack, IdaGenericUnpack}; -use crate::til::{flag, TILMacro, TILTypeInfo}; +use crate::til::{flag, TILMacro, TILTypeInfo, TILTypeInfoRaw}; use crate::IDBSectionCompression; use anyhow::{anyhow, ensure, Result}; use serde::{Deserialize, Serialize}; @@ -16,6 +16,22 @@ pub const TIL_SECTION_MAGIC: &[u8; 6] = b"IDATIL"; #[derive(Debug, Clone)] pub struct TILSection { + pub header: TILSectionHeader, + pub symbols: Vec, + pub types: Vec, + pub macros: Option>, +} + +#[derive(Debug, Clone)] +pub(crate) struct TILSectionRaw { + pub header: TILSectionHeader, + pub symbols: Vec, + pub types: Vec, + pub macros: Option>, +} + +#[derive(Debug, Clone)] +pub struct TILSectionHeader { pub format: u32, /// short file name (without path and extension) pub description: Vec, @@ -34,16 +50,13 @@ pub struct TILSection { //pub cc: CallingConvention, //pub cm: CCPtrSize, pub def_align: Option, - pub symbols: Vec, // TODO create a struct for ordinal aliases pub type_ordinal_alias: Option>, - pub types: Vec, pub size_int: NonZeroU8, pub size_bool: NonZeroU8, pub size_enum: Option, pub extended_sizeof_info: Option, pub size_long_double: Option, - pub macros: Option>, pub is_universal: bool, } @@ -55,7 +68,7 @@ pub struct TILSectionExtendedSizeofInfo { } #[derive(Debug, Clone)] -pub struct TILSectionHeader { +pub struct TILSectionHeaderRaw { pub format: u32, pub flags: TILSectionFlags, pub description: Vec, @@ -87,11 +100,7 @@ pub struct TILSectionHeader2 { pub def_align: u8, } -impl TILSection { - pub fn parse(mut input: impl IdaGenericBufUnpack) -> Result { - Self::read_inner(&mut input) - } - +impl TILSectionRaw { pub(crate) fn read( input: &mut impl IdaGenericBufUnpack, compress: IDBSectionCompression, @@ -107,38 +116,21 @@ impl TILSection { } fn read_inner(input: &mut impl IdaGenericBufUnpack) -> Result { - let header = Self::read_header(&mut *input)?; - let symbols = Self::read_bucket(&mut *input, &header, None, None)?; - - // TODO create an ordinal -> type mapping, to make sure the ordinals are not duplicated - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x42e292 - let (next_ordinal, type_ordinal_alias) = - Self::read_next_ordinal_and_alias(&mut *input, &header)?; - let types = Self::read_bucket( - &mut *input, - &header, - next_ordinal, - type_ordinal_alias.as_deref(), - )?; - let macros = header - .flags - .has_macro_table() - .then(|| Self::read_macros(&mut *input, &header)) - .transpose()?; + let header_raw = Self::read_header(&mut *input)?; // TODO verify that is always false? - let _mod = header.flags.is_mod(); - let _uni = header.flags.is_universal(); - let _ord = header.flags.has_ordinal(); - let _ali = header.flags.has_type_aliases(); - let _stm = header.flags.has_extra_stream(); - - let cc = CallingConvention::from_cm_raw(header.cm)?; - let cn = CCPtrSize::from_cm_raw(header.cm, header.size_int); - let cm = CCModel::from_cm_raw(header.cm); - - let dependencies = if !header.dependencies.is_empty() { - header + let _mod = header_raw.flags.is_mod(); + let _uni = header_raw.flags.is_universal(); + let _ord = header_raw.flags.has_ordinal(); + let _ali = header_raw.flags.has_type_aliases(); + let _stm = header_raw.flags.has_extra_stream(); + + let cc = CallingConvention::from_cm_raw(header_raw.cm)?; + let cn = CCPtrSize::from_cm_raw(header_raw.cm, header_raw.size_int); + let cm = CCModel::from_cm_raw(header_raw.cm); + + let dependencies = if !header_raw.dependencies.is_empty() { + header_raw .dependencies .split(|x| *x == b',') .map(<[_]>::to_vec) @@ -146,27 +138,44 @@ impl TILSection { } else { vec![] }; - - Ok(TILSection { - format: header.format, - description: header.description, - flags: header.flags, + let mut header = TILSectionHeader { + format: header_raw.format, + description: header_raw.description, + flags: header_raw.flags, dependencies, - compiler_id: Compiler::from_value(header.compiler_id), + compiler_id: Compiler::from_value(header_raw.compiler_id), cc, cn, cm, - def_align: header.def_align, - size_long_double: header.size_long_double, - is_universal: header.flags.is_universal(), - size_bool: header.size_bool, - size_int: header.size_int, - size_enum: header.size_enum, - extended_sizeof_info: header.extended_sizeof_info, + def_align: header_raw.def_align, + size_long_double: header_raw.size_long_double, + is_universal: header_raw.flags.is_universal(), + size_bool: header_raw.size_bool, + size_int: header_raw.size_int, + size_enum: header_raw.size_enum, + extended_sizeof_info: header_raw.extended_sizeof_info, + type_ordinal_alias: None, + }; + + let symbols = Self::read_bucket(&mut *input, &header, None)?; + + // TODO create an ordinal -> type mapping, to make sure the ordinals are not duplicated + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x42e292 + let (next_ordinal, type_ordinal_alias) = + Self::read_next_ordinal_and_alias(&mut *input, &header)?; + header.type_ordinal_alias = type_ordinal_alias; + let types = Self::read_bucket(&mut *input, &header, next_ordinal)?; + let macros = header + .flags + .has_macro_table() + .then(|| Self::read_macros(&mut *input, &header)) + .transpose()?; + + Ok(Self { symbols, - type_ordinal_alias, types, macros, + header, }) } @@ -224,7 +233,7 @@ impl TILSection { fn read_header( input: &mut impl IdaGenericUnpack, - ) -> Result { + ) -> Result { // TODO this break a few files let signature: [u8; 6] = bincode::deserialize_from(&mut *input)?; ensure!(signature == *TIL_SECTION_MAGIC, "Invalid TIL Signature"); @@ -300,7 +309,7 @@ impl TILSection { let def_align = (header2.def_align != 0) .then(|| NonZeroU8::new(1 << (header2.def_align - 1)).unwrap()); - Ok(TILSectionHeader { + Ok(TILSectionHeaderRaw { format: header1.format, flags: header1.flags, description, @@ -317,6 +326,162 @@ impl TILSection { }) } + fn read_bucket_header( + input: &mut impl IdaGenericUnpack, + ) -> Result<(u32, u32)> { + let ndefs = bincode::deserialize_from(&mut *input)?; + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x42e3e0 + //ensure!(ndefs < 0x55555555); + let len = bincode::deserialize_from(&mut *input)?; + Ok((ndefs, len)) + } + + fn read_bucket_zip_header( + input: &mut impl IdaGenericUnpack, + ) -> Result<(u32, u32, u32)> { + let (ndefs, len) = Self::read_bucket_header(&mut *input)?; + let compressed_len = bincode::deserialize_from(&mut *input)?; + Ok((ndefs, len, compressed_len)) + } + + fn read_bucket( + input: &mut impl IdaGenericBufUnpack, + header: &TILSectionHeader, + next_ordinal: Option, + ) -> Result> { + if header.flags.is_zip() { + Self::read_bucket_zip(&mut *input, header, next_ordinal) + } else { + Self::read_bucket_normal(&mut *input, header, next_ordinal) + } + } + + fn read_bucket_normal( + input: &mut impl IdaGenericBufUnpack, + header: &TILSectionHeader, + next_ordinal: Option, + ) -> Result> { + let (ndefs, len) = Self::read_bucket_header(&mut *input)?; + Self::read_bucket_inner(&mut *input, header, ndefs, len, next_ordinal) + } + + fn read_bucket_zip( + input: &mut impl IdaGenericBufUnpack, + header: &TILSectionHeader, + next_ordinal: Option, + ) -> Result> { + let (ndefs, len, compressed_len) = + Self::read_bucket_zip_header(&mut *input)?; + // make sure the decompressor don't read out-of-bounds + let mut compressed_input = input.take(compressed_len.into()); + let mut inflate = BufReader::new(flate2::bufread::ZlibDecoder::new( + &mut compressed_input, + )); + // make sure only the defined size is decompressed + let type_info = Self::read_bucket_inner( + &mut inflate, + header, + ndefs, + len, + next_ordinal, + )?; + #[cfg(feature = "restrictive")] + ensure!( + compressed_input.limit() == 0, + "TypeBucket compressed data is smaller then expected" + ); + Ok(type_info) + } + + fn read_bucket_inner( + input: &mut impl IdaGenericBufUnpack, + header: &TILSectionHeader, + ndefs: u32, + len: u32, + next_ord: Option, + ) -> Result> { + if let Some(next_ord) = next_ord { + let alias: u32 = header + .type_ordinal_alias + .as_ref() + .map(|x| x.len()) + .unwrap_or(0) + .try_into() + .unwrap(); + // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x42e3e0 + ensure!(ndefs + alias + 1 <= next_ord); + } + let mut input = input.take(len.into()); + let type_info_raw: Vec<_> = (0..ndefs) + .map(|i| TILTypeInfoRaw::read(&mut input, header, i == ndefs - 1)) + .collect::>()?; + #[cfg(feature = "restrictive")] + ensure!( + input.limit() == 0, + "TypeBucket total data is smaller then expected" + ); + Ok(type_info_raw) + } + + fn read_macros( + input: &mut impl IdaGenericBufUnpack, + header: &TILSectionHeader, + ) -> Result> { + if header.flags.is_zip() { + Self::read_macros_zip(&mut *input) + } else { + Self::read_macros_normal(&mut *input) + } + } + + fn read_macros_normal( + input: &mut impl IdaGenericBufUnpack, + ) -> Result> { + let (ndefs, len) = Self::read_bucket_header(&mut *input)?; + let mut input = input.take(len.into()); + let type_info = (0..ndefs) + .map(|_| TILMacro::read(&mut input)) + .collect::>()?; + #[cfg(feature = "restrictive")] + ensure!( + input.limit() == 0, + "TypeBucket macro total data is smaller then expected" + ); + Ok(type_info) + } + + fn read_macros_zip( + input: &mut impl IdaGenericBufUnpack, + ) -> Result> { + let (ndefs, len, compressed_len) = + Self::read_bucket_zip_header(&mut *input)?; + // make sure the decompressor don't read out-of-bounds + let mut compressed_input = input.take(compressed_len.into()); + let inflate = BufReader::new(flate2::bufread::ZlibDecoder::new( + &mut compressed_input, + )); + // make sure only the defined size is decompressed + let mut decompressed_input = inflate.take(len.into()); + let type_info = (0..ndefs.try_into().unwrap()) + .map(|_| TILMacro::read(&mut decompressed_input)) + .collect::, _>>()?; + // make sure the input was fully consumed + #[cfg(feature = "restrictive")] + ensure!( + decompressed_input.limit() == 0, + "TypeBucket macros data is smaller then expected" + ); + #[cfg(feature = "restrictive")] + ensure!( + compressed_input.limit() == 0, + "TypeBucket macros compressed data is smaller then expected" + ); + Ok(type_info) + } + // TODO replace usize with a IDTypeIdx type +} + +impl TILSection { pub fn decompress( input: &mut impl IdaGenericBufUnpack, output: &mut impl Write, @@ -338,7 +503,7 @@ impl TILSection { input: &mut impl IdaGenericBufUnpack, output: &mut impl Write, ) -> Result<()> { - let mut header = Self::read_header(&mut *input)?; + let mut header = TILSectionRaw::read_header(&mut *input)?; let og_flags = header.flags; // disable the zip flag header.flags.set_zip(false); @@ -419,7 +584,32 @@ impl TILSection { Ok(()) } - // TODO replace usize with a IDTypeIdx type + #[allow(dead_code)] + fn decompress_bucket( + input: &mut impl IdaGenericBufUnpack, + output: &mut impl std::io::Write, + ) -> Result<()> { + let (ndefs, len, compressed_len) = + TILSectionRaw::read_bucket_zip_header(&mut *input)?; + bincode::serialize_into(&mut *output, &TILBucketRaw { len, ndefs })?; + // write the decompressed data + let mut compressed_input = input.take(compressed_len.into()); + let inflate = flate2::bufread::ZlibDecoder::new(&mut compressed_input); + let mut decompressed_input = inflate.take(len.into()); + std::io::copy(&mut decompressed_input, output)?; + #[cfg(feature = "restrictive")] + ensure!( + decompressed_input.limit() == 0, + "TypeBucket data is smaller then expected" + ); + #[cfg(feature = "restrictive")] + ensure!( + compressed_input.limit() == 0, + "TypeBucket compressed data is smaller then expected" + ); + Ok(()) + } + pub fn get_type_by_idx(&self, idx: usize) -> &TILTypeInfo { &self.types[idx] } @@ -434,7 +624,7 @@ impl TILSection { pub fn get_ord_idx(&self, id0_ord: Id0TilOrd) -> Option { // first search the ordinal alias - if let Some(ordinals) = &self.type_ordinal_alias { + if let Some(ordinals) = &self.header.type_ordinal_alias { // it's unclear what is the first value if let Some((_src, dst)) = ordinals .iter() @@ -452,21 +642,24 @@ impl TILSection { } pub fn sizeof_short(&self) -> NonZeroU8 { - self.extended_sizeof_info + self.header + .extended_sizeof_info .as_ref() .map(|x| x.size_short) .unwrap_or(2.try_into().unwrap()) } pub fn sizeof_long(&self) -> NonZeroU8 { - self.extended_sizeof_info + self.header + .extended_sizeof_info .as_ref() .map(|x| x.size_long) .unwrap_or(4.try_into().unwrap()) } pub fn sizeof_long_long(&self) -> NonZeroU8 { - self.extended_sizeof_info + self.header + .extended_sizeof_info .as_ref() .map(|x| x.size_long_long) .unwrap_or(8.try_into().unwrap()) @@ -474,12 +667,72 @@ impl TILSection { // TODO check this impl in InnerRef pub fn addr_size(&self) -> NonZeroU8 { - self.cn + self.header + .cn .map(CCPtrSize::near_bytes) .unwrap_or(NonZeroU8::new(4).unwrap()) } } +impl TILSection { + pub fn read( + input: &mut impl IdaGenericBufUnpack, + compress: IDBSectionCompression, + ) -> Result { + let type_info_raw = TILSectionRaw::read(input, compress)?; + // TODO check for dups? + let type_by_name = type_info_raw + .types + .iter() + .enumerate() + .map(|(i, til)| (til.name.to_vec(), i)) + .collect(); + let type_by_ord = type_info_raw + .types + .iter() + .enumerate() + .map(|(i, til)| (til.ordinal, i)) + .collect(); + let symbols = type_info_raw + .symbols + .into_iter() + .map(|ty| { + TILTypeInfo::new( + &type_info_raw.header, + &type_by_name, + &type_by_ord, + ty.name, + ty.ordinal, + ty.tinfo, + ty.fields, + ) + }) + .collect::>()?; + let types = type_info_raw + .types + .into_iter() + .map(|ty| { + TILTypeInfo::new( + &type_info_raw.header, + &type_by_name, + &type_by_ord, + ty.name, + ty.ordinal, + ty.tinfo, + ty.fields, + ) + }) + .collect::>()?; + + Ok(Self { + header: type_info_raw.header, + symbols, + types, + macros: type_info_raw.macros, + }) + } +} + // TODO remove deserialize and implement a verification if the value is correct #[derive(Clone, Copy, Debug, Deserialize, Serialize)] pub struct TILSectionFlags(pub(crate) u16); @@ -545,204 +798,3 @@ pub(crate) struct TILBucketRaw { ndefs: u32, len: u32, } - -impl TILSection { - fn read_bucket_header( - input: &mut impl IdaGenericUnpack, - ) -> Result<(u32, u32)> { - let ndefs = bincode::deserialize_from(&mut *input)?; - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x42e3e0 - //ensure!(ndefs < 0x55555555); - let len = bincode::deserialize_from(&mut *input)?; - Ok((ndefs, len)) - } - - fn read_bucket_zip_header( - input: &mut impl IdaGenericUnpack, - ) -> Result<(u32, u32, u32)> { - let (ndefs, len) = Self::read_bucket_header(&mut *input)?; - let compressed_len = bincode::deserialize_from(&mut *input)?; - Ok((ndefs, len, compressed_len)) - } - - fn read_bucket( - input: &mut impl IdaGenericBufUnpack, - header: &TILSectionHeader, - next_ordinal: Option, - ordinal_alias: Option<&[(u32, u32)]>, - ) -> Result> { - if header.flags.is_zip() { - Self::read_bucket_zip( - &mut *input, - header, - next_ordinal, - ordinal_alias, - ) - } else { - Self::read_bucket_normal( - &mut *input, - header, - next_ordinal, - ordinal_alias, - ) - } - } - - fn read_bucket_normal( - input: &mut impl IdaGenericBufUnpack, - header: &TILSectionHeader, - next_ordinal: Option, - ordinal_alias: Option<&[(u32, u32)]>, - ) -> Result> { - let (ndefs, len) = Self::read_bucket_header(&mut *input)?; - Self::read_bucket_inner( - &mut *input, - header, - ndefs, - len, - next_ordinal, - ordinal_alias, - ) - } - - fn read_bucket_zip( - input: &mut impl IdaGenericBufUnpack, - header: &TILSectionHeader, - next_ordinal: Option, - ordinal_alias: Option<&[(u32, u32)]>, - ) -> Result> { - let (ndefs, len, compressed_len) = - Self::read_bucket_zip_header(&mut *input)?; - // make sure the decompressor don't read out-of-bounds - let mut compressed_input = input.take(compressed_len.into()); - let mut inflate = BufReader::new(flate2::bufread::ZlibDecoder::new( - &mut compressed_input, - )); - // make sure only the defined size is decompressed - let type_info = Self::read_bucket_inner( - &mut inflate, - header, - ndefs, - len, - next_ordinal, - ordinal_alias, - )?; - #[cfg(feature = "restrictive")] - ensure!( - compressed_input.limit() == 0, - "TypeBucket compressed data is smaller then expected" - ); - Ok(type_info) - } - - fn read_bucket_inner( - input: &mut impl IdaGenericBufUnpack, - header: &TILSectionHeader, - ndefs: u32, - len: u32, - next_ord: Option, - ordinal_alias: Option<&[(u32, u32)]>, - ) -> Result> { - if let Some(next_ord) = next_ord { - let alias: u32 = ordinal_alias - .map(|x| x.len()) - .unwrap_or(0) - .try_into() - .unwrap(); - // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x42e3e0 - ensure!(ndefs + alias + 1 <= next_ord); - } - let mut input = input.take(len.into()); - let type_info = (0..ndefs) - .map(|i| TILTypeInfo::read(&mut input, header, i == ndefs - 1)) - .collect::>()?; - #[cfg(feature = "restrictive")] - ensure!( - input.limit() == 0, - "TypeBucket total data is smaller then expected" - ); - Ok(type_info) - } - - fn read_macros( - input: &mut impl IdaGenericBufUnpack, - header: &TILSectionHeader, - ) -> Result> { - if header.flags.is_zip() { - Self::read_macros_zip(&mut *input) - } else { - Self::read_macros_normal(&mut *input) - } - } - - fn read_macros_normal( - input: &mut impl IdaGenericBufUnpack, - ) -> Result> { - let (ndefs, len) = Self::read_bucket_header(&mut *input)?; - let mut input = input.take(len.into()); - let type_info = (0..ndefs) - .map(|_| TILMacro::read(&mut input)) - .collect::>()?; - #[cfg(feature = "restrictive")] - ensure!( - input.limit() == 0, - "TypeBucket macro total data is smaller then expected" - ); - Ok(type_info) - } - - fn read_macros_zip( - input: &mut impl IdaGenericBufUnpack, - ) -> Result> { - let (ndefs, len, compressed_len) = - Self::read_bucket_zip_header(&mut *input)?; - // make sure the decompressor don't read out-of-bounds - let mut compressed_input = input.take(compressed_len.into()); - let inflate = BufReader::new(flate2::bufread::ZlibDecoder::new( - &mut compressed_input, - )); - // make sure only the defined size is decompressed - let mut decompressed_input = inflate.take(len.into()); - let type_info = (0..ndefs.try_into().unwrap()) - .map(|_| TILMacro::read(&mut decompressed_input)) - .collect::, _>>()?; - // make sure the input was fully consumed - #[cfg(feature = "restrictive")] - ensure!( - decompressed_input.limit() == 0, - "TypeBucket macros data is smaller then expected" - ); - #[cfg(feature = "restrictive")] - ensure!( - compressed_input.limit() == 0, - "TypeBucket macros compressed data is smaller then expected" - ); - Ok(type_info) - } - - #[allow(dead_code)] - fn decompress_bucket( - input: &mut impl IdaGenericBufUnpack, - output: &mut impl std::io::Write, - ) -> Result<()> { - let (ndefs, len, compressed_len) = - Self::read_bucket_zip_header(&mut *input)?; - bincode::serialize_into(&mut *output, &TILBucketRaw { len, ndefs })?; - // write the decompressed data - let mut compressed_input = input.take(compressed_len.into()); - let inflate = flate2::bufread::ZlibDecoder::new(&mut compressed_input); - let mut decompressed_input = inflate.take(len.into()); - std::io::copy(&mut decompressed_input, output)?; - #[cfg(feature = "restrictive")] - ensure!( - decompressed_input.limit() == 0, - "TypeBucket data is smaller then expected" - ); - #[cfg(feature = "restrictive")] - ensure!( - compressed_input.limit() == 0, - "TypeBucket compressed data is smaller then expected" - ); - Ok(()) - } -} diff --git a/src/til/size_calculator.rs b/src/til/size_calculator.rs index c809d9b..32334e2 100644 --- a/src/til/size_calculator.rs +++ b/src/til/size_calculator.rs @@ -7,7 +7,7 @@ use super::r#enum::Enum; use super::r#struct::StructMember; use super::section::TILSection; use super::union::Union; -use super::{Basic, Type, TypeVariant, Typedef}; +use super::{Basic, Type, TypeVariant, Typeref}; pub struct TILTypeSizeSolver<'a> { section: &'a TILSection, @@ -63,13 +63,13 @@ impl<'a> TILTypeSizeSolver<'a> { TypeVariant::Basic(Basic::Void) => 0, TypeVariant::Basic(Basic::Unknown { bytes }) => (*bytes).into(), TypeVariant::Basic(Basic::Bool) => { - self.section.size_bool.get().into() + self.section.header.size_bool.get().into() } TypeVariant::Basic(Basic::Short { .. }) => { self.section.sizeof_short().get().into() } TypeVariant::Basic(Basic::Int { .. }) => { - self.section.size_int.get().into() + self.section.header.size_int.get().into() } TypeVariant::Basic(Basic::Long { .. }) => { self.section.sizeof_long().get().into() @@ -86,6 +86,7 @@ impl<'a> TILTypeSizeSolver<'a> { // TODO what's the long double default size if it's not defined? TypeVariant::Basic(Basic::LongDouble) => self .section + .header .size_long_double .map(|x| x.get()) .unwrap_or(8) @@ -100,10 +101,7 @@ impl<'a> TILTypeSizeSolver<'a> { let nelem = array.nelem.map(|x| x.get()).unwrap_or(0) as u64; element_len * nelem } - TypeVariant::StructRef(ref_type) - | TypeVariant::UnionRef(ref_type) - | TypeVariant::EnumRef(ref_type) - | TypeVariant::Typedef(ref_type) => self.solve_typedef(ref_type)?, + TypeVariant::Typeref(ref_type) => self.solve_typedef(ref_type)?, TypeVariant::Struct(til_struct) => { let mut sum = 0u64; // TODO default alignment, seems like default alignemnt is the field size @@ -166,7 +164,7 @@ impl<'a> TILTypeSizeSolver<'a> { max } TypeVariant::Enum(Enum { storage_size, .. }) => storage_size - .or(self.section.size_enum) + .or(self.section.header.size_enum) .map(|x| x.get()) .unwrap_or(4) .into(), @@ -174,28 +172,22 @@ impl<'a> TILTypeSizeSolver<'a> { }) } - fn solve_typedef(&mut self, typedef: &Typedef) -> Option { - let idx = match typedef { - Typedef::Name(name) => { - // NOTE missing names may indicate a external type, just return no size - self.section.get_name_idx(name.as_ref()?)? - } - Typedef::Ordinal(ord) => self - .section - .get_ord_idx(crate::id0::Id0TilOrd { ord: (*ord).into() })?, + fn solve_typedef(&mut self, typedef: &Typeref) -> Option { + let Typeref::Ref(idx) = typedef else { + return None; }; // if cached return it - if let Some(solved) = self.cached(idx) { + if let Some(solved) = self.cached(*idx) { return Some(solved); } - if !self.solving.insert(idx) { + if !self.solving.insert(*idx) { return None; } - let inner_type = self.section.get_type_by_idx(idx); + let inner_type = self.section.get_type_by_idx(*idx); let result = self.inner_type_size_bytes(&inner_type.tinfo); self.solving.remove(&idx); if let Some(result) = result { - assert!(self.solved.insert(idx, result).is_none()); + assert!(self.solved.insert(*idx, result).is_none()); } result } @@ -210,29 +202,13 @@ impl<'a> TILTypeSizeSolver<'a> { let size = self.inner_type_size_bytes(&array.elem_type); self.alignemnt(&array.elem_type, size.unwrap_or(1)) } - TypeVariant::EnumRef(ty) => { - let ty = match ty { - Typedef::Ordinal(ord) => self - .section - .get_ord(crate::id0::Id0TilOrd { ord: (*ord).into() }), - Typedef::Name(Some(name)) => self.section.get_name(name), - Typedef::Name(None) => None, - }; - ty.and_then(|ty| self.inner_type_size_bytes(&ty.tinfo)) - } - TypeVariant::Typedef(ty) => { - let ty = match ty { - Typedef::Ordinal(ord) => self - .section - .get_ord(crate::id0::Id0TilOrd { ord: (*ord).into() }), - Typedef::Name(Some(name)) => self.section.get_name(name), - Typedef::Name(None) => None, + TypeVariant::Typeref(ty) => { + let Typeref::Ref(idx) = ty else { + return None; }; - ty.and_then(|ty| { - let size = - self.inner_type_size_bytes(&ty.tinfo).unwrap_or(1); - self.alignemnt(&ty.tinfo, size) - }) + let ty = &self.section.types[*idx].tinfo; + let size = self.inner_type_size_bytes(ty).unwrap_or(1); + self.alignemnt(ty, size) } _ => None, } diff --git a/src/til/struct.rs b/src/til/struct.rs index 9139998..a96ce81 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -1,11 +1,12 @@ +use std::collections::HashMap; use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; -use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeRaw}; use anyhow::{anyhow, ensure, Context, Result}; use num_enum::{FromPrimitive, IntoPrimitive, TryFromPrimitive}; +use super::section::TILSectionHeader; use super::{TypeAttribute, TypeVariantRaw}; #[derive(Clone, Debug)] @@ -28,6 +29,8 @@ pub struct Struct { impl Struct { pub(crate) fn new( til: &TILSectionHeader, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, value: StructRaw, fields: &mut impl Iterator>>, ) -> Result { @@ -38,6 +41,8 @@ impl Struct { StructMember::new( til, fields.next().flatten(), + type_by_name, + type_by_ord, member, &mut *fields, ) @@ -195,12 +200,20 @@ impl StructMember { fn new( til: &TILSectionHeader, name: Option>, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, m: StructMemberRaw, fields: &mut impl Iterator>>, ) -> Result { Ok(Self { name, - member_type: Type::new(til, m.ty, fields)?, + member_type: Type::new( + til, + type_by_name, + type_by_ord, + m.ty, + fields, + )?, att: m.att, alignment: m.alignment, is_baseclass: m.is_baseclass, diff --git a/src/til/union.rs b/src/til/union.rs index 54485d5..404d468 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -1,11 +1,12 @@ use anyhow::{anyhow, Context, Result}; +use std::collections::HashMap; use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; -use crate::til::section::TILSectionHeader; use crate::til::{Type, TypeRaw}; +use super::section::TILSectionHeader; use super::{TypeAttribute, TypeVariantRaw}; #[derive(Clone, Debug)] @@ -20,6 +21,8 @@ pub struct Union { impl Union { pub(crate) fn new( til: &TILSectionHeader, + type_by_name: &HashMap, usize>, + type_by_ord: &HashMap, value: UnionRaw, fields: &mut impl Iterator>>, ) -> Result { @@ -28,7 +31,13 @@ impl Union { .into_iter() .map(|member| { let field_name = fields.next().flatten(); - let new_member = Type::new(til, member, &mut *fields)?; + let new_member = Type::new( + til, + type_by_name, + type_by_ord, + member, + &mut *fields, + )?; Ok((field_name, new_member)) }) .collect::>()?; diff --git a/src/tools/dump_til.rs b/src/tools/dump_til.rs index 9f2a374..4f93465 100644 --- a/src/tools/dump_til.rs +++ b/src/tools/dump_til.rs @@ -2,7 +2,7 @@ use std::fs::File; use std::io::BufReader; use anyhow::{anyhow, Result}; -use idb_rs::til::section::TILSection; +use idb_rs::til::section::{TILSection, TILSectionExtendedSizeofInfo}; use idb_rs::til::TILMacro; use idb_rs::IDBParser; @@ -20,37 +20,43 @@ pub fn dump_til(args: &Args) -> Result<()> { parser.read_til_section(til_offset)? } FileType::Til => { - let input = BufReader::new(File::open(&args.input)?); - idb_rs::til::section::TILSection::parse(input)? + let mut input = BufReader::new(File::open(&args.input)?); + idb_rs::til::section::TILSection::read( + &mut input, + idb_rs::IDBSectionCompression::None, + )? } }; // this deconstruction is to changes on TILSection to force a review on this code let TILSection { - format, - description: title, - flags: _, - dependencies: dependency, - compiler_id, - cc, - cm, - cn, - def_align, - type_ordinal_alias, - size_int, - size_enum, - size_bool, - extended_sizeof_info: _, - size_long_double, - is_universal, symbols, types, macros, + header: + idb_rs::til::section::TILSectionHeader { + flags: _, + format, + description, + dependencies, + compiler_id, + cc, + cn, + cm, + def_align, + type_ordinal_alias, + size_int, + size_bool, + size_enum, + extended_sizeof_info, + size_long_double, + is_universal, + }, } = &til; // write the header info println!("format: {format}"); - println!("title: {}", String::from_utf8_lossy(title)); - for (i, dependency) in dependency.iter().enumerate() { + println!("description: {}", String::from_utf8_lossy(description)); + for (i, dependency) in dependencies.iter().enumerate() { println!("dependency-{i}: {}", String::from_utf8_lossy(dependency)); } println!("id: {compiler_id:?}"); @@ -61,6 +67,16 @@ pub fn dump_til(args: &Args) -> Result<()> { println!("size_int: {size_int}"); println!("size_bool: {size_bool}"); println!("size_enum: {size_enum:?}"); + if let Some(TILSectionExtendedSizeofInfo { + size_short, + size_long, + size_long_long, + }) = extended_sizeof_info + { + println!("size_short: {size_short}"); + println!("size_long: {size_long}"); + println!("size_long_long: {size_long_long}"); + } println!("is_universal: {is_universal}"); if let Some(type_ordinal_numbers) = type_ordinal_alias { println!("type_ordinal_numbers: {type_ordinal_numbers:?}"); diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index ed3dd8b..3ced186 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -8,9 +8,10 @@ use idb_rs::til::r#struct::{Struct, StructMemberAtt}; use idb_rs::til::section::TILSection; use idb_rs::til::union::Union; use idb_rs::til::{ - Basic, TILTypeInfo, TILTypeSizeSolver, Type, TypeVariant, Typedef, + Basic, TILTypeInfo, TILTypeSizeSolver, Type, TypeVariant, Typeref, + TyperefType, }; -use idb_rs::IDBParser; +use idb_rs::{IDBParser, IDBSectionCompression}; use std::fs::File; use std::io::{BufReader, Result, Write}; @@ -20,10 +21,11 @@ use crate::{Args, FileType}; pub fn tilib_print(args: &Args) -> anyhow::Result<()> { // parse the id0 sector/file - let input = BufReader::new(File::open(&args.input)?); + let mut input = BufReader::new(File::open(&args.input)?); match args.input_type() { FileType::Til => { - let section = TILSection::parse(input)?; + let section = + TILSection::read(&mut input, IDBSectionCompression::None)?; print_til_section(std::io::stdout(), §ion)?; } FileType::Idb => { @@ -39,10 +41,10 @@ pub fn tilib_print(args: &Args) -> anyhow::Result<()> { } fn print_til_section(mut fmt: impl Write, section: &TILSection) -> Result<()> { - if !section.dependencies.is_empty() { + if !section.header.dependencies.is_empty() { // TODO open those files? What todo with then? write!(fmt, "Warning: ")?; - for dependency in §ion.dependencies { + for dependency in §ion.header.dependencies { fmt.write_all(dependency)?; writeln!(fmt, ": No such file or directory")?; } @@ -81,7 +83,7 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { // the description of the file // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b710 write!(fmt, "Description: ")?; - fmt.write_all(§ion.description)?; + fmt.write_all(§ion.header.description)?; writeln!(fmt)?; // flags from the section header @@ -105,12 +107,12 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { writeln!( fmt, "Compiler : {}", - compiler_id_to_str(section.compiler_id) + compiler_id_to_str(section.header.compiler_id) )?; // alignement and convention stuff // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b7ed - if let Some(cn) = section.cn { + if let Some(cn) = section.header.cn { write!( fmt, "sizeof(near*) = {} sizeof(far*) = {}", @@ -119,8 +121,8 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { )?; } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40ba3b - if let Some(cm) = section.cm { - if section.cn.is_some() { + if let Some(cm) = section.header.cm { + if section.header.cn.is_some() { write!(fmt, " ")?; } let code = if cm.is_code_near() { "near" } else { "far" }; @@ -128,8 +130,8 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { write!(fmt, "{code} code, {data} data",)?; } // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b860 - if let Some(cc) = section.cc { - if section.cm.is_some() || section.cn.is_some() { + if let Some(cc) = section.header.cc { + if section.header.cm.is_some() || section.header.cn.is_some() { write!(fmt, ", ")?; } write!(fmt, "{}", calling_convention_to_str(cc))?; @@ -141,22 +143,26 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { writeln!( fmt, "default_align = {} sizeof(bool) = {} sizeof(long) = {} sizeof(llong) = {}", - section.def_align.map(|x| x.get()).unwrap_or(0), - section.size_bool, + section.header.def_align.map(|x| x.get()).unwrap_or(0), + section.header.size_bool, section.sizeof_long(), section.sizeof_long_long(), )?; writeln!( fmt, "sizeof(enum) = {} sizeof(int) = {} sizeof(short) = {}", - section.size_enum.map(NonZeroU8::get).unwrap_or(0), - section.size_int, + section.header.size_enum.map(NonZeroU8::get).unwrap_or(0), + section.header.size_int, section.sizeof_short(), )?; writeln!( fmt, "sizeof(long double) = {}", - section.size_long_double.map(NonZeroU8::get).unwrap_or(0) + section + .header + .size_long_double + .map(NonZeroU8::get) + .unwrap_or(0) )?; Ok(()) } @@ -165,29 +171,30 @@ fn print_section_flags( fmt: &mut impl Write, section: &TILSection, ) -> Result<()> { - write!(fmt, "Flags : {:04X}", section.flags.as_raw())?; - if section.flags.is_zip() { + let flags = section.header.flags; + write!(fmt, "Flags : {:04X}", flags.as_raw())?; + if flags.is_zip() { write!(fmt, " compressed")?; } - if section.flags.has_macro_table() { + if flags.has_macro_table() { write!(fmt, " macro_table_present")?; } - if section.flags.have_extended_sizeof_info() { + if flags.have_extended_sizeof_info() { write!(fmt, " extended_sizeof_info")?; } - if section.flags.is_universal() { + if flags.is_universal() { write!(fmt, " universal")?; } - if section.flags.has_ordinal() { + if flags.has_ordinal() { write!(fmt, " ordinals_present")?; } - if section.flags.has_type_aliases() { + if flags.has_type_aliases() { write!(fmt, " aliases_present")?; } - if section.flags.has_extra_stream() { + if flags.has_extra_stream() { write!(fmt, " extra_streams")?; } - if section.flags.has_size_long_double() { + if flags.has_size_long_double() { write!(fmt, " sizeof_long_double")?; } writeln!(fmt) @@ -270,7 +277,7 @@ fn print_types( solver: &mut TILTypeSizeSolver<'_>, ) -> Result<()> { // TODO only print by ordinals if there are ordinals - if section.flags.has_ordinal() { + if section.header.flags.has_ordinal() { writeln!(fmt, "(enumerated by ordinals)")?; print_types_by_ordinals(fmt, section, solver)?; writeln!(fmt, "(enumerated by names)")?; @@ -295,6 +302,7 @@ fn print_types_by_ordinals( .map(|(idx, ty)| OrdType::Type { idx, ty }) .chain( section + .header .type_ordinal_alias .iter() .flat_map(|x| x.iter()) @@ -367,9 +375,10 @@ fn print_til_type_root( TypeVariant::Struct(_) | TypeVariant::Union(_) | TypeVariant::Enum(_) => {} - TypeVariant::StructRef(Typedef::Name(None)) - | TypeVariant::UnionRef(Typedef::Name(None)) - | TypeVariant::EnumRef(Typedef::Name(None)) => {} + TypeVariant::Typeref(Typeref::UnresolvedName { + name: _, + ref_type: Some(_), + }) => {} // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x443906 _ => write!(fmt, "typedef ")?, } @@ -412,26 +421,7 @@ fn print_til_type( print_pointer_space, print_type_prefix, ), - TypeVariant::Typedef(ref_type) => print_til_type_typedef( - fmt, section, name, til_type, ref_type, false, - ), - TypeVariant::UnionRef(ref_type) => print_til_type_complex_ref( - fmt, - section, - name, - til_type, - ref_type, - print_type_prefix, - ), - TypeVariant::EnumRef(ref_type) => print_til_type_complex_ref( - fmt, - section, - name, - til_type, - ref_type, - print_type_prefix, - ), - TypeVariant::StructRef(ref_type) => print_til_type_complex_ref( + TypeVariant::Typeref(ref_type) => print_til_type_typedef( fmt, section, name, @@ -573,7 +563,7 @@ fn print_til_type_function( write!(fmt, " ")?; } - let cc = match (section.cc, til_function.calling_convention) { + let cc = match (section.header.cc, til_function.calling_convention) { // don't print if using the til section default cc | (_, None) // if elipsis just print the '...' as last param @@ -647,7 +637,7 @@ fn print_til_type_array( til_type: &Type, til_array: &Array, print_pointer_space: bool, - print_type_prefix: bool, + _print_type_prefix: bool, ) -> Result<()> { if til_type.is_volatile { write!(fmt, "volatile ")?; @@ -662,7 +652,7 @@ fn print_til_type_array( &til_array.elem_type, false, print_pointer_space, - print_type_prefix, + false, true, )?; if let Some(name) = name { @@ -686,7 +676,7 @@ fn print_til_type_typedef( section: &TILSection, name: Option<&[u8]>, til_type: &Type, - typedef: &Typedef, + typedef: &Typeref, print_prefix: bool, ) -> Result<()> { if til_type.is_volatile { @@ -696,24 +686,31 @@ fn print_til_type_typedef( write!(fmt, "const ")?; } if print_prefix { - print_til_type_prefix(fmt, til_type, true)?; + print_til_type_prefix(fmt, section, til_type, true)?; } // get the type referenced by the typdef let need_space = match typedef { - idb_rs::til::Typedef::Ordinal(ord) => { - let inner_ty = section - .get_ord(idb_rs::id0::Id0TilOrd { ord: (*ord).into() }) - .unwrap(); + Typeref::Ref(idx) => { + let inner_ty = §ion.types[*idx]; fmt.write_all(&inner_ty.name)?; true } - idb_rs::til::Typedef::Name(Some(name)) => { - // NOTE don't need to get the inner type, we already have it's name + Typeref::UnresolvedName { + name: Some(name), + ref_type: _, + } => { fmt.write_all(name)?; true } // Nothing to print - idb_rs::til::Typedef::Name(None) => false, + Typeref::UnresolvedName { + name: None, + ref_type: _, + } + | Typeref::UnresolvedOrd { + ord: _, + ref_type: _, + } => false, }; // print the type name, if some if let Some(name) = name { @@ -725,34 +722,6 @@ fn print_til_type_typedef( Ok(()) } -fn print_til_type_complex_ref( - fmt: &mut impl Write, - section: &TILSection, - name: Option<&[u8]>, - til_type: &Type, - typedef: &Typedef, - print_prefix: bool, -) -> Result<()> { - if let idb_rs::til::Typedef::Name(None) = typedef { - if print_prefix { - print_til_type_prefix(fmt, til_type, true)?; - } - if let Some(name) = name { - fmt.write_all(name)?; - } - } else { - print_til_type_typedef( - fmt, - section, - name, - til_type, - typedef, - print_prefix, - )?; - } - Ok(()) -} - fn print_til_type_struct( fmt: &mut impl Write, section: &TILSection, @@ -892,12 +861,10 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - true, + false, print_name, ); }; - let qualified_parent_name: Vec<_> = - parent_name.iter().chain(b"::").copied().collect(); // TODO if the field is named, don't embeded it? if name.is_some() { @@ -908,7 +875,7 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - true, + false, print_name, ); } @@ -916,10 +883,7 @@ fn print_til_type_complex_member( // if typedef of complex ref, we may want to embed the definition inside the type // otherwise just print the type regularly let typedef = match &til.type_variant { - TypeVariant::EnumRef(typedef) - | TypeVariant::StructRef(typedef) - | TypeVariant::UnionRef(typedef) - | TypeVariant::Typedef(typedef) => typedef, + TypeVariant::Typeref(typedef) => typedef, _ => { return print_til_type( fmt, @@ -928,17 +892,32 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - true, + false, print_name, ); } }; let inner_type = match typedef { - Typedef::Ordinal(ord) => { - section.get_ord(Id0TilOrd { ord: (*ord).into() }).unwrap() + Typeref::Ref(idx) => §ion.types[*idx], + Typeref::UnresolvedName { + name: Some(name), + ref_type, + } => { + if let Some(ref_type) = ref_type { + print_typeref_type_prefix(fmt, *ref_type)?; + } + fmt.write_all(&name)?; + return Ok(()); } - Typedef::Name(None) => { + Typeref::UnresolvedOrd { + ord: _, + ref_type: _, + } + | Typeref::UnresolvedName { + name: None, + ref_type: _, + } => { return print_til_type( fmt, section, @@ -946,15 +925,16 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - true, + false, print_name, ); } - Typedef::Name(Some(name)) => section.get_name(name).unwrap(), }; // if the inner_type name is in the format `parent_name::something_else` then // we embed it + let qualified_parent_name: Vec<_> = + parent_name.iter().chain(b"::").copied().collect(); if !inner_type.name.starts_with(&qualified_parent_name) { return print_til_type( fmt, @@ -963,7 +943,7 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - true, + false, print_name, ); } @@ -1005,7 +985,7 @@ fn print_til_type_enum( || til_enum.is_signed || til_enum.is_unsigned { - let bytes = til_enum.storage_size.or(section.size_enum).unwrap(); + let bytes = til_enum.storage_size.or(section.header.size_enum).unwrap(); let signed = if til_enum.is_unsigned { "unsigned " } else { @@ -1204,17 +1184,27 @@ fn print_til_struct_member_basic_att( fn print_til_type_prefix( fmt: &mut impl Write, + section: &TILSection, tinfo: &Type, with_space: bool, ) -> Result<()> { match &tinfo.type_variant { - TypeVariant::UnionRef(_) | TypeVariant::Union(_) => { - write!(fmt, "union")? - } - TypeVariant::StructRef(_) | TypeVariant::Struct(_) => { - write!(fmt, "struct")? + TypeVariant::Typeref(Typeref::Ref(idx)) => { + // NOTE don't go other level down + match §ion.types[*idx].tinfo.type_variant { + TypeVariant::Union(_) => write!(fmt, "union")?, + TypeVariant::Struct(_) => write!(fmt, "struct")?, + TypeVariant::Enum(_) => write!(fmt, "enum")?, + _ => return Ok(()), + } } - TypeVariant::EnumRef(_) | TypeVariant::Enum(_) => write!(fmt, "enum")?, + TypeVariant::Typeref(Typeref::UnresolvedName { + name: _, + ref_type: Some(ref_type), + }) => print_typeref_type_prefix(fmt, *ref_type)?, + TypeVariant::Union(_) => write!(fmt, "union")?, + TypeVariant::Struct(_) => write!(fmt, "struct")?, + TypeVariant::Enum(_) => write!(fmt, "enum")?, _ => return Ok(()), } if with_space { @@ -1229,11 +1219,19 @@ fn print_til_type_only( tinfo: &Type, ) -> Result<()> { match &tinfo.type_variant { - TypeVariant::Typedef(Typedef::Name(Some(name))) => { + TypeVariant::Typeref(Typeref::UnresolvedName { + name: Some(name), + ref_type: _, + }) => { fmt.write_all(name)?; } - TypeVariant::Typedef(Typedef::Ordinal(ord)) => { - let ty = section.get_ord(Id0TilOrd { ord: (*ord).into() }).unwrap(); + TypeVariant::Typeref(Typeref::UnresolvedName { + name: None, + ref_type: _, + }) => {} + TypeVariant::Typeref(Typeref::Ref(idx)) => { + //TypeVariant::Typeref(Typeref::Ordinal(ord)) => { + let ty = §ion.types[*idx]; fmt.write_all(&ty.name)?; } _ => {} @@ -1313,6 +1311,7 @@ fn print_types_total(fmt: &mut impl Write, section: &TILSection) -> Result<()> { .map(|macros| macros.len()) .unwrap_or(0); let alias_num = section + .header .type_ordinal_alias .as_ref() .map(Vec::len) @@ -1331,16 +1330,11 @@ fn is_vft(section: &TILSection, typ: &Type) -> bool { //TypeVariant::Pointer(pointer) => todo!(), // TODO struct with only function-pointers is also vftable? TypeVariant::Struct(ty) => ty.is_vft, - TypeVariant::Typedef(typedef) | TypeVariant::StructRef(typedef) => { + TypeVariant::Typeref(typedef) => { let inner_type = match typedef { - Typedef::Ordinal(ord) => { - section.get_ord(Id0TilOrd { ord: (*ord).into() }) - } - Typedef::Name(None) => return false, - Typedef::Name(Some(name)) => section.get_name(name), - }; - let Some(inner_type) = inner_type else { - return false; + Typeref::Ref(idx) => §ion.types[*idx], + Typeref::UnresolvedOrd { .. } + | Typeref::UnresolvedName { .. } => return false, }; is_vft(section, &inner_type.tinfo) } @@ -1393,3 +1387,14 @@ fn print_basic_type(fmt: &mut impl Write, til_basic: &Basic) -> Result<()> { } Ok(()) } + +fn print_typeref_type_prefix( + fmt: &mut impl Write, + ref_type: TyperefType, +) -> Result<()> { + match ref_type { + idb_rs::til::TyperefType::Union => write!(fmt, "union"), + idb_rs::til::TyperefType::Struct => write!(fmt, "struct"), + idb_rs::til::TyperefType::Enum => write!(fmt, "enum"), + } +} From 1c5d29a6af1f15fedcfd3bb540dc09d273e6a1d0 Mon Sep 17 00:00:00 2001 From: rbran Date: Mon, 13 Jan 2025 17:50:32 -0300 Subject: [PATCH 51/53] add til typeref ref kind to all typerefs --- src/til.rs | 47 +++++++------- src/til/size_calculator.rs | 6 +- src/tools/tilib.rs | 122 +++++++++++++------------------------ 3 files changed, 68 insertions(+), 107 deletions(-) diff --git a/src/til.rs b/src/til.rs index e0abe7d..e1ded8c 100644 --- a/src/til.rs +++ b/src/til.rs @@ -586,16 +586,16 @@ impl TypedefRaw { } #[derive(Clone, Debug)] -pub enum Typeref { +pub struct Typeref { + pub ref_type: Option, + pub typeref_value: TyperefValue, +} + +#[derive(Clone, Debug)] +pub enum TyperefValue { Ref(usize), - UnresolvedName { - name: Option>, - ref_type: Option, - }, - UnresolvedOrd { - ord: u32, - ref_type: Option, - }, + UnsolvedName(Option>), + UnsolvedOrd(u32), } #[derive(Clone, Copy, Debug, PartialEq, Eq)] @@ -615,30 +615,33 @@ impl Typeref { // TODO check is ord is set on the header TypedefRaw::Ordinal(ord) => { let Some(pos) = type_by_ord.get(&(ord.into())) else { - return Ok(Self::UnresolvedOrd { - ord, + return Ok(Self { ref_type: None, + typeref_value: TyperefValue::UnsolvedOrd(ord), }); }; pos } TypedefRaw::Name(None) => { - return Ok(Self::UnresolvedName { - name: None, + return Ok(Self { ref_type: None, + typeref_value: TyperefValue::UnsolvedName(None), }) } TypedefRaw::Name(Some(name)) => { let Some(pos) = type_by_name.get(&name[..]) else { - return Ok(Self::UnresolvedName { - name: Some(name), + return Ok(Self { ref_type: None, + typeref_value: TyperefValue::UnsolvedName(Some(name)), }); }; pos } }; - Ok(Self::Ref(*pos)) + Ok(Self { + ref_type: None, + typeref_value: TyperefValue::Ref(*pos), + }) } fn new_struct( @@ -647,9 +650,7 @@ impl Typeref { x: TypedefRaw, ) -> Result { let mut result = Self::new(type_by_name, type_by_ord, x)?; - if let Typeref::UnresolvedName { name: _, ref_type } = &mut result { - *ref_type = Some(TyperefType::Struct) - } + result.ref_type = Some(TyperefType::Struct); // TODO check the inner type is in fact a struct Ok(result) } @@ -660,9 +661,7 @@ impl Typeref { x: TypedefRaw, ) -> Result { let mut result = Self::new(type_by_name, type_by_ord, x)?; - if let Typeref::UnresolvedName { name: _, ref_type } = &mut result { - *ref_type = Some(TyperefType::Union) - } + result.ref_type = Some(TyperefType::Union); // TODO check the inner type is in fact a union Ok(result) } @@ -673,9 +672,7 @@ impl Typeref { x: TypedefRaw, ) -> Result { let mut result = Self::new(type_by_name, type_by_ord, x)?; - if let Typeref::UnresolvedName { name: _, ref_type } = &mut result { - *ref_type = Some(TyperefType::Enum) - } + result.ref_type = Some(TyperefType::Enum); // TODO check the inner type is in fact a enum Ok(result) } diff --git a/src/til/size_calculator.rs b/src/til/size_calculator.rs index 32334e2..e9bd53f 100644 --- a/src/til/size_calculator.rs +++ b/src/til/size_calculator.rs @@ -7,7 +7,7 @@ use super::r#enum::Enum; use super::r#struct::StructMember; use super::section::TILSection; use super::union::Union; -use super::{Basic, Type, TypeVariant, Typeref}; +use super::{Basic, Type, TypeVariant, Typeref, TyperefValue}; pub struct TILTypeSizeSolver<'a> { section: &'a TILSection, @@ -173,7 +173,7 @@ impl<'a> TILTypeSizeSolver<'a> { } fn solve_typedef(&mut self, typedef: &Typeref) -> Option { - let Typeref::Ref(idx) = typedef else { + let TyperefValue::Ref(idx) = &typedef.typeref_value else { return None; }; // if cached return it @@ -203,7 +203,7 @@ impl<'a> TILTypeSizeSolver<'a> { self.alignemnt(&array.elem_type, size.unwrap_or(1)) } TypeVariant::Typeref(ty) => { - let Typeref::Ref(idx) = ty else { + let TyperefValue::Ref(idx) = &ty.typeref_value else { return None; }; let ty = &self.section.types[*idx].tinfo; diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 3ced186..712b87b 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -9,7 +9,7 @@ use idb_rs::til::section::TILSection; use idb_rs::til::union::Union; use idb_rs::til::{ Basic, TILTypeInfo, TILTypeSizeSolver, Type, TypeVariant, Typeref, - TyperefType, + TyperefType, TyperefValue, }; use idb_rs::{IDBParser, IDBSectionCompression}; @@ -375,9 +375,9 @@ fn print_til_type_root( TypeVariant::Struct(_) | TypeVariant::Union(_) | TypeVariant::Enum(_) => {} - TypeVariant::Typeref(Typeref::UnresolvedName { - name: _, - ref_type: Some(_), + TypeVariant::Typeref(Typeref { + typeref_value: TyperefValue::UnsolvedName(Some(_)), + ref_type: _, }) => {} // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x443906 _ => write!(fmt, "typedef ")?, @@ -685,36 +685,38 @@ fn print_til_type_typedef( if til_type.is_const { write!(fmt, "const ")?; } + let mut need_prefix_space = false; if print_prefix { - print_til_type_prefix(fmt, section, til_type, true)?; + if let Some(ref_prefix) = typedef.ref_type { + print_typeref_type_prefix(fmt, ref_prefix)?; + need_prefix_space = true; + } } // get the type referenced by the typdef - let need_space = match typedef { - Typeref::Ref(idx) => { + let need_type_space = match &typedef.typeref_value { + TyperefValue::Ref(idx) => { + if need_prefix_space { + write!(fmt, " ")?; + } let inner_ty = §ion.types[*idx]; fmt.write_all(&inner_ty.name)?; true } - Typeref::UnresolvedName { - name: Some(name), - ref_type: _, - } => { + TyperefValue::UnsolvedName(Some(name)) => { + if need_prefix_space { + write!(fmt, " ")?; + } fmt.write_all(name)?; true } // Nothing to print - Typeref::UnresolvedName { - name: None, - ref_type: _, + TyperefValue::UnsolvedName(None) | TyperefValue::UnsolvedOrd(_) => { + false } - | Typeref::UnresolvedOrd { - ord: _, - ref_type: _, - } => false, }; // print the type name, if some if let Some(name) = name { - if need_space { + if need_type_space { write!(fmt, " ")?; } fmt.write_all(name)?; @@ -861,7 +863,7 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - false, + true, print_name, ); }; @@ -875,7 +877,7 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - false, + true, print_name, ); } @@ -892,32 +894,22 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - false, + true, print_name, ); } }; - let inner_type = match typedef { - Typeref::Ref(idx) => §ion.types[*idx], - Typeref::UnresolvedName { - name: Some(name), - ref_type, - } => { - if let Some(ref_type) = ref_type { + let inner_type = match &typedef.typeref_value { + TyperefValue::Ref(idx) => §ion.types[*idx], + TyperefValue::UnsolvedName(Some(name)) => { + if let Some(ref_type) = &typedef.ref_type { print_typeref_type_prefix(fmt, *ref_type)?; } fmt.write_all(&name)?; return Ok(()); } - Typeref::UnresolvedOrd { - ord: _, - ref_type: _, - } - | Typeref::UnresolvedName { - name: None, - ref_type: _, - } => { + TyperefValue::UnsolvedOrd(_) | TyperefValue::UnsolvedName(None) => { return print_til_type( fmt, section, @@ -925,7 +917,7 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - false, + true, print_name, ); } @@ -943,7 +935,7 @@ fn print_til_type_complex_member( til, is_vft, print_pointer_space, - false, + true, print_name, ); } @@ -1182,54 +1174,26 @@ fn print_til_struct_member_basic_att( Ok(()) } -fn print_til_type_prefix( - fmt: &mut impl Write, - section: &TILSection, - tinfo: &Type, - with_space: bool, -) -> Result<()> { - match &tinfo.type_variant { - TypeVariant::Typeref(Typeref::Ref(idx)) => { - // NOTE don't go other level down - match §ion.types[*idx].tinfo.type_variant { - TypeVariant::Union(_) => write!(fmt, "union")?, - TypeVariant::Struct(_) => write!(fmt, "struct")?, - TypeVariant::Enum(_) => write!(fmt, "enum")?, - _ => return Ok(()), - } - } - TypeVariant::Typeref(Typeref::UnresolvedName { - name: _, - ref_type: Some(ref_type), - }) => print_typeref_type_prefix(fmt, *ref_type)?, - TypeVariant::Union(_) => write!(fmt, "union")?, - TypeVariant::Struct(_) => write!(fmt, "struct")?, - TypeVariant::Enum(_) => write!(fmt, "enum")?, - _ => return Ok(()), - } - if with_space { - write!(fmt, " ")?; - } - Ok(()) -} - fn print_til_type_only( fmt: &mut impl Write, section: &TILSection, tinfo: &Type, ) -> Result<()> { match &tinfo.type_variant { - TypeVariant::Typeref(Typeref::UnresolvedName { - name: Some(name), + TypeVariant::Typeref(Typeref { + typeref_value: TyperefValue::UnsolvedName(Some(name)), ref_type: _, }) => { fmt.write_all(name)?; } - TypeVariant::Typeref(Typeref::UnresolvedName { - name: None, + TypeVariant::Typeref(Typeref { + typeref_value: TyperefValue::UnsolvedName(None), ref_type: _, }) => {} - TypeVariant::Typeref(Typeref::Ref(idx)) => { + TypeVariant::Typeref(Typeref { + typeref_value: TyperefValue::Ref(idx), + ref_type: _, + }) => { //TypeVariant::Typeref(Typeref::Ordinal(ord)) => { let ty = §ion.types[*idx]; fmt.write_all(&ty.name)?; @@ -1331,10 +1295,10 @@ fn is_vft(section: &TILSection, typ: &Type) -> bool { // TODO struct with only function-pointers is also vftable? TypeVariant::Struct(ty) => ty.is_vft, TypeVariant::Typeref(typedef) => { - let inner_type = match typedef { - Typeref::Ref(idx) => §ion.types[*idx], - Typeref::UnresolvedOrd { .. } - | Typeref::UnresolvedName { .. } => return false, + let inner_type = match &typedef.typeref_value { + TyperefValue::Ref(idx) => §ion.types[*idx], + TyperefValue::UnsolvedOrd(_) + | TyperefValue::UnsolvedName(_) => return false, }; is_vft(section, &inner_type.tinfo) } From 73832de86ec5cd0f201113fdc86b5b179ab3fd42 Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 14 Jan 2025 08:26:53 -0300 Subject: [PATCH 52/53] fix tilib print format issues --- src/tools/tilib.rs | 27 +++++++++++++-------------- 1 file changed, 13 insertions(+), 14 deletions(-) diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 712b87b..264bb7c 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -376,8 +376,8 @@ fn print_til_type_root( | TypeVariant::Union(_) | TypeVariant::Enum(_) => {} TypeVariant::Typeref(Typeref { - typeref_value: TyperefValue::UnsolvedName(Some(_)), - ref_type: _, + typeref_value: TyperefValue::UnsolvedName(None), + ref_type: Some(_), }) => {} // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x443906 _ => write!(fmt, "typedef ")?, @@ -652,7 +652,7 @@ fn print_til_type_array( &til_array.elem_type, false, print_pointer_space, - false, + true, true, )?; if let Some(name) = name { @@ -685,38 +685,36 @@ fn print_til_type_typedef( if til_type.is_const { write!(fmt, "const ")?; } - let mut need_prefix_space = false; + let mut need_space = false; if print_prefix { if let Some(ref_prefix) = typedef.ref_type { print_typeref_type_prefix(fmt, ref_prefix)?; - need_prefix_space = true; + need_space = true; } } // get the type referenced by the typdef - let need_type_space = match &typedef.typeref_value { + match &typedef.typeref_value { TyperefValue::Ref(idx) => { - if need_prefix_space { + if need_space { write!(fmt, " ")?; } let inner_ty = §ion.types[*idx]; fmt.write_all(&inner_ty.name)?; - true + need_space = true; } TyperefValue::UnsolvedName(Some(name)) => { - if need_prefix_space { + if need_space { write!(fmt, " ")?; } fmt.write_all(name)?; - true + need_space = true; } // Nothing to print - TyperefValue::UnsolvedName(None) | TyperefValue::UnsolvedOrd(_) => { - false - } + TyperefValue::UnsolvedName(None) | TyperefValue::UnsolvedOrd(_) => {} }; // print the type name, if some if let Some(name) = name { - if need_type_space { + if need_space { write!(fmt, " ")?; } fmt.write_all(name)?; @@ -853,6 +851,7 @@ fn print_til_type_complex_member( print_pointer_space: bool, print_name: bool, ) -> Result<()> { + // TODO make closure that print member atts: VFT, align, unaligned, packed, etc // if parent is not named, don't embeded it, because we can verify if it's part // of the parent let Some(parent_name) = parent_name else { From c44932259b35f467905e177f5f54b92f913c65df Mon Sep 17 00:00:00 2001 From: rbran Date: Tue, 14 Jan 2025 10:27:10 -0300 Subject: [PATCH 53/53] add IDBString for better debug format --- src/lib.rs | 32 ++++++++++++++++++++++++++ src/til.rs | 33 +++++++++++++++------------ src/til/array.rs | 3 ++- src/til/enum.rs | 5 +++-- src/til/function.rs | 5 +++-- src/til/pointer.rs | 3 ++- src/til/section.rs | 13 ++++++----- src/til/struct.rs | 9 ++++---- src/til/union.rs | 5 +++-- src/tools/dump_til.rs | 4 ++-- src/tools/tilib.rs | 52 ++++++++++++++++++++++++++----------------- 11 files changed, 109 insertions(+), 55 deletions(-) diff --git a/src/lib.rs b/src/lib.rs index 8ce6ff8..43c85a9 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -5,7 +5,9 @@ pub(crate) mod ida_reader; pub mod nam; pub mod til; +use std::borrow::Cow; use std::fmt::Debug; +use std::fmt::Write; use std::io::SeekFrom; use std::num::NonZeroU64; @@ -561,6 +563,36 @@ impl VaVersion { } } +#[derive(Clone)] +pub struct IDBString(Vec); + +impl IDBString { + pub fn new(data: Vec) -> Self { + Self(data) + } + + pub fn as_utf8_lossy(&self) -> Cow { + String::from_utf8_lossy(&self.0) + } + + pub fn as_bytes(&self) -> &[u8] { + &self.0 + } + + pub fn into_inner(self) -> Vec { + self.0 + } +} + +impl std::fmt::Debug for IDBString { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + f.write_char('"')?; + f.write_str(&self.as_utf8_lossy())?; + f.write_char('"')?; + Ok(()) + } +} + fn write_string_len_u8( mut output: O, value: &[u8], diff --git a/src/til.rs b/src/til.rs index e1ded8c..f0fd53b 100644 --- a/src/til.rs +++ b/src/til.rs @@ -28,10 +28,11 @@ use crate::til::pointer::{Pointer, PointerRaw}; use crate::til::r#enum::{Enum, EnumRaw}; use crate::til::r#struct::{Struct, StructRaw}; use crate::til::union::{Union, UnionRaw}; +use crate::IDBString; #[derive(Debug, Clone)] pub struct TILTypeInfo { - pub name: Vec, + pub name: IDBString, pub ordinal: u64, pub tinfo: Type, } @@ -41,14 +42,14 @@ impl TILTypeInfo { til: &TILSectionHeader, type_by_name: &HashMap, usize>, type_by_ord: &HashMap, - name: Vec, + name: IDBString, ordinal: u64, tinfo_raw: TypeRaw, fields: Vec>, ) -> Result { let mut fields_iter = fields .into_iter() - .map(|field| (!field.is_empty()).then_some(field)); + .map(|field| (!field.is_empty()).then_some(IDBString::new(field))); let tinfo = Type::new( til, type_by_name, @@ -60,7 +61,7 @@ impl TILTypeInfo { ensure!( fields_iter.next().is_none(), "Extra fields found for til type \"{}\"", - String::from_utf8_lossy(&name) + name.as_utf8_lossy() ); Ok(Self { name, @@ -73,7 +74,7 @@ impl TILTypeInfo { #[derive(Debug, Clone)] pub(crate) struct TILTypeInfoRaw { _flags: u32, - pub name: Vec, + pub name: IDBString, pub ordinal: u64, pub tinfo: TypeRaw, _cmt: Vec, @@ -111,7 +112,7 @@ impl TILTypeInfoRaw { fn read_inner(cursor: &mut &[u8], til: &TILSectionHeader) -> Result { let flags: u32 = cursor.read_u32()?; // TODO verify if flags equal to 0x7fff_fffe? - let name = cursor.read_c_string_raw()?; + let name = IDBString::new(cursor.read_c_string_raw()?); let is_u64 = (flags >> 31) != 0; let ordinal = match (til.format, is_u64) { // formats below 0x12 doesn't have 64 bits ord @@ -121,7 +122,7 @@ impl TILTypeInfoRaw { let tinfo = TypeRaw::read(&mut *cursor, til).with_context(|| { format!( "parsing `TILTypeInfo::tiinfo` for type \"{}\"", - String::from_utf8_lossy(&name) + name.as_utf8_lossy() ) })?; let _info = cursor.read_c_string_raw()?; @@ -169,7 +170,7 @@ impl Type { type_by_name: &HashMap, usize>, type_by_ord: &HashMap, tinfo_raw: TypeRaw, - fields: &mut impl Iterator>>, + fields: &mut impl Iterator>, ) -> Result { let type_variant = match tinfo_raw.variant { TypeVariantRaw::Basic(x) => TypeVariant::Basic(x), @@ -231,7 +232,7 @@ impl Type { let header = section::TILSectionHeader { format: 12, flags: section::TILSectionFlags(0), - description: Vec::new(), + description: IDBString::new(Vec::new()), dependencies: Vec::new(), size_enum: None, size_int: 4.try_into().unwrap(), @@ -265,7 +266,7 @@ impl Type { if field.is_empty() { None } else { - Some(field) + Some(IDBString::new(field)) } }); let result = Self::new( @@ -563,7 +564,7 @@ impl Basic { #[derive(Clone, Debug)] pub enum TypedefRaw { Ordinal(u32), - Name(Option>), + Name(Option), } impl TypedefRaw { @@ -580,7 +581,11 @@ impl TypedefRaw { } Ok(Self::Ordinal(de)) } - _ => Ok(Self::Name(if buf.is_empty() { None } else { Some(buf) })), + _ => Ok(Self::Name(if buf.is_empty() { + None + } else { + Some(IDBString::new(buf)) + })), } } } @@ -594,7 +599,7 @@ pub struct Typeref { #[derive(Clone, Debug)] pub enum TyperefValue { Ref(usize), - UnsolvedName(Option>), + UnsolvedName(Option), UnsolvedOrd(u32), } @@ -629,7 +634,7 @@ impl Typeref { }) } TypedefRaw::Name(Some(name)) => { - let Some(pos) = type_by_name.get(&name[..]) else { + let Some(pos) = type_by_name.get(name.as_bytes()) else { return Ok(Self { ref_type: None, typeref_value: TyperefValue::UnsolvedName(Some(name)), diff --git a/src/til/array.rs b/src/til/array.rs index 2c31434..670cffa 100644 --- a/src/til/array.rs +++ b/src/til/array.rs @@ -3,6 +3,7 @@ use std::num::{NonZeroU16, NonZeroU8}; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::{Type, TypeAttribute, TypeRaw}; +use crate::IDBString; use super::section::TILSectionHeader; @@ -19,7 +20,7 @@ impl Array { type_by_name: &HashMap, usize>, type_by_ord: &HashMap, value: ArrayRaw, - fields: &mut impl Iterator>>, + fields: &mut impl Iterator>, ) -> anyhow::Result { Ok(Self { alignment: value.alignment, diff --git a/src/til/enum.rs b/src/til/enum.rs index e864212..92bb38b 100644 --- a/src/til/enum.rs +++ b/src/til/enum.rs @@ -2,6 +2,7 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::{flag, TypeAttribute, TypeRaw, TypeVariantRaw}; +use crate::IDBString; use anyhow::{anyhow, ensure}; use super::section::TILSectionHeader; @@ -11,7 +12,7 @@ pub struct Enum { pub is_signed: bool, pub is_unsigned: bool, pub output_format: EnumFormat, - pub members: Vec<(Option>, u64)>, + pub members: Vec<(Option, u64)>, pub groups: Option>, pub storage_size: Option, // TODO parse type attributes @@ -21,7 +22,7 @@ impl Enum { pub(crate) fn new( _til: &TILSectionHeader, value: EnumRaw, - fields: &mut impl Iterator>>, + fields: &mut impl Iterator>, ) -> anyhow::Result { let members = value .members diff --git a/src/til/function.rs b/src/til/function.rs index e0a21b2..088b12a 100644 --- a/src/til/function.rs +++ b/src/til/function.rs @@ -3,6 +3,7 @@ use std::num::NonZeroU8; use crate::ida_reader::{IdaGenericBufUnpack, IdaGenericUnpack}; use crate::til::{Basic, Type, TypeRaw}; +use crate::IDBString; use anyhow::{anyhow, ensure, Context, Result}; use super::section::TILSectionHeader; @@ -12,7 +13,7 @@ use super::TypeVariantRaw; pub struct Function { pub calling_convention: Option, pub ret: Box, - pub args: Vec<(Option>, Type, Option)>, + pub args: Vec<(Option, Type, Option)>, pub retloc: Option, pub method: Option, @@ -32,7 +33,7 @@ impl Function { type_by_name: &HashMap, usize>, type_by_ord: &HashMap, value: FunctionRaw, - fields: &mut impl Iterator>>, + fields: &mut impl Iterator>, ) -> Result { let ret = Type::new( til, diff --git a/src/til/pointer.rs b/src/til/pointer.rs index 8b52c44..46ecbd0 100644 --- a/src/til/pointer.rs +++ b/src/til/pointer.rs @@ -4,6 +4,7 @@ use anyhow::Result; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::{Type, TypeAttribute, TypeRaw}; +use crate::IDBString; use super::section::TILSectionHeader; @@ -21,7 +22,7 @@ impl Pointer { type_by_name: &HashMap, usize>, type_by_ord: &HashMap, raw: PointerRaw, - fields: &mut impl Iterator>>, + fields: &mut impl Iterator>, ) -> Result { let shifted = raw .shifted diff --git a/src/til/section.rs b/src/til/section.rs index 2239c62..ba6cd08 100644 --- a/src/til/section.rs +++ b/src/til/section.rs @@ -1,7 +1,7 @@ use crate::id0::{Compiler, Id0TilOrd}; use crate::ida_reader::{IdaGenericBufUnpack, IdaGenericUnpack}; use crate::til::{flag, TILMacro, TILTypeInfo, TILTypeInfoRaw}; -use crate::IDBSectionCompression; +use crate::{IDBSectionCompression, IDBString}; use anyhow::{anyhow, ensure, Result}; use serde::{Deserialize, Serialize}; @@ -34,11 +34,11 @@ pub(crate) struct TILSectionRaw { pub struct TILSectionHeader { pub format: u32, /// short file name (without path and extension) - pub description: Vec, + pub description: IDBString, pub flags: TILSectionFlags, // TODO unclear what exacly dependency is for /// module required - pub dependencies: Vec>, + pub dependencies: Vec, /// the compiler used to generated types pub compiler_id: Compiler, /// default calling convention @@ -134,13 +134,14 @@ impl TILSectionRaw { .dependencies .split(|x| *x == b',') .map(<[_]>::to_vec) + .map(IDBString::new) .collect() } else { vec![] }; let mut header = TILSectionHeader { format: header_raw.format, - description: header_raw.description, + description: IDBString::new(header_raw.description), flags: header_raw.flags, dependencies, compiler_id: Compiler::from_value(header_raw.compiler_id), @@ -615,7 +616,7 @@ impl TILSection { } pub fn get_name_idx(&self, name: &[u8]) -> Option { - self.types.iter().position(|ty| ty.name.as_slice() == name) + self.types.iter().position(|ty| ty.name.as_bytes() == name) } pub fn get_name(&self, name: &[u8]) -> Option<&TILTypeInfo> { @@ -685,7 +686,7 @@ impl TILSection { .types .iter() .enumerate() - .map(|(i, til)| (til.name.to_vec(), i)) + .map(|(i, til)| (til.name.clone().into_inner(), i)) .collect(); let type_by_ord = type_info_raw .types diff --git a/src/til/struct.rs b/src/til/struct.rs index a96ce81..3cac211 100644 --- a/src/til/struct.rs +++ b/src/til/struct.rs @@ -3,6 +3,7 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::{Type, TypeRaw}; +use crate::IDBString; use anyhow::{anyhow, ensure, Context, Result}; use num_enum::{FromPrimitive, IntoPrimitive, TryFromPrimitive}; @@ -32,7 +33,7 @@ impl Struct { type_by_name: &HashMap, usize>, type_by_ord: &HashMap, value: StructRaw, - fields: &mut impl Iterator>>, + fields: &mut impl Iterator>, ) -> Result { let members = value .members @@ -184,7 +185,7 @@ impl StructRaw { #[derive(Clone, Debug)] pub struct StructMember { - pub name: Option>, + pub name: Option, pub member_type: Type, pub att: Option, @@ -199,11 +200,11 @@ pub struct StructMember { impl StructMember { fn new( til: &TILSectionHeader, - name: Option>, + name: Option, type_by_name: &HashMap, usize>, type_by_ord: &HashMap, m: StructMemberRaw, - fields: &mut impl Iterator>>, + fields: &mut impl Iterator>, ) -> Result { Ok(Self { name, diff --git a/src/til/union.rs b/src/til/union.rs index 404d468..975a913 100644 --- a/src/til/union.rs +++ b/src/til/union.rs @@ -5,6 +5,7 @@ use std::num::NonZeroU8; use crate::ida_reader::IdaGenericBufUnpack; use crate::til::{Type, TypeRaw}; +use crate::IDBString; use super::section::TILSectionHeader; use super::{TypeAttribute, TypeVariantRaw}; @@ -13,7 +14,7 @@ use super::{TypeAttribute, TypeVariantRaw}; pub struct Union { pub effective_alignment: u16, pub alignment: Option, - pub members: Vec<(Option>, Type)>, + pub members: Vec<(Option, Type)>, pub is_unaligned: bool, pub is_unknown_8: bool, @@ -24,7 +25,7 @@ impl Union { type_by_name: &HashMap, usize>, type_by_ord: &HashMap, value: UnionRaw, - fields: &mut impl Iterator>>, + fields: &mut impl Iterator>, ) -> Result { let members = value .members diff --git a/src/tools/dump_til.rs b/src/tools/dump_til.rs index 4f93465..9e06748 100644 --- a/src/tools/dump_til.rs +++ b/src/tools/dump_til.rs @@ -55,9 +55,9 @@ pub fn dump_til(args: &Args) -> Result<()> { } = &til; // write the header info println!("format: {format}"); - println!("description: {}", String::from_utf8_lossy(description)); + println!("description: {}", description.as_utf8_lossy()); for (i, dependency) in dependencies.iter().enumerate() { - println!("dependency-{i}: {}", String::from_utf8_lossy(dependency)); + println!("dependency-{i}: {}", dependency.as_utf8_lossy()); } println!("id: {compiler_id:?}"); println!("cc: {cc:?}"); diff --git a/src/tools/tilib.rs b/src/tools/tilib.rs index 264bb7c..20c85d9 100644 --- a/src/tools/tilib.rs +++ b/src/tools/tilib.rs @@ -11,7 +11,7 @@ use idb_rs::til::{ Basic, TILTypeInfo, TILTypeSizeSolver, Type, TypeVariant, Typeref, TyperefType, TyperefValue, }; -use idb_rs::{IDBParser, IDBSectionCompression}; +use idb_rs::{IDBParser, IDBSectionCompression, IDBString}; use std::fs::File; use std::io::{BufReader, Result, Write}; @@ -45,7 +45,7 @@ fn print_til_section(mut fmt: impl Write, section: &TILSection) -> Result<()> { // TODO open those files? What todo with then? write!(fmt, "Warning: ")?; for dependency in §ion.header.dependencies { - fmt.write_all(dependency)?; + fmt.write_all(dependency.as_bytes())?; writeln!(fmt, ": No such file or directory")?; } } @@ -83,7 +83,7 @@ fn print_header(fmt: &mut impl Write, section: &TILSection) -> Result<()> { // the description of the file // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x40b710 write!(fmt, "Description: ")?; - fmt.write_all(§ion.header.description)?; + fmt.write_all(§ion.header.description.as_bytes())?; writeln!(fmt)?; // flags from the section header @@ -248,12 +248,13 @@ fn print_symbols( write!(fmt, " {} ", sym_kind)?; // TODO investiage this - let name = if symbol.ordinal == 0 && symbol.name.first() == Some(&b'_') + let symbol_name = symbol.name.as_bytes(); + let name = if symbol.ordinal == 0 && symbol_name.first() == Some(&b'_') { // remove the first "_", if any - &symbol.name[1..] + &symbol.name.as_bytes()[1..] } else { - &symbol.name + symbol.name.as_bytes() }; // InnerRef fb47f2c2-3c08-4d40-b7ab-3c7736dce31d 0x409a3a print_til_type( @@ -338,7 +339,7 @@ fn print_types_by_ordinals( print_til_type_root( fmt, section, - Some(&final_type.name), + Some(final_type.name.as_bytes()), &final_type.tinfo, )?; writeln!(fmt, ";")?; @@ -352,12 +353,17 @@ fn print_types_by_name( solver: &mut TILTypeSizeSolver<'_>, ) -> Result<()> { for (idx, symbol) in section.types.iter().enumerate() { - if symbol.name.is_empty() { + if symbol.name.as_bytes().is_empty() { continue; } print_til_type_len(fmt, Some(idx), &symbol.tinfo, solver).unwrap(); write!(fmt, " ")?; - print_til_type_root(fmt, section, Some(&symbol.name), &symbol.tinfo)?; + print_til_type_root( + fmt, + section, + Some(symbol.name.as_bytes()), + &symbol.tinfo, + )?; writeln!(fmt, ";")?; } Ok(()) @@ -612,7 +618,7 @@ fn print_til_type_function( if i != 0 { write!(fmt, ", ")?; } - let param_name = param_name.as_ref().map(Vec::as_slice); + let param_name = param_name.as_ref().map(IDBString::as_bytes); print_til_type( fmt, section, param_name, param, false, true, false, true, )?; @@ -699,14 +705,14 @@ fn print_til_type_typedef( write!(fmt, " ")?; } let inner_ty = §ion.types[*idx]; - fmt.write_all(&inner_ty.name)?; + fmt.write_all(inner_ty.name.as_bytes())?; need_space = true; } TyperefValue::UnsolvedName(Some(name)) => { if need_space { write!(fmt, " ")?; } - fmt.write_all(name)?; + fmt.write_all(name.as_bytes())?; need_space = true; } // Nothing to print @@ -785,7 +791,7 @@ fn print_til_type_struct( write!(fmt, "{{")?; for member in members { - let member_name = member.name.as_deref(); + let member_name = member.name.as_ref().map(IDBString::as_bytes); print_til_type_complex_member( fmt, section, @@ -816,7 +822,7 @@ fn print_til_type_union( if let Some(align) = til_union.alignment { write!(fmt, "__attribute__((aligned({align}))) ")?; } - if let Some(name) = name { + if let Some(name) = &name { if print_name { fmt.write_all(name)?; write!(fmt, " ")?; @@ -824,7 +830,7 @@ fn print_til_type_union( } write!(fmt, "{{")?; for (member_name, member) in &til_union.members { - let member_name = member_name.as_deref(); + let member_name = member_name.as_ref().map(IDBString::as_bytes); print_til_type_complex_member( fmt, section, @@ -905,7 +911,7 @@ fn print_til_type_complex_member( if let Some(ref_type) = &typedef.ref_type { print_typeref_type_prefix(fmt, *ref_type)?; } - fmt.write_all(&name)?; + fmt.write_all(name.as_bytes())?; return Ok(()); } TyperefValue::UnsolvedOrd(_) | TyperefValue::UnsolvedName(None) => { @@ -926,7 +932,11 @@ fn print_til_type_complex_member( // we embed it let qualified_parent_name: Vec<_> = parent_name.iter().chain(b"::").copied().collect(); - if !inner_type.name.starts_with(&qualified_parent_name) { + if !inner_type + .name + .as_bytes() + .starts_with(&qualified_parent_name) + { return print_til_type( fmt, section, @@ -942,7 +952,7 @@ fn print_til_type_complex_member( print_til_type( fmt, section, - Some(&inner_type.name), + Some(inner_type.name.as_bytes()), &inner_type.tinfo, is_vft, print_pointer_space, @@ -987,7 +997,7 @@ fn print_til_type_enum( write!(fmt, "{{")?; for (member_name, value) in &til_enum.members { if let Some(member_name) = member_name { - fmt.write_all(member_name)?; + fmt.write_all(member_name.as_bytes())?; } write!(fmt, " = ")?; match til_enum.output_format { @@ -1183,7 +1193,7 @@ fn print_til_type_only( typeref_value: TyperefValue::UnsolvedName(Some(name)), ref_type: _, }) => { - fmt.write_all(name)?; + fmt.write_all(name.as_bytes())?; } TypeVariant::Typeref(Typeref { typeref_value: TyperefValue::UnsolvedName(None), @@ -1195,7 +1205,7 @@ fn print_til_type_only( }) => { //TypeVariant::Typeref(Typeref::Ordinal(ord)) => { let ty = §ion.types[*idx]; - fmt.write_all(&ty.name)?; + fmt.write_all(ty.name.as_bytes())?; } _ => {} };