From d8d00eb146241978ef21ed4d6c35ac9c68b1a86e Mon Sep 17 00:00:00 2001 From: metamuffin Date: Mon, 10 Feb 2025 17:38:55 +0100 Subject: read serialized file tables --- src/helper.rs | 35 ++++++- src/lib.rs | 1 + src/main.rs | 138 +-------------------------- src/serialized_file.rs | 248 +++++++++++++++++++++++++++++++++++++++++++++++++ src/unityfs.rs | 29 ++++-- 5 files changed, 309 insertions(+), 142 deletions(-) create mode 100644 src/serialized_file.rs (limited to 'src') diff --git a/src/helper.rs b/src/helper.rs index 0b126ad..cb52b8c 100644 --- a/src/helper.rs +++ b/src/helper.rs @@ -1,4 +1,4 @@ -use std::io::{Read, Result}; +use std::io::{Read, Result, Seek}; #[derive(Debug, Clone, Copy, PartialEq)] pub enum Endianness { @@ -23,9 +23,13 @@ pub trait ReadExt { fn read_u64(&mut self, e: Endianness) -> Result; fn read_u64_be(&mut self) -> Result; fn read_u64_le(&mut self) -> Result; + fn read_i64(&mut self, e: Endianness) -> Result; + fn read_i64_be(&mut self) -> Result; + fn read_i64_le(&mut self) -> Result; fn read_u128_be(&mut self) -> Result; fn read_cstr(&mut self) -> Result; } + impl ReadExt for T { fn read_u8(&mut self) -> Result { let mut buf = [0; 1]; @@ -112,6 +116,22 @@ impl ReadExt for T { self.read_exact(&mut buf)?; Ok(u64::from_le_bytes(buf)) } + fn read_i64(&mut self, e: Endianness) -> Result { + match e { + Endianness::Big => self.read_i64_be(), + Endianness::Little => self.read_i64_le(), + } + } + fn read_i64_be(&mut self) -> Result { + let mut buf = [0; 8]; + self.read_exact(&mut buf)?; + Ok(i64::from_be_bytes(buf)) + } + fn read_i64_le(&mut self) -> Result { + let mut buf = [0; 8]; + self.read_exact(&mut buf)?; + Ok(i64::from_le_bytes(buf)) + } fn read_u128_be(&mut self) -> Result { let mut buf = [0; 16]; self.read_exact(&mut buf)?; @@ -130,3 +150,16 @@ impl ReadExt for T { Ok(String::from_utf8_lossy(&s).to_string()) } } + +pub trait AlignExt { + fn align(&mut self, size: u64) -> Result<()>; +} +impl AlignExt for T { + fn align(&mut self, size: u64) -> Result<()> { + let off = self.stream_position()? % size; + if off != 0 { + self.seek_relative((size - off) as i64)?; + } + Ok(()) + } +} diff --git a/src/lib.rs b/src/lib.rs index d2370b3..5022d0d 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -1,3 +1,4 @@ pub mod unityfs; pub mod helper; pub mod common_strings; +pub mod serialized_file; diff --git a/src/main.rs b/src/main.rs index a0b35c3..4d91578 100644 --- a/src/main.rs +++ b/src/main.rs @@ -1,14 +1,5 @@ -use log::debug; -use std::{ - env::args, - fs::File, - io::{BufReader, Cursor, Read}, -}; -use unity_tools::{ - common_strings::COMMON_STRINGS, - helper::{Endianness, ReadExt}, - unityfs::UnityFS, -}; +use std::{env::args, fs::File, io::BufReader}; +use unity_tools::{serialized_file::read_serialized_file, unityfs::UnityFS}; fn main() -> anyhow::Result<()> { env_logger::init_from_env("LOG"); @@ -19,134 +10,15 @@ fn main() -> anyhow::Result<()> { if node.name.ends_with(".resource") || node.name.ends_with("resS") { continue; } - let mut cab = fs.read(&node)?; + let cab = fs.read(&node)?; // let mut writer = File::create(format!("/tmp/{}", node.name))?; // std::io::copy(&mut cab, &mut writer)?; // continue; - let mut metadata_size = cab.read_u32_be()?; - let mut file_size = cab.read_u32_be()? as u64; - let format = cab.read_u32_be()?; - let mut data_offset = cab.read_u32_be()? as u64; + let file = read_serialized_file(cab)?; + eprintln!("{file:#?}"); - debug!("format={format}"); - - assert!(format >= 9); - let e = match cab.read_u32_be()? { - 0 => Endianness::Little, - _ => Endianness::Big, - }; - debug!("endianess={e:?}"); - - if format >= 22 { - metadata_size = cab.read_u32(e)?; - file_size = cab.read_u64(e)?; - data_offset = cab.read_u64(e)?; - cab.read_u64(e)?; - } - debug!("metadata_size={metadata_size}"); - debug!("file_size={file_size}"); - debug!("data_offset={data_offset}"); - - let generator_version = cab.read_cstr()?; - let target_platform = cab.read_u32_le()?; - debug!("generator_version={generator_version:?}"); - debug!("target_platform={target_platform}"); - - let has_type_trees = cab.read_u8()? != 0; - let num_types = cab.read_u32(e)?; - debug!("has_type_trees={has_type_trees:?}"); - debug!("num_types={num_types}"); - - for _ in 0..num_types { - let class_id = cab.read_i32(e)?; - let stripped_type = cab.read_u8()? != 0; - let script_index = cab.read_i16(e)?; - let mut script_id = 0; - // TODO reftype - if class_id == 114 { - script_id = cab.read_u128_be()?; - } - let _old_hash = cab.read_u128_be()?; - - eprintln!("class_id={class_id}"); - eprintln!("stripped_type={stripped_type}"); - eprintln!("script_index={script_index}"); - eprintln!("script_id={script_id}"); - - if has_type_trees { - let num_nodes = cab.read_u32(e)?; - let size = cab.read_u32(e)?; - eprintln!("tree:num_nodes={num_nodes}"); - eprintln!("tree:size={size}"); - - let mut node_data = vec![0u8; num_nodes as usize * 32]; - cab.read_exact(&mut node_data)?; - let mut node_data = Cursor::new(node_data); - let mut string_data = vec![0u8; size as usize]; - cab.read_exact(&mut string_data)?; - - let get_string = |off: u32| { - let data = if off & 0x80000000 != 0 { - let off = off & 0x7fffffff; - &COMMON_STRINGS[(off & 0x7fffffff) as usize..] - } else { - &string_data[off as usize..] - }; - String::from_utf8( - data.iter() - .copied() - .take_while(|e| *e != 0) - .collect::>(), - ) - }; - - let mut nodes = Vec::new(); - for _ in 0..num_nodes { - nodes.push(TypeTreeNode { - version: node_data.read_u16(e)?, - level: node_data.read_u8()?, - type_flags: node_data.read_u8()?, - type_string: get_string(node_data.read_u32(e)?)?, - name_string: get_string(node_data.read_u32(e)?)?, - byte_size: node_data.read_i32(e)?, - index: node_data.read_i32(e)?, - flags: node_data.read_i32(e)?, - ref_type_hash: node_data.read_u64(e)?, - }); - } - eprintln!("{nodes:#?}"); - - if format >= 21 { - let num_deps = cab.read_u32(e)?; - for _ in 0..num_deps { - cab.read_u32(e)?; - } - } - } - - if format > 21 { - cab.read_u32_be()?; - } - } - - // let num_objects = cab.read_u32_le()?; - // debug!("num_objects={num_objects}"); - // for _ in 0..num_objects {} } Ok(()) } - -#[derive(Debug)] -struct TypeTreeNode { - version: u16, - level: u8, - type_flags: u8, - type_string: String, - name_string: String, - byte_size: i32, - index: i32, - flags: i32, - ref_type_hash: u64, -} diff --git a/src/serialized_file.rs b/src/serialized_file.rs new file mode 100644 index 0000000..becf1d7 --- /dev/null +++ b/src/serialized_file.rs @@ -0,0 +1,248 @@ +use crate::{ + common_strings::COMMON_STRINGS, + helper::{AlignExt, Endianness, ReadExt}, +}; +use anyhow::Result; +use log::{debug, trace}; +use std::io::{Cursor, Read, Seek}; + +#[derive(Debug)] +pub struct TypeTreeNode { + pub version: u16, + pub level: u8, + pub type_flags: u8, + pub type_string: String, + pub name_string: String, + pub byte_size: i32, + pub index: i32, + pub flags: i32, + pub ref_type_hash: u64, +} + +#[derive(Debug)] +pub struct SeralizedType { + pub class_id: i32, + pub stripped_type: bool, + pub script_type_index: i16, + pub script_id: u128, + + pub type_tree: Vec, + pub type_deps: Vec, +} + +#[derive(Debug)] +pub struct ObjectInfo { + path_id: i64, + data_offset: u64, + data_size: u32, + type_id: i32, +} + +#[derive(Debug)] +pub struct Script { + file_index: u32, + identifier: i64, +} + +#[derive(Debug)] +pub struct External { + something: String, + guid: u128, + r#type: i32, + path_name: String, +} + +#[derive(Debug)] +pub struct SerializedFile { + pub types: Vec, + pub externals: Vec, + pub scripts: Vec