about | summary | refs | log | tree | commit | diff
path: root/src/serialized_file.rs
diff options
context:
space:
mode:
author: metamuffin <metamuffin@disroot.org> 2025-02-10 17:38:55 +0100
committer: metamuffin <metamuffin@disroot.org> 2025-02-10 17:38:55 +0100
commit: d8d00eb146241978ef21ed4d6c35ac9c68b1a86e (patch)
tree: c075bd4f9aa17e30aa05aa74db23377c72cf6823 /src/serialized_file.rs
parent: 3dade4b3815db7bfa1baf3fbb4fb332b29aba363 (diff)
download: unity-tools-d8d00eb146241978ef21ed4d6c35ac9c68b1a86e.tar
unity-tools-d8d00eb146241978ef21ed4d6c35ac9c68b1a86e.tar.bz2
unity-tools-d8d00eb146241978ef21ed4d6c35ac9c68b1a86e.tar.zst
read serialized file tables
Diffstat (limited to 'src/serialized_file.rs')
-rw-r--r-- src/serialized_file.rs 248
1 files changed, 248 insertions, 0 deletions
diff --git a/src/serialized_file.rs b/src/serialized_file.rs
new file mode 100644
index 0000000..becf1d7
--- /dev/null
+++ b/src/serialized_file.rs
@@ -0,0 +1,248 @@
+use crate::{
+ common_strings::COMMON_STRINGS,
+ helper::{AlignExt, Endianness, ReadExt},
+};
+use anyhow::Result;
+use log::{debug, trace};
+use std::io::{Cursor, Read, Seek};
+
+/// One node of a type tree, decoded from a fixed 32-byte record.
+///
+/// Fields appear in the order `read_serialized_file` decodes them from the record.
+/// The two strings are not stored inline: the record holds 32-bit offsets that are
+/// resolved against either the shared `COMMON_STRINGS` table (top bit set) or the
+/// string buffer that follows the node records of the same type.
+#[derive(Debug)]
+pub struct TypeTreeNode {
+ /// 16-bit value at the start of the record.
+ pub version: u16,
+ /// NOTE(review): presumably the nesting depth of this node in the tree — confirm.
+ pub level: u8,
+ /// Raw 8-bit flag field; individual bits are not interpreted here.
+ pub type_flags: u8,
+ /// Type name, resolved from a string-table offset and validated as UTF-8.
+ pub type_string: String,
+ /// Field name, resolved from a string-table offset and validated as UTF-8.
+ pub name_string: String,
+ /// NOTE(review): presumably the serialized size of the value in bytes — confirm.
+ pub byte_size: i32,
+ /// Raw 32-bit index value stored in the record.
+ pub index: i32,
+ /// Raw 32-bit flag field; individual bits are not interpreted here.
+ pub flags: i32,
+ /// Trailing 64-bit value of the record.
+ pub ref_type_hash: u64,
+}
+
+/// One entry of the type table of a serialized file.
+///
+/// Built by `read_serialized_file`, once per declared type.
+#[derive(Debug)]
+pub struct SeralizedType {
+ /// Numeric class identifier; the value 114 makes the reader expect a script id.
+ pub class_id: i32,
+ /// `true` when the stored flag byte is non-zero.
+ pub stripped_type: bool,
+ /// Raw 16-bit script type index stored after the stripped flag.
+ pub script_type_index: i16,
+ /// 128-bit script id, read big-endian; stays 0 unless `class_id` is 114.
+ pub script_id: u128,
+
+ /// Nodes of the type tree; empty when the file carries no type trees.
+ pub type_tree: Vec<TypeTreeNode>,
+ /// Type dependency values; only read for format 21 and newer, and only
+ /// when the file carries type trees.
+ pub type_deps: Vec<u32>,
+}
+
+/// Location and type of one object stored in a serialized file.
+///
+/// Only the table entry is represented here; the object payload itself is not read.
+#[derive(Debug)]
+pub struct ObjectInfo {
+    /// 64-bit identifier of the object as stored in the object table.
+    pub path_id: i64,
+    /// Absolute payload position: the offset stored in the table entry plus the
+    /// data offset announced in the file header.
+    pub data_offset: u64,
+    /// Payload size as stored in the table entry.
+    pub data_size: u32,
+    /// Raw type id stored in the table entry.
+    /// NOTE(review): presumably an index into the type table — confirm.
+    pub type_id: i32,
+}
+
+/// One entry of the script table of a serialized file.
+#[derive(Debug)]
+pub struct Script {
+    /// 32-bit file index stored first in the entry.
+    /// NOTE(review): presumably selects one of the externals — confirm.
+    pub file_index: u32,
+    /// 64-bit identifier, read after re-aligning the stream to 4 bytes.
+    pub identifier: i64,
+}
+
+/// One entry of the externals table of a serialized file.
+#[derive(Debug)]
+pub struct External {
+    /// NUL-terminated string stored first in the entry; its meaning is not
+    /// identified by this reader.
+    pub something: String,
+    /// 128-bit GUID, always read big-endian.
+    pub guid: u128,
+    /// Raw 32-bit type value stored after the GUID.
+    pub r#type: i32,
+    /// NUL-terminated path string that closes the entry.
+    pub path_name: String,
+}
+
+/// Metadata tables of a serialized file, as produced by `read_serialized_file`.
+///
+/// Object payloads are not included; `objects` only records where they are stored.
+#[derive(Debug)]
+pub struct SerializedFile {
+ /// Type table, in file order.
+ pub types: Vec<SeralizedType>,
+ /// Externals table, in file order.
+ pub externals: Vec<External>,
+ /// Script table, in file order.
+ pub scripts: Vec<Script>,
+ /// Object table, in file order.
+ pub objects: Vec<ObjectInfo>,
+ /// NUL-terminated string that closes the metadata section.
+ pub user_string: String,
+}
+
+/// Reads the header and metadata tables of a Unity serialized file.
+///
+/// The stream is consumed sequentially from its current position: fixed header,
+/// generator version and target platform, the type table (with type trees when the
+/// file carries them), the object table, the script table, the externals table and
+/// finally the user string. Object payloads are not read; each [`ObjectInfo`] only
+/// records where its payload is stored.
+///
+/// # Errors
+///
+/// Returns an error when the underlying reader fails, when the format version is
+/// older than 9, when a type-tree string offset points outside its string table or
+/// the string is not valid UTF-8, when an object offset overflows `u64`, or when
+/// the file declares reference types (not supported yet).
+pub fn read_serialized_file(mut file: impl Read + Seek) -> Result<SerializedFile> {
+    // The fixed header words are always big-endian, whatever the body uses.
+    let mut metadata_size = file.read_u32_be()?;
+    let mut file_size = file.read_u32_be()? as u64;
+    let format = file.read_u32_be()?;
+    let mut data_offset = file.read_u32_be()? as u64;
+
+    debug!("format={format}");
+
+    // Unsupported input is a recoverable condition for the caller, not a bug here.
+    anyhow::ensure!(
+        format >= 9,
+        "unsupported serialized file format {format} (expected at least 9)"
+    );
+    // A zero word selects little-endian for the body; anything else big-endian.
+    let e = match file.read_u32_be()? {
+        0 => Endianness::Little,
+        _ => Endianness::Big,
+    };
+    debug!("endianess={e:?}");
+
+    if format >= 22 {
+        // The widened fields are still part of the header, so they stay
+        // big-endian; the body byte order only applies to what follows.
+        metadata_size = file.read_u32_be()?;
+        file_size = file.read_u64(Endianness::Big)?;
+        data_offset = file.read_u64(Endianness::Big)?;
+        // Trailing 64-bit header word with no known use.
+        file.read_u64(Endianness::Big)?;
+    }
+    debug!("metadata_size={metadata_size}");
+    debug!("file_size={file_size}");
+    debug!("data_offset={data_offset}");
+
+    let generator_version = file.read_cstr()?;
+    // Body field: follows the byte order announced by the header.
+    let target_platform = file.read_u32(e)?;
+    debug!("generator_version={generator_version:?}");
+    debug!("target_platform={target_platform}");
+
+    let has_type_trees = file.read_u8()? != 0;
+    let num_types = file.read_u32(e)?;
+    debug!("has_type_trees={has_type_trees:?}");
+    debug!("num_types={num_types}");
+
+    let mut types = Vec::new();
+
+    // NOTE(review): the per-type layout below (stripped flag, script type index,
+    // 32-byte nodes) looks version-dependent in other parsers; older formats that
+    // pass the `>= 9` check may need extra gating — confirm against samples.
+    for _ in 0..num_types {
+        let class_id = file.read_i32(e)?;
+        let stripped_type = file.read_u8()? != 0;
+        let script_type_index = file.read_i16(e)?;
+        let mut script_id = 0;
+        // TODO reftype
+        // Class 114 (presumably MonoBehaviour) carries an extra 16-byte script id.
+        if class_id == 114 {
+            script_id = file.read_u128_be()?;
+        }
+        let _old_hash = file.read_u128_be()?;
+
+        trace!("class_id={class_id}");
+        trace!("stripped_type={stripped_type}");
+        trace!("script_type_index={script_type_index}");
+        trace!("script_id={script_id}");
+
+        let mut type_deps = Vec::new();
+        let mut type_tree = Vec::new();
+        if has_type_trees {
+            let num_nodes = file.read_u32(e)?;
+            let size = file.read_u32(e)?;
+            trace!("tree:num_nodes={num_nodes}");
+            trace!("tree:size={size}");
+
+            // Node records are fixed-size (32 bytes) and are followed by one
+            // string buffer shared by all nodes of this type.
+            let node_bytes = (num_nodes as usize)
+                .checked_mul(32)
+                .ok_or_else(|| anyhow::anyhow!("type tree with {num_nodes} nodes is too large"))?;
+            let mut node_data = vec![0u8; node_bytes];
+            file.read_exact(&mut node_data)?;
+            let mut node_data = Cursor::new(node_data);
+            let mut string_data = vec![0u8; size as usize];
+            file.read_exact(&mut string_data)?;
+
+            // Resolves a string offset: the top bit selects the shared common
+            // string table, otherwise the local buffer. Offsets come from the
+            // file, so they are bounds-checked instead of trusted.
+            let get_string = |off: u32| -> Result<String> {
+                let table = if off & 0x8000_0000 != 0 {
+                    COMMON_STRINGS.get((off & 0x7fff_ffff) as usize..)
+                } else {
+                    string_data.get(off as usize..)
+                };
+                let bytes = table.ok_or_else(|| {
+                    anyhow::anyhow!("type tree string offset {off:#x} is out of bounds")
+                })?;
+                // Strings are NUL-terminated; a missing terminator means "to the end".
+                let len = bytes.iter().position(|b| *b == 0).unwrap_or(bytes.len());
+                Ok(String::from_utf8(bytes[..len].to_vec())?)
+            };
+
+            for _ in 0..num_nodes {
+                // Field initialisers run top to bottom, matching the record layout.
+                type_tree.push(TypeTreeNode {
+                    version: node_data.read_u16(e)?,
+                    level: node_data.read_u8()?,
+                    type_flags: node_data.read_u8()?,
+                    type_string: get_string(node_data.read_u32(e)?)?,
+                    name_string: get_string(node_data.read_u32(e)?)?,
+                    byte_size: node_data.read_i32(e)?,
+                    index: node_data.read_i32(e)?,
+                    flags: node_data.read_i32(e)?,
+                    ref_type_hash: node_data.read_u64(e)?,
+                });
+            }
+
+            if format >= 21 {
+                let num_deps = file.read_u32(e)?;
+                trace!("num_deps={num_deps}");
+                for _ in 0..num_deps {
+                    type_deps.push(file.read_u32(e)?);
+                }
+            }
+        }
+
+        types.push(SeralizedType {
+            class_id,
+            script_id,
+            script_type_index,
+            stripped_type,
+            type_deps,
+            type_tree,
+        });
+    }
+
+    let num_objects = file.read_u32(e)?;
+    debug!("num_objects={num_objects}");
+    let mut objects = Vec::new();
+    for _ in 0..num_objects {
+        file.align(4)?;
+        let path_id = file.read_i64(e)?;
+        // Offsets in the table are relative to the data section start.
+        let relative_offset = if format >= 22 {
+            file.align(4)?;
+            file.read_u64(e)?
+        } else {
+            file.read_u32(e)? as u64
+        };
+        let absolute_offset = relative_offset
+            .checked_add(data_offset)
+            .ok_or_else(|| anyhow::anyhow!("object data offset overflows u64"))?;
+        let data_size = file.read_u32(e)?;
+        let type_id = file.read_i32(e)?;
+        objects.push(ObjectInfo {
+            data_offset: absolute_offset,
+            data_size,
+            path_id,
+            type_id,
+        });
+    }
+
+    let num_scripts = file.read_u32(e)?;
+    debug!("num_scripts={num_scripts}");
+    let mut scripts = Vec::new();
+    for _ in 0..num_scripts {
+        let file_index = file.read_u32(e)?;
+        file.align(4)?;
+        let identifier = file.read_i64(e)?;
+        scripts.push(Script {
+            file_index,
+            identifier,
+        });
+    }
+
+    let num_externals = file.read_u32(e)?;
+    debug!("num_externals={num_externals}");
+    let mut externals = Vec::new();
+    for _ in 0..num_externals {
+        let something = file.read_cstr()?;
+        let guid = file.read_u128_be()?;
+        let r#type = file.read_i32(e)?;
+        let path_name = file.read_cstr()?;
+        externals.push(External {
+            guid,
+            path_name,
+            something,
+            r#type,
+        });
+    }
+
+    if format >= 20 {
+        let num_ref_types = file.read_i32(e)?;
+        debug!("num_ref_types={num_ref_types}");
+        // Reference type entries cannot be skipped without parsing them, so a
+        // file that has any is rejected instead of panicking mid-read.
+        anyhow::ensure!(
+            num_ref_types <= 0,
+            "reference types are not supported yet ({num_ref_types} present)"
+        );
+    }
+
+    let user_string = file.read_cstr()?;
+
+    Ok(SerializedFile {
+        types,
+        externals,
+        objects,
+        scripts,
+        user_string,
+    })
+}