mirror of
https://github.com/Virtual-World-RE/NeoGF.git
synced 2024-11-15 07:45:33 +01:00
Update afstool.py
Added comments
This commit is contained in:
parent
46a32ce45b
commit
a4e659e37a
|
@ -9,18 +9,23 @@ import re
|
||||||
import time
|
import time
|
||||||
|
|
||||||
|
|
||||||
__version__ = "0.1.2"
|
__version__ = "0.1.3"
|
||||||
__author__ = "rigodron, algoflash, GGLinnk"
|
__author__ = "rigodron, algoflash, GGLinnk"
|
||||||
__license__ = "MIT"
|
__license__ = "MIT"
|
||||||
__status__ = "developpement"
|
__status__ = "developpement"
|
||||||
|
|
||||||
|
|
||||||
# Not tested:
|
# Creating afstool.py was a challenge because there is many implementations
|
||||||
|
# and configurations possible. In one hand allowing to configure the rebuild
|
||||||
|
# was usefull but in another it was also important to control errors generated
|
||||||
|
# by those conf files. Using custom exceptions was necessary.
|
||||||
|
|
||||||
|
# Not tested by afstest.py:
|
||||||
class AfsInvalidFileLenError(Exception): pass
|
class AfsInvalidFileLenError(Exception): pass
|
||||||
class AfsEmptyAfsError(Exception): pass
|
class AfsEmptyAfsError(Exception): pass
|
||||||
class AfsInvalidFilenameDirectoryLengthError(Exception): pass
|
class AfsInvalidFilenameDirectoryLengthError(Exception): pass
|
||||||
class AfsInvalidAfsFolderError(Exception): pass
|
class AfsInvalidAfsFolderError(Exception): pass
|
||||||
# Tested:
|
# Tested by afstest.py:
|
||||||
class AfsInvalidMagicNumberError(Exception): pass
|
class AfsInvalidMagicNumberError(Exception): pass
|
||||||
class AfsInvalidFilesRebuildStrategy(Exception): pass
|
class AfsInvalidFilesRebuildStrategy(Exception): pass
|
||||||
class AfsFilenameDirectoryValueError(Exception): pass
|
class AfsFilenameDirectoryValueError(Exception): pass
|
||||||
|
@ -40,8 +45,21 @@ class AfsEmptyBlockValueError(Exception): pass
|
||||||
class AfsEmptyBlockAlignError(Exception): pass
|
class AfsEmptyBlockAlignError(Exception): pass
|
||||||
|
|
||||||
|
|
||||||
|
#########################################################################
|
||||||
|
# class: FilenameResolver
|
||||||
|
# Constructor: system path of the unpack folder
|
||||||
|
# DESCRIPTION
|
||||||
|
# Use sys/filename_resolver.csv to resolve filename to their index
|
||||||
|
# in the TOC. Allow also to rename files since the FD and the TOC
|
||||||
|
# are not rebuild during pack.
|
||||||
|
# The resolver is necessary in multiple cases:
|
||||||
|
# * When multiple packed files have the same name in the FD
|
||||||
|
# * When there is no FD
|
||||||
|
# * When names contains invalid path operator (not implemented yet)
|
||||||
|
#########################################################################
|
||||||
class FilenameResolver:
|
class FilenameResolver:
|
||||||
__sys_path = None
|
__sys_path = None
|
||||||
|
# name_tuples: {(unpacked_filename, toc_index), ... }
|
||||||
__names_tuples = None
|
__names_tuples = None
|
||||||
__resolve_buffer = ""
|
__resolve_buffer = ""
|
||||||
__separator = '/'
|
__separator = '/'
|
||||||
|
@ -49,17 +67,20 @@ class FilenameResolver:
|
||||||
self.__sys_path = sys_path
|
self.__sys_path = sys_path
|
||||||
self.__names_tuples = {}
|
self.__names_tuples = {}
|
||||||
self.__load()
|
self.__load()
|
||||||
|
# Load name_tuples if there is a csv
|
||||||
def __load(self):
|
def __load(self):
|
||||||
if (self.__sys_path / "filename_resolver.csv").is_file():
|
if (self.__sys_path / "filename_resolver.csv").is_file():
|
||||||
self.__resolve_buffer = (self.__sys_path / "filename_resolver.csv").read_text()
|
self.__resolve_buffer = (self.__sys_path / "filename_resolver.csv").read_text()
|
||||||
for line in self.__resolve_buffer.split('\n'):
|
for line in self.__resolve_buffer.split('\n'):
|
||||||
name_tuple = line.split(self.__separator)
|
name_tuple = line.split(self.__separator)
|
||||||
self.__names_tuples[name_tuple[1]] = int(name_tuple[0])
|
self.__names_tuples[name_tuple[1]] = int(name_tuple[0])
|
||||||
|
# Save the resolve_buffer containing formated name_tuples to the csv if not empty
|
||||||
def save(self):
|
def save(self):
|
||||||
if len(self.__resolve_buffer) > 0:
|
if len(self.__resolve_buffer) > 0:
|
||||||
logging.info(f"Writting {Path('sys/filename_resolver.csv')}")
|
logging.info(f"Writting {Path('sys/filename_resolver.csv')}")
|
||||||
(self.__sys_path / "filename_resolver.csv").write_text(self.__resolve_buffer[:-1])
|
(self.__sys_path / "filename_resolver.csv").write_text(self.__resolve_buffer[:-1])
|
||||||
# resolve generate a unique filename when unpacking
|
# Resolve generate a unique filename when unpacking
|
||||||
|
# return the filename or new generated filename if duplicated
|
||||||
def resolve_new(self, fileindex:int, filename:str):
|
def resolve_new(self, fileindex:int, filename:str):
|
||||||
if filename in self.__names_tuples:
|
if filename in self.__names_tuples:
|
||||||
i = 1
|
i = 1
|
||||||
|
@ -72,11 +93,12 @@ class FilenameResolver:
|
||||||
return new_filename
|
return new_filename
|
||||||
self.__names_tuples[filename] = fileindex
|
self.__names_tuples[filename] = fileindex
|
||||||
return filename
|
return filename
|
||||||
# Add new entry forcing the unpacked_filename²
|
# Add new entry forcing the unpacked_filename
|
||||||
def add(self, fileindex:int, unpacked_filename:str):
|
def add(self, fileindex:int, unpacked_filename:str):
|
||||||
self.__names_tuples[unpacked_filename] = fileindex
|
self.__names_tuples[unpacked_filename] = fileindex
|
||||||
self.__resolve_buffer += f"{fileindex}{self.__separator}{unpacked_filename}\n"
|
self.__resolve_buffer += f"{fileindex}{self.__separator}{unpacked_filename}\n"
|
||||||
# return generated filename if it exist else filename
|
# return previously generated filename using the index of the file in the TOC
|
||||||
|
# else return filename
|
||||||
def resolve_from_index(self, fileindex:int, filename:str):
|
def resolve_from_index(self, fileindex:int, filename:str):
|
||||||
for filename_key, fileindex_value in self.__names_tuples.items():
|
for filename_key, fileindex_value in self.__names_tuples.items():
|
||||||
if fileindex_value == fileindex:
|
if fileindex_value == fileindex:
|
||||||
|
@ -85,14 +107,23 @@ class FilenameResolver:
|
||||||
|
|
||||||
|
|
||||||
# http://wiki.xentax.com/index.php/GRAF:AFS_AFS
|
# http://wiki.xentax.com/index.php/GRAF:AFS_AFS
|
||||||
|
#########################################################################
|
||||||
|
# class: Afs
|
||||||
|
# DESCRIPTION Afs handle all operations needed by the command parser
|
||||||
|
#########################################################################
|
||||||
class Afs:
|
class Afs:
|
||||||
MAGIC_00 = b"AFS\x00"
|
MAGIC_00 = b"AFS\x00"
|
||||||
MAGIC_20 = b"AFS\x20"
|
MAGIC_20 = b"AFS\x20"
|
||||||
|
# The header and each files are aligned to 0x800
|
||||||
ALIGN = 0x800
|
ALIGN = 0x800
|
||||||
|
# magic number and number of files
|
||||||
HEADER_LEN = 8
|
HEADER_LEN = 8
|
||||||
|
# Each entry in the FD have 32 chars for filename and the rest for date and last_fd_attribute
|
||||||
FILENAMEDIRECTORY_ENTRY_LEN = 0x30
|
FILENAMEDIRECTORY_ENTRY_LEN = 0x30
|
||||||
__file_count = None
|
__file_count = None
|
||||||
|
# this offset is at the en of the TOC and sometimes there is pad
|
||||||
__filenamedirectory_offset_offset = None
|
__filenamedirectory_offset_offset = None
|
||||||
|
# if there is a FD at the end of the AFS
|
||||||
__filenamedirectory_offset = None
|
__filenamedirectory_offset = None
|
||||||
__filenamedirectory_len = None
|
__filenamedirectory_len = None
|
||||||
__filenamedirectory = None
|
__filenamedirectory = None
|
||||||
|
@ -145,14 +176,24 @@ class Afs:
|
||||||
if updated_fdlast_index < self.__file_count:
|
if updated_fdlast_index < self.__file_count:
|
||||||
self.__filenamedirectory[updated_fdlast_index*Afs.FILENAMEDIRECTORY_ENTRY_LEN+44:updated_fdlast_index*Afs.FILENAMEDIRECTORY_ENTRY_LEN+48] = self.__get_file_len(fileindex).to_bytes(4, "little")
|
self.__filenamedirectory[updated_fdlast_index*Afs.FILENAMEDIRECTORY_ENTRY_LEN+44:updated_fdlast_index*Afs.FILENAMEDIRECTORY_ENTRY_LEN+48] = self.__get_file_len(fileindex).to_bytes(4, "little")
|
||||||
# fd_last_attribute_type == unknown
|
# fd_last_attribute_type == unknown
|
||||||
|
# Add padding to align datas to next block
|
||||||
def __pad(self, data:bytes):
|
def __pad(self, data:bytes):
|
||||||
if len(data) % Afs.ALIGN != 0:
|
if len(data) % Afs.ALIGN != 0:
|
||||||
data += b"\x00" * (Afs.ALIGN - (len(data) % Afs.ALIGN))
|
data += b"\x00" * (Afs.ALIGN - (len(data) % Afs.ALIGN))
|
||||||
return data
|
return data
|
||||||
|
# We can't know if there is a FD without searching and loading data for it
|
||||||
|
# So we have to clean loaded data if values are invalid
|
||||||
def __clean_filenamedirectory(self):
|
def __clean_filenamedirectory(self):
|
||||||
self.__filenamedirectory = None
|
self.__filenamedirectory = None
|
||||||
self.__filenamedirectory_offset = None
|
self.__filenamedirectory_offset = None
|
||||||
self.__filenamedirectory_len = None
|
self.__filenamedirectory_len = None
|
||||||
|
# Load the TOC and the FD from an AFS file
|
||||||
|
# this operation is difficult because there are many cases possible:
|
||||||
|
# is there or not a FD?
|
||||||
|
# is there padding at the end of files offset/length list in the TOC?
|
||||||
|
# So we have to search and control values and test it for errors
|
||||||
|
# If there is no FD self.__filename_directory is None
|
||||||
|
# return True if there is a FD else None
|
||||||
def __loadsys_from_afs(self, afs_file, afs_len:int):
|
def __loadsys_from_afs(self, afs_file, afs_len:int):
|
||||||
self.__tableofcontent = afs_file.read(Afs.HEADER_LEN)
|
self.__tableofcontent = afs_file.read(Afs.HEADER_LEN)
|
||||||
if self.__get_magic() not in [Afs.MAGIC_00, Afs.MAGIC_20]:
|
if self.__get_magic() not in [Afs.MAGIC_00, Afs.MAGIC_20]:
|
||||||
|
@ -162,15 +203,20 @@ class Afs:
|
||||||
tableofcontent_len = len(self.__tableofcontent)
|
tableofcontent_len = len(self.__tableofcontent)
|
||||||
|
|
||||||
offset = tableofcontent_len
|
offset = tableofcontent_len
|
||||||
|
# Now we have read the TOC and seeked to the end of it
|
||||||
|
# next values could be FD offset and length if there is one
|
||||||
|
|
||||||
|
# So we read 4 bytes to test if there is padding or not
|
||||||
tmp_block = int.from_bytes(afs_file.read(4), "little")
|
tmp_block = int.from_bytes(afs_file.read(4), "little")
|
||||||
if tmp_block != 0:
|
if tmp_block != 0:
|
||||||
self.__filenamedirectory_offset_offset = offset
|
self.__filenamedirectory_offset_offset = offset
|
||||||
self.__filenamedirectory_offset = tmp_block
|
self.__filenamedirectory_offset = tmp_block
|
||||||
|
# Here it could be padding
|
||||||
|
# If filenamedirectory_offset is not directly after the files offsets and lens
|
||||||
|
# --> we search the next uint32 != 0
|
||||||
else:
|
else:
|
||||||
# If filenamedirectory_offset is not directly after the files offsets and lens
|
|
||||||
# --> we search the next uint32 != 0
|
|
||||||
offset += 4
|
offset += 4
|
||||||
|
# We read by 0x800 blocks for better performances
|
||||||
block_len = 0x800
|
block_len = 0x800
|
||||||
tmp_block = afs_file.read(block_len)
|
tmp_block = afs_file.read(block_len)
|
||||||
while tmp_block:
|
while tmp_block:
|
||||||
|
@ -207,8 +253,10 @@ class Afs:
|
||||||
return False
|
return False
|
||||||
|
|
||||||
afs_file.seek(tableofcontent_len)
|
afs_file.seek(tableofcontent_len)
|
||||||
|
# Here FD is valid and we read it's length
|
||||||
self.__tableofcontent += afs_file.read(self.__filenamedirectory_offset_offset+8 - tableofcontent_len)
|
self.__tableofcontent += afs_file.read(self.__filenamedirectory_offset_offset+8 - tableofcontent_len)
|
||||||
return True
|
return True
|
||||||
|
# Load the TOC and FD from an unpacked afs. This time it's easier
|
||||||
def __loadsys_from_folder(self, sys_path:Path):
|
def __loadsys_from_folder(self, sys_path:Path):
|
||||||
self.__tableofcontent = bytearray( (sys_path / "tableofcontent.bin").read_bytes() )
|
self.__tableofcontent = bytearray( (sys_path / "tableofcontent.bin").read_bytes() )
|
||||||
self.__file_count = self.__get_file_count()
|
self.__file_count = self.__get_file_count()
|
||||||
|
@ -221,6 +269,7 @@ class Afs:
|
||||||
self.__filenamedirectory_len = self.__get_filenamedirectory_len()
|
self.__filenamedirectory_len = self.__get_filenamedirectory_len()
|
||||||
if self.__filenamedirectory_len != len(self.__filenamedirectory):
|
if self.__filenamedirectory_len != len(self.__filenamedirectory):
|
||||||
raise AfsInvalidFilenameDirectoryLengthError("Error - Tableofcontent filenamedirectory length does not match real filenamedirectory length.")
|
raise AfsInvalidFilenameDirectoryLengthError("Error - Tableofcontent filenamedirectory length does not match real filenamedirectory length.")
|
||||||
|
# Print is used for stats
|
||||||
def __print(self, title:str, lines_tuples, columns:list = list(range(7)), infos:str = ""):
|
def __print(self, title:str, lines_tuples, columns:list = list(range(7)), infos:str = ""):
|
||||||
stats_buffer = "#"*100+f"\n# {title}\n"+"#"*100+f"\n{infos}|"+"-"*99+"\n"
|
stats_buffer = "#"*100+f"\n# {title}\n"+"#"*100+f"\n{infos}|"+"-"*99+"\n"
|
||||||
if 0 in columns: stats_buffer += "| Index ";
|
if 0 in columns: stats_buffer += "| Index ";
|
||||||
|
@ -234,6 +283,7 @@ class Afs:
|
||||||
for line in lines_tuples:
|
for line in lines_tuples:
|
||||||
stats_buffer += line if type(line) == str else "| "+" | ".join(line)+"\n"
|
stats_buffer += line if type(line) == str else "| "+" | ".join(line)+"\n"
|
||||||
print(stats_buffer, end='')
|
print(stats_buffer, end='')
|
||||||
|
# This method is used to check the next file offset and control if there is overlapping during pack
|
||||||
# end offset not included (0,1) -> len=1
|
# end offset not included (0,1) -> len=1
|
||||||
# return a list of offsets where files and sys files begin
|
# return a list of offsets where files and sys files begin
|
||||||
def __get_offsets_map(self):
|
def __get_offsets_map(self):
|
||||||
|
@ -256,6 +306,7 @@ class Afs:
|
||||||
last_tuple = offsets_tuple
|
last_tuple = offsets_tuple
|
||||||
offsets_map[i] = offsets_tuple[0]
|
offsets_map[i] = offsets_tuple[0]
|
||||||
return offsets_map
|
return offsets_map
|
||||||
|
# This method is used for stats command
|
||||||
# end offset not included (0,1) -> len=1
|
# end offset not included (0,1) -> len=1
|
||||||
def __get_formated_map(self):
|
def __get_formated_map(self):
|
||||||
files_map = [("SYS TOC ", "00000000", f"{len(self.__tableofcontent):08x}", f"{len(self.__tableofcontent):08x}", "SYS TOC"+' '*12, "SYS TOC ", "SYS TOC")]
|
files_map = [("SYS TOC ", "00000000", f"{len(self.__tableofcontent):08x}", f"{len(self.__tableofcontent):08x}", "SYS TOC"+' '*12, "SYS TOC ", "SYS TOC")]
|
||||||
|
@ -273,6 +324,13 @@ class Afs:
|
||||||
f"{self.__filenamedirectory_offset + len(self.__filenamedirectory):08x}", \
|
f"{self.__filenamedirectory_offset + len(self.__filenamedirectory):08x}", \
|
||||||
f"{len(self.__filenamedirectory):08x}", "SYS FD"+' '*13, "SYS FD ", "SYS FD"))
|
f"{len(self.__filenamedirectory):08x}", "SYS FD"+' '*13, "SYS FD ", "SYS FD"))
|
||||||
return files_map
|
return files_map
|
||||||
|
# At this end of the FD there is 4 bytes used for different purposes
|
||||||
|
# To keep data we search what kind of data it is:
|
||||||
|
# return one of this values:
|
||||||
|
# * length
|
||||||
|
# * offset-length
|
||||||
|
# * 0x123 # (hex constant)
|
||||||
|
# * unknwon
|
||||||
def __get_fdlast_type(self):
|
def __get_fdlast_type(self):
|
||||||
# Try to get the type of FD last attribute
|
# Try to get the type of FD last attribute
|
||||||
length_type = True
|
length_type = True
|
||||||
|
@ -292,6 +350,11 @@ class Afs:
|
||||||
if constant_type: return f"0x{constant_type:x}"
|
if constant_type: return f"0x{constant_type:x}"
|
||||||
logging.info("Unknown FD last attribute type.")
|
logging.info("Unknown FD last attribute type.")
|
||||||
return "unknown"
|
return "unknown"
|
||||||
|
# At the end of unpack we use this function to write the 2 files:
|
||||||
|
# * "sys/afs_rebuild.csv"
|
||||||
|
# * "sys/afs_rebuild.csv"
|
||||||
|
# this file will contains every parameters of the AFS to allow exact pack copy when possible (fd_last_atribute != unknown)
|
||||||
|
# see documentation for further informations
|
||||||
def __write_rebuild_config(self, sys_path:Path, resolver:FilenameResolver):
|
def __write_rebuild_config(self, sys_path:Path, resolver:FilenameResolver):
|
||||||
config = ConfigParser(allow_no_value=True) # allow_no_value to allow adding comments
|
config = ConfigParser(allow_no_value=True) # allow_no_value to allow adding comments
|
||||||
config.optionxform = str # makes options case sensitive
|
config.optionxform = str # makes options case sensitive
|
||||||
|
@ -315,6 +378,7 @@ class Afs:
|
||||||
rebuild_csv += f"{unpacked_filename}/0x{i:x}/0x{self.__get_file_offset(i):x}/{filename}\n"
|
rebuild_csv += f"{unpacked_filename}/0x{i:x}/0x{self.__get_file_offset(i):x}/{filename}\n"
|
||||||
if len(rebuild_csv) > 0:
|
if len(rebuild_csv) > 0:
|
||||||
(sys_path / "afs_rebuild.csv").write_text(rebuild_csv[:-1])
|
(sys_path / "afs_rebuild.csv").write_text(rebuild_csv[:-1])
|
||||||
|
# Method used to unpack an AFS inside a folder
|
||||||
def unpack(self, afs_path:Path, folder_path:Path):
|
def unpack(self, afs_path:Path, folder_path:Path):
|
||||||
sys_path = folder_path / "sys"
|
sys_path = folder_path / "sys"
|
||||||
root_path = folder_path / "root"
|
root_path = folder_path / "root"
|
||||||
|
@ -351,6 +415,9 @@ class Afs:
|
||||||
if self.__filenamedirectory:
|
if self.__filenamedirectory:
|
||||||
resolver.save()
|
resolver.save()
|
||||||
self.__write_rebuild_config(sys_path, resolver)
|
self.__write_rebuild_config(sys_path, resolver)
|
||||||
|
# Methood used to pack un unpacked folder inside a new AFS file
|
||||||
|
# for a file pack will use the next file offset as max file length an raise an exception if the length overlap
|
||||||
|
# pack keep FD and TOC inchanged except for file length and FD dates updates
|
||||||
def pack(self, folder_path:Path, afs_path:Path = None):
|
def pack(self, folder_path:Path, afs_path:Path = None):
|
||||||
if afs_path is None:
|
if afs_path is None:
|
||||||
afs_path = folder_path / Path(folder_path.name).with_suffix(".afs")
|
afs_path = folder_path / Path(folder_path.name).with_suffix(".afs")
|
||||||
|
@ -401,6 +468,10 @@ class Afs:
|
||||||
logging.debug(f"Packing {sys_path / 'tableofcontent.bin'} at the beginning of the AFS.")
|
logging.debug(f"Packing {sys_path / 'tableofcontent.bin'} at the beginning of the AFS.")
|
||||||
afs_file.seek(0)
|
afs_file.seek(0)
|
||||||
afs_file.write(self.__tableofcontent)
|
afs_file.write(self.__tableofcontent)
|
||||||
|
# Rebuild will use following config files:
|
||||||
|
# * "sys/afs_rebuild.csv"
|
||||||
|
# * "sys/afs_rebuild.csv"
|
||||||
|
# It will rebuild the unpacked AFS sys files (TOC and FD) in the sys folder
|
||||||
def rebuild(self, folder_path:Path):
|
def rebuild(self, folder_path:Path):
|
||||||
config = ConfigParser()
|
config = ConfigParser()
|
||||||
root_path = folder_path / "root"
|
root_path = folder_path / "root"
|
||||||
|
@ -596,6 +667,10 @@ class Afs:
|
||||||
(sys_path / "filenamedirectory.bin").write_bytes(self.__filenamedirectory)
|
(sys_path / "filenamedirectory.bin").write_bytes(self.__filenamedirectory)
|
||||||
logging.info(f"Writting {Path('sys/tableofcontent.bin')}")
|
logging.info(f"Writting {Path('sys/tableofcontent.bin')}")
|
||||||
(sys_path / "tableofcontent.bin").write_bytes(self.__tableofcontent)
|
(sys_path / "tableofcontent.bin").write_bytes(self.__tableofcontent)
|
||||||
|
# Stats will print the AFS stats:
|
||||||
|
# Get full informations about header, TOC, FD, full memory mapping
|
||||||
|
# sorted by offsets (files and sys files), addresses space informations,
|
||||||
|
# and duplicated filenames grouped by filenames.
|
||||||
def stats(self, path:Path):
|
def stats(self, path:Path):
|
||||||
if path.is_file():
|
if path.is_file():
|
||||||
with path.open("rb") as afs_file:
|
with path.open("rb") as afs_file:
|
||||||
|
|
Loading…
Reference in New Issue
Block a user