pythonlib/games/ToolsTOR.py

import io
import json
import os
import re
import shutil
import struct
from dataclasses import dataclass
from itertools import tee
from pathlib import Path

import lxml.etree as etree
import pandas as pd
import pycdlib
from tqdm import tqdm
from pythonlib.formats.FileIO import FileIO
from pythonlib.formats.pak import Pak
from pythonlib.formats.scpk import Scpk

import pythonlib.utils.comptolib as comptolib
import pythonlib.formats.pak2 as pak2lib
from pythonlib.formats.theirsce import Theirsce
from pythonlib.formats.theirsce_instructions import (AluOperation, InstructionType,
                                                     TheirsceBaseInstruction)
from .ToolsTales import ToolsTales


@dataclass
class LineEntry:
    """One text string collected while walking a THEIRSCE script."""
    # Decoded speaker name(s) attached to this line; empty list when none was found
    names: list[str]
    # Decoded text of the line
    text: str
    # Value emitted as the XML <PointerOffset> (the extractor passes `position + 1` of a STRING opcode)
    offset: int

@dataclass
class NameEntry:
    """A speaker name's XML id together with every pointer location that uses it."""
    # Id written to the speaker's <Id> node and referenced by <SpeakerId> in line entries
    index: int
    # Pointer locations (STRING opcode `position + 1`) of each occurrence of the name
    offsets: list[int]


VARIABLE_NAME = "[VARIABLE]"

class ToolsTOR(ToolsTales):
    
    POINTERS_BEGIN = 0xD76B0                                            # Offset to DAT.BIN pointer list start in SLPS_254.50 file
    POINTERS_END   = 0xE60C8                                            # Offset to DAT.BIN pointer list end in SLPS_254.50 file
    HIGH_BITS      = 0xFFFFFFC0
    LOW_BITS       = 0x3F
    
    
    # Paths used
    # fmt: off
    dat_bin_original    = '../Data/Tales-Of-Rebirth/Disc/Original/DAT.BIN'
    dat_bin_new         = '../Data/Tales-Of-Rebirth/Disc/New/DAT.BIN'
    elf_original        = '../Data/Tales-Of-Rebirth/Disc/Original/SLPS_254.50'
    elf_new             = '../Data/Tales-Of-Rebirth/Disc/New/SLPS_254.50'
    story_XML_new       = '../Tales-Of-Rebirth/Data/TOR/Story/'                        #Story XML files will be extracted here                      
    story_XML_patch     = '../Data/Tales-Of-Rebirth/Story/'               #Story XML files will be extracted here
    skit_XML_patch      = '../Data/Tales-Of-Rebirth/Skits/'                        #Skits XML files will be extracted here
    menu_XML_patch      = '../Tales-Of-Rebirth/Data/TOR/Menu/'
    skit_XML_new        = '../Tales-Of-Rebirth/Data/TOR/Skits/'
    dat_archive_extract = '../Data/Tales-Of-Rebirth/DAT/' 
    # fmt: on
    
    def __init__(self, project_file: Path) -> None:
        """Load the project description and the text encoding tables.

        Args:
            project_file: JSON project file. Its ``paths`` entries are resolved
                relative to the folder containing the project file, and its
                ``main_exe_name`` names the game executable.
        """
        project_dir = project_file.parent
        self.jsonTblTags = {}
        self.ijsonTblTags = {}

        with open(project_file, encoding="utf-8") as handle:
            project = json.load(handle)

        self.paths: dict[str, Path] = {
            key: project_dir / relative for key, relative in project["paths"].items()
        }
        self.main_exe_name = project["main_exe_name"]

        # NOTE: the ToolsTales initializer is not called here.

        with open(self.paths["encoding_table"], encoding="utf-8") as handle:
            tables = json.load(handle)

        # Table keys are stored as hexadecimal strings in the JSON file
        for table_name, table in tables.items():
            self.jsonTblTags[table_name] = {
                int(code, 16): symbol for code, symbol in table.items()
            }

        # Reverse lookup (symbol -> code) for every table
        for table_name, table in self.jsonTblTags.items():
            self.ijsonTblTags[table_name] = {
                symbol: code for code, symbol in table.items()
            }

        # Running entry id used while building the XML files
        self.id = 1
        # byteCode
        self.story_byte_code = b"\xF8"
        self.string_opcode = InstructionType.STRING
        # Entry statuses for which the English text is inserted
        self.list_status_insertion: list[str] = ['Done', 'Proofreading', 'Editing']


    # Extract the story files
    def extract_all_story(self, replace=False) -> None:
        """Dump every extracted SCPK story file to an XML file.

        Reads ``*.scpk`` from ``<extracted_files>/DAT/SCPK`` and writes one XML
        per file into the ``story_xml`` folder (created if missing).

        Args:
            replace: Currently unused; kept for interface compatibility.
        """
        print("Extracting Story files...")

        folder_path = self.paths["story_xml"]
        folder_path.mkdir(parents=True, exist_ok=True)
        scpk_path = self.paths["extracted_files"] / "DAT" / "SCPK"

        for file in tqdm(list(scpk_path.glob("*.scpk"))):
            # Entry ids restart at 1 for every file; resetting *before* the
            # dump keeps the first file independent from any earlier extraction
            self.id = 1
            theirsce = Theirsce(Scpk.from_path(file).rsce)
            xml_text = self.get_xml_from_theirsce(theirsce, "Story")

            with open(folder_path / file.with_suffix(".xml").name, "wb") as xml:
                xml.write(xml_text)

        # Leave the counter in its initial state for whoever runs next
        self.id = 1

            
    # Extract all the skits files
    def extract_all_skits(self, replace=False) -> None:
        """Dump every extracted PAK2 skit file to an XML file.

        Reads ``*.pak2`` from ``<extracted_files>/DAT/PAK2`` and writes one XML
        per file into the ``skit_xml`` folder (created if missing). The XML
        name is the part of the file name before its first dot.

        Args:
            replace: Currently unused; kept for interface compatibility.
        """
        print("Extracting Skit files...")

        folder_path = self.paths["skit_xml"]
        folder_path.mkdir(parents=True, exist_ok=True)
        pak2_path = self.paths["extracted_files"] / "DAT" / "PAK2"

        for file in tqdm(list(pak2_path.glob("*.pak2"))):
            with open(file, "rb") as pak:
                theirsce = pak2lib.get_theirsce_from_pak2(pak.read())

            # Restart entry ids for each file (as the story extraction does);
            # otherwise the ids depend on glob order and on previous runs
            self.id = 1
            xml_text = self.get_xml_from_theirsce(Theirsce(theirsce), "Skits")

            xml_name = file.name.split(".")[0] + ".xml"
            with open(folder_path / xml_name, "wb") as xml:
                xml.write(xml_text)

        # Leave the counter in its initial state for whoever runs next
        self.id = 1


    # Extract THEIRSCE to XML
    def get_xml_from_theirsce(self, rsce: Theirsce, section: str) -> bytes:
        """Build the translation XML for one THEIRSCE script.

        Args:
            rsce: Script to dump.
            section: Text written in the ``Section`` node of the ``Strings`` group.

        Returns:
            The pretty-printed, UTF-8 encoded XML document.
        """
        speakers, dialog_lines = self.extract_lines_with_speaker(rsce)

        # Number the speakers in insertion order, starting at -1
        for speaker_id, speaker in enumerate(list(speakers), start=-1):
            speakers[speaker] = NameEntry(speaker_id, speakers[speaker])

        scene = etree.Element("SceneText")

        def add_group(tag: str, title: str):
            # A group is a container node whose first child names the section
            group = etree.SubElement(scene, tag)
            etree.SubElement(group, 'Section').text = title
            return group

        speakers_node = add_group('Speakers', "Speaker")
        strings_node = add_group('Strings', section)

        self.make_speakers_section(speakers_node, speakers)
        self.make_strings_section(strings_node, dialog_lines, speakers)

        return etree.tostring(scene, encoding="UTF-8", pretty_print=True)

    
    def make_strings_section(self, root, lines: list[LineEntry], names: dict[str, NameEntry]):
        """Append one ``Entry`` node per extracted line under ``root``.

        Args:
            root: XML node receiving the entries.
            lines: Extracted lines, in output order.
            names: Speaker table used to translate speaker names into ids.

        Side effects:
            ``self.id`` is incremented once per entry written.
        """
        for line in lines:
            entry = etree.SubElement(root, "Entry")
            etree.SubElement(entry, "PointerOffset").text = str(line.offset)

            # Split on tags and drop empty/None pieces
            pieces = [piece for piece in re.split(self.COMMON_TAG, line.text) if piece]

            # A leading <voice:...> tag is moved to its own VoiceId node
            if len(pieces) > 1 and pieces[0].startswith("<voice:"):
                voice_tag, *remaining = pieces
                etree.SubElement(entry, "VoiceId").text = voice_tag[1:-1].split(":")[1]
                japanese = ''.join(remaining)
            else:
                japanese = line.text
            etree.SubElement(entry, "JapaneseText").text = japanese

            etree.SubElement(entry, "EnglishText")
            etree.SubElement(entry, "Notes")

            if line.names:
                speaker_ids = [str(names[speaker].index) for speaker in line.names]
                etree.SubElement(entry, "SpeakerId").text = ','.join(speaker_ids)

            etree.SubElement(entry, "Id").text = str(self.id)
            self.id += 1

            # Empty strings have nothing to translate
            etree.SubElement(entry, "Status").text = 'Done' if line.text == '' else 'To Do'
        
    
    def make_speakers_section(self, root, names: dict[str, NameEntry]):
        """Append one ``Entry`` node per speaker under ``root``.

        Args:
            root: XML node receiving the entries.
            names: Speaker name -> ``NameEntry`` (id and pointer locations).
        """
        for speaker, info in names.items():
            entry = etree.SubElement(root, "Entry")

            # The PointerOffset node is left without text when there are no offsets
            pointer_node = etree.SubElement(entry, "PointerOffset")
            if info.offsets:
                pointer_node.text = ",".join(map(str, info.offsets))

            etree.SubElement(entry, "JapaneseText").text = str(speaker)
            etree.SubElement(entry, "EnglishText")
            etree.SubElement(entry, "Notes")
            etree.SubElement(entry, "Id").text = str(info.index)
            etree.SubElement(entry, "Status").text = "To Do"

    
    def extract_lines_with_speaker(self, theirsce: Theirsce):
        """Walk the script bytecode and collect every string with its speaker.

        The instruction stream is inspected three consecutive instructions at
        a time to recognise string assignments to local variables and the
        different forms of the textbox syscall (function index 0x45).

        Args:
            theirsce: Script to scan.

        Returns:
            A ``(names, lines)`` tuple. ``names`` maps each decoded speaker
            name to the list of pointer locations (STRING ``position + 1``)
            where it appears; it always contains the ``VARIABLE_NAME`` key.
            ``lines`` is the list of ``LineEntry`` found, in walk order.
        """
        # Placeholder returned by next() once an iterator is exhausted
        d = TheirsceBaseInstruction()
        d.type = InstructionType.INVALID

        # Three staggered views over the same instruction stream, so each
        # zip() step yields three consecutive instructions (op1, op2, op3)
        a, b, c = tee(theirsce.walk_code(), 3)
        next(a, d)
        next(b, d); next(b, d)
        next(c, d); next(c, d); next(c, d)

        def skip():
            # Consume the two instructions that followed op1 in a matched
            # three-instruction pattern so they are not examined again
            next(a, d); next(a, d)
            next(b, d); next(b, d)
            next(c, d); next(c, d)

        def decode(op) -> str:
            # Decode the string referenced by a STRING instruction
            return self.bytes_to_text(theirsce, op.offset + theirsce.strings_offset)

        names = {VARIABLE_NAME: []}
        lines = []
        params = []
        # NOTE(review): `used` is never set back to False, so after the first
        # variable-based textbox call unused params are dropped at BREAK
        # instead of being emitted — confirm whether that is intended.
        used = False
        for op1, op2, op3 in zip(a, b, c):
            # BREAK marks start of a local function
            # so local params are no longer in scope
            if op1.type is InstructionType.BREAK:
                if not used:
                    for param in params:
                        # Each string must be recorded at the location of its
                        # own STRING operand (not at the BREAK opcode), since
                        # that location is where the pointer is rewritten on
                        # reinsertion
                        lines.append(LineEntry([], decode(param), param.position + 1))
                params.clear()
                continue

            # This sequence mark the simple act of assigning
            # a string to a local variable, so we can detect
            # when they are used later in a function call
            if (op1.type is InstructionType.REFERENCE
                and op2.type is InstructionType.STRING
                and op3.type is InstructionType.ALU
                and op3.operation == AluOperation.ASSIGNMENT
                ):
                params.append(op2)
                skip()
                continue

            # This sequence represents the textbox call with
            # the name being a variable (NPCs do this)
            if (op1.type is InstructionType.REFERENCE
                and op2.type is InstructionType.STRING
                and op3.type is InstructionType.SYSCALL
                and op3.function_index == 0x45
                ):
                if len(params) >= 1:
                    name = [decode(p) for p in params]
                    for n, p in zip(name, params):
                        names.setdefault(n, []).append(p.position + 1)
                else:
                    name = []
                text = decode(op2)
                lines.append(LineEntry(name, text, op2.position + 1))
                used = True
                skip()
                continue

            # This sequence represents the textbox call with
            # the text being a variable (Notice boxes do this)
            if (op1.type is InstructionType.STRING
                and op2.type is InstructionType.REFERENCE
                and op3.type is InstructionType.SYSCALL
                and op3.function_index == 0x45
                ):
                name = [decode(op1)]
                names.setdefault(name[0], []).append(op1.position + 1)
                for param in params:
                    lines.append(LineEntry(name, decode(param), param.position + 1))
                used = True
                params.clear()
                skip()
                continue

            # This sequence represents a regular textbox call
            # where both fields are a string (everything else, save for skits)
            if (op1.type is InstructionType.STRING
                and op2.type is InstructionType.STRING
                and op3.type is InstructionType.SYSCALL
                and op3.function_index == 0x45
                ):
                name = [decode(op1)]
                names.setdefault(name[0], []).append(op1.position + 1)
                text = decode(op2)
                lines.append(LineEntry(name, text, op2.position + 1))
                skip()
                continue

            # Any other string in assorted code calls
            if op1.type is InstructionType.STRING:
                lines.append(LineEntry([], decode(op1), op1.position + 1))
                continue

        return names, lines


    def extract_story_pointers_plain(self, theirsce: Theirsce):
        """List every string instruction of a script without speaker detection.

        Args:
            theirsce: Script to scan.

        Returns:
            ``(pointers_offset, texts_offset)``: for each string instruction,
            the stream position minus 2 at the time it is yielded, and the
            instruction offset plus ``theirsce.strings_offset``.
        """
        pointers_offset = []
        texts_offset = []

        for opcode in theirsce.walk_code():
            if opcode.type != self.string_opcode:
                continue
            pointers_offset.append(theirsce.tell() - 2)  # Maybe check this later
            texts_offset.append(opcode.offset + theirsce.strings_offset)

        return pointers_offset, texts_offset

    #Convert a bytes object to text using TAGS and TBL in the json file
    def bytes_to_text(self, src: FileIO, offset: int = -1) -> str:
        """Decode one NUL-terminated game string using the TBL/TAGS tables.

        Args:
            src: Stream to read from.
            offset: Absolute position of the string. A negative value (the
                default) reads from the current position; 0 is a valid
                position and is honoured.

        Returns:
            The decoded text. Bytes that match no rule are written as
            ``{XX}`` hex escapes and tags as ``<name>`` / ``<name:param>``.
            Reaching the end of the stream ends the string like a NUL does.
        """
        tags = self.jsonTblTags['TAGS']
        chars = self.jsonTblTags['TBL']

        if offset >= 0:
            src.seek(offset, 0)

        # Collect the pieces and join once instead of growing a string
        parts: list[str] = []
        while True:
            raw = src.read(1)
            # An empty read means end of stream: stop instead of crashing in ord()
            if not raw or raw == b"\x00":
                break

            b = raw[0]
            # Custom Encoded Text
            if (0x99 <= b <= 0x9F) or (0xE0 <= b <= 0xEB):
                c = (b << 8) | src.read_uint8()
                parts.append(chars.get(c, "{%02X}{%02X}" % (c >> 8, c & 0xFF)))
                continue

            if b == 0x1:
                parts.append("\n")
                continue

            # ASCII text
            if chr(b) in self.PRINTABLE_CHARS:
                parts.append(chr(b))
                continue

            # cp932 text
            if 0xA0 < b < 0xE0:
                parts.append(struct.pack("B", b).decode("cp932"))
                continue

            if b == 0x81:
                next_b = src.read(1)
                if next_b == b"\x40":
                    parts.append("　")
                elif not next_b:
                    # Stream ended in the middle of the two-byte sequence
                    parts.append("{%02X}" % b)
                    break
                else:
                    parts.append("{%02X}" % b)
                    parts.append("{%02X}" % ord(next_b))
                continue

            # Simple Tags
            if 0x3 <= b <= 0xF:
                parameter = src.read_uint32()

                tag_name = tags.get(b, f"{b:02X}")
                # A table named after the tag may give the parameter a readable name
                tag_param = self.jsonTblTags.get(tag_name.upper(), {}).get(parameter, None)

                if tag_param is not None:
                    parts.append(f"<{tag_param}>")
                else:
                    parts.append(f"<{tag_name}:{parameter:X}>")

                continue

            # Variable tags (same as above but using rsce bytecode as parameter)
            if 0x13 <= b <= 0x1A:
                tag_name = f"unk{b:02X}"
                parameter = "".join([f"{c:02X}" for c in Theirsce.read_tag_bytes(src)])

                parts.append(f"<{tag_name}:{parameter}>")
                continue

            # None of the above
            parts.append("{%02X}" % b)

        return "".join(parts)
    
    def get_node_bytes(self, entry_node):
        """Encode the text of one XML ``Entry`` node for reinsertion.

        The English text is used when the entry status is one of
        ``self.list_status_insertion`` and it is non-empty; otherwise the
        Japanese text is used. A ``VoiceId`` node, when present, is put back
        as a leading ``<voice:...>`` tag.

        Args:
            entry_node: ``Entry`` element with ``Status``, ``JapaneseText``
                and ``EnglishText`` children.

        Returns:
            Whatever ``self.text_to_bytes`` returns for the chosen text.
        """
        status = entry_node.find("Status").text
        japanese = entry_node.find("JapaneseText").text
        english = entry_node.find("EnglishText").text

        if status in self.list_status_insertion:
            chosen = english or japanese or ''
        else:
            chosen = japanese or ''

        voice_node = entry_node.find("VoiceId")
        if voice_node is not None:
            chosen = f"<voice:{voice_node.text}>{chosen}"

        # Convert the text values to bytes using TBL, TAGS, COLORS, ...
        return self.text_to_bytes(chosen)
    
    
    def get_new_theirsce(self, theirsce: Theirsce, xml: Path) -> Theirsce:
        """Write the texts of an XML file back into a script and fix its pointers.

        Strings are written one after another starting at
        ``theirsce.strings_offset + 1``; afterwards every location listed in
        an entry's ``PointerOffset`` receives the new string offset as a
        little-endian 16-bit value relative to ``theirsce.strings_offset``.

        Args:
            theirsce: Script to modify in place.
            xml: XML file holding the entries for this script.

        Returns:
            The same ``theirsce`` object, modified.
        """
        root = etree.parse(xml).getroot()

        # Go at the start of the dialog
        theirsce.seek(theirsce.strings_offset + 1)

        # Entries flagged with "-1" (as Id or as PointerOffset) are not reinserted
        entries = [node for node in root.iter('Entry') if node.find('Id').text != "-1"]
        entries = [node for node in entries if node.find('PointerOffset').text != "-1"]

        # PointerOffset field -> absolute position of the rewritten string
        relocated = {}
        for node in entries:
            relocated[node.find("PointerOffset").text] = theirsce.tell()
            theirsce.write(self.get_node_bytes(node) + b'\x00')

        # Update the pointers based on the new position of the entries
        for pointer_field, absolute in relocated.items():
            targets = pointer_field.split(",")
            packed = struct.pack("<H", absolute - theirsce.strings_offset)
            for target in targets:
                theirsce.seek(int(target))
                theirsce.write(packed)

        return theirsce
    

    def pack_all_skits(self):
        """Rebuild every skit PAK2 file from its XML.

        For each ``*.pak2`` in ``<extracted_files>/DAT/PAK2`` the script chunk
        is rewritten from the matching XML in ``skit_xml`` and the resulting
        PAK2 is written to ``<temp_files>/DAT/PAK2`` under the same name.
        """
        print("Recreating Skit files...")

        out_path = self.paths["temp_files"] / "DAT" / "PAK2"
        out_path.mkdir(parents=True, exist_ok=True)
        xml_path = self.paths["skit_xml"]
        pak2_path = self.paths["extracted_files"] / "DAT" / "PAK2"

        for file in (pbar := tqdm(list(pak2_path.glob("*.pak2")))):
            pbar.set_description_str(file.name)

            pak2_obj = pak2lib.get_data(file.read_bytes())

            # The XML shares the part of the file name before the first dot
            xml_file = xml_path / (file.name.split(".")[0] + ".xml")
            rebuilt = self.get_new_theirsce(Theirsce(pak2_obj.chunks.theirsce), xml_file)
            rebuilt.seek(0)
            pak2_obj.chunks.theirsce = rebuilt.read()

            with open(out_path / file.name, "wb") as target:
                target.write(pak2lib.create_pak2(pak2_obj))

    def debug_Story_Skits(self, section, file_name, text=False):
        """Dump one script and a spreadsheet of its string pointers for debugging.

        Writes ``../<file_name>.theirsce`` with the raw script and
        ``../<name>.xlsx`` with one row per string instruction.

        Args:
            section: ``"Story"`` reads the script from an SCPK file; any other
                value reads it from ``<name>.3.pak2``.
            file_name: Name of the file to inspect.
            text: When true, the ``Jap_Text`` column holds the decoded
                strings; otherwise it is left empty.
        """
        if section == "Story":
            theirsce = self.get_theirsce_from_scpk(self.dat_archive_extract + 'SCPK/' + self.get_file_name(file_name) + '.scpk')
        else:
            with open(self.dat_archive_extract + "PAK2/" + file_name.split(".")[0] + '.3.pak2', "rb") as pak:
                data = pak.read()
            theirsce = io.BytesIO(pak2lib.get_theirsce_from_pak2(data))

        rsce = Theirsce(path=theirsce)

        # The spreadsheet needs both the pointer and the text offsets; the
        # plain extraction provides them as two lists of equal length
        pointers_offset, texts_offset = self.extract_story_pointers_plain(rsce)

        with open('../{}.theirsce'.format(file_name), 'wb') as f:
            f.write(theirsce.getvalue())

        if text:
            text_list = [self.bytes_to_text(rsce, off) for off in texts_offset]
        else:
            # Keep the column the same length as the offset columns
            text_list = [""] * len(texts_offset)

        # All three columns must exist before they are reformatted below;
        # previously only Jap_Text was created and the lookups raised KeyError
        df = pd.DataFrame({
            "Jap_Text": text_list,
            "Text_Offset": texts_offset,
            "Pointers_Offset": pointers_offset,
        })
        df['Text_Offset'] = df['Text_Offset'].apply(lambda x: hex(x)[2:])
        df['Pointers_Offset'] = df['Pointers_Offset'].apply(lambda x: hex(x)[2:])
        df.to_excel('../{}.xlsx'.format(self.get_file_name(file_name)), index=False)

            
    def get_datbin_file_data(self) -> list[tuple[int, int]]:
        """Read the DAT.BIN file table stored in the game executable.

        The table is the run of little-endian 32-bit values between
        ``POINTERS_BEGIN`` and ``POINTERS_END``. In each value the bits under
        ``HIGH_BITS`` give a file start and the bits under ``LOW_BITS`` are
        subtracted from the distance to the next start to obtain the size.

        Returns:
            One ``(start, size)`` tuple per pair of consecutive table values.
        """
        exe_path = self.paths["original_files"] / self.main_exe_name
        with open(exe_path, "rb") as exe:
            exe.seek(self.POINTERS_BEGIN, 0)
            table = exe.read(self.POINTERS_END - self.POINTERS_BEGIN)

        raw_pointers = struct.unpack(f"<{len(table)//4}I", table)

        def span(current: int, following: int) -> tuple[int, int]:
            # Low bits of the current value shorten the distance to the next start
            padding = current & self.LOW_BITS
            begin = current & self.HIGH_BITS
            finish = (following & self.HIGH_BITS) - padding
            return (begin, finish - begin)

        return [span(cur, nxt) for cur, nxt in zip(raw_pointers[:-1], raw_pointers[1:])]

    # Extract the contents of DAT.BIN into per-extension directories
    def extract_main_archive(self) -> None:
        """Split DAT.BIN into individual files under ``<extracted_files>/DAT``.

        Each file is written into a sub-folder named after its upper-cased
        extension as ``NNNNN.<ext>``, or ``NNNNN.<type>.<ext>`` when it was
        stored compressed (``<type>`` being its first byte read as a signed
        value). The target folder is emptied first.
        """
        dat_bin_path = self.paths["extracted_files"] / "DAT"

        # clean_folder lists the folder, so it has to exist beforehand
        dat_bin_path.mkdir(parents=True, exist_ok=True)
        self.clean_folder(dat_bin_path)

        print("Extracting DAT.BIN files...")
        # DAT.BIN is read from the project's original files, the same place
        # the executable holding its file table is read from
        with open(self.paths["original_files"] / "DAT.BIN", "rb") as f:
            for i, (offset, size) in enumerate(tqdm(self.get_datbin_file_data(), desc="Extracting files", unit="file")):

                # Ignore 0 byte files
                if size == 0:
                    continue

                f.seek(offset, 0)
                data = f.read(size)

                if comptolib.is_compressed(data):
                    c_type = struct.unpack("<b", data[:1])[0]
                    data = comptolib.decompress_data(data)
                    extension = self.get_extension(data)
                    fname = f"{i:05d}.{c_type}.{extension}"
                else:
                    extension = self.get_extension(data)
                    fname = f"{i:05d}.{extension}"

                final_path = dat_bin_path / extension.upper()
                final_path.mkdir(exist_ok=True)

                with open(final_path / fname, "wb") as output:
                    output.write(data)


    def get_style_pointers(self, text_start, text_max, base_offset, start_offset, style, file: FileIO):
        file.seek(0, 2)
        f_size = file.tell()
    
        file.seek(start_offset)
        pointers_offset = []
        pointers_value  = []
        split = [ele for ele in re.split(r'(P)|(\d+)', style) if ele]
        ok = True
        
        while ok:
            for step in split:
                if step == "P":
                    text_offset = struct.unpack("<I", file.read(4))[0] + base_offset

                    if text_offset < f_size and text_offset >= text_start and text_offset < text_max:
                        pointers_value.append(text_offset)
                        pointers_offset.append(file.tell()-4)
                        
                    else:
                        ok = False
                else:
                    file.read(int(step))
        
        return pointers_offset, pointers_value
    

    def extract_all_menu(self) -> None:
        """Dump every menu file described in the menu table to XML.

        Each descriptor names either the main executable (``${main_exe}``) or
        a file under ``<extracted_files>/DAT``. For PAK descriptors one XML is
        written per listed inner file (``<stem>_<index>.xml``); otherwise one
        XML per file (``<stem>.xml``). Output goes to the ``menu_xml`` folder.
        """
        print("Extracting Menu Files...")

        xml_path = self.paths["menu_xml"]
        xml_path.mkdir(exist_ok=True)

        # Read json descriptor file
        with open(self.paths["menu_table"], encoding="utf-8") as table:
            menu_json = json.load(table)

        for entry in tqdm(menu_json):
            file_path = (
                self.paths["original_files"] / self.main_exe_name
                if entry["file_path"] == "${main_exe}"
                else self.paths["extracted_files"] / "DAT" / entry["file_path"]
            )

            # Plain file: a single XML for the whole file
            if not entry["is_pak"]:
                with FileIO(file_path, "rb") as f:
                    xml_data = self.extract_menu_file(entry, f)

                with open(xml_path / f"{file_path.stem}.xml", "wb") as xml_file:
                    xml_file.write(xml_data)
                continue

            # PAK archive: one XML per inner file listed in the descriptor
            pak = Pak.from_path(file_path, int(entry["pak_type"]))
            for p_file in entry["files"]:
                f_index = int(p_file["file"])
                with FileIO(pak[f_index].data, "rb") as f:
                    xml_data = self.extract_menu_file(p_file, f)

                with open(xml_path / f"{file_path.stem}_{f_index:03d}.xml", "wb") as xml_file:
                    xml_file.write(xml_data)
            

    def extract_menu_file(self, file_def, f: FileIO):
        """Build the XML for one menu file from its descriptor.

        Args:
            file_def: Descriptor with a ``base_offset`` and a list of
                ``sections``; each section provides ``section``,
                ``text_start``, ``text_end``, ``pointers_start`` and ``style``.
            f: Stream of the file being dumped.

        Returns:
            The pretty-printed, UTF-8 encoded XML document, with one
            ``Strings`` group per section.
        """
        base_offset = int(file_def["base_offset"])
        xml_root = etree.Element("MenuText")

        for section in file_def['sections']:

            text_start = int(section['text_start'])
            text_end = int(section['text_end'])

            # Extract Pointers of the file
            pointers_offset, pointers_value = self.get_style_pointers(text_start, text_end, base_offset, section['pointers_start'], section['style'], f)

            # Extract Text from the pointers
            texts = [self.bytes_to_text(f, ele) for ele in pointers_value]

            # Only this section's entries go in its group: the lists are built
            # per section, so earlier sections are not repeated in later groups
            section_names = [section['section']] * len(texts)

            # Remove duplicates
            list_informations = self.remove_duplicates(section_names, pointers_offset, texts)

            # Build the XML Structure with the information
            self.create_Node_XML(xml_root, list_informations, section['section'])

        return etree.tostring(xml_root, encoding="UTF-8", pretty_print=True)
        

    def create_Node_XML(self, root, list_informations, section):
        """Add a ``Strings`` group for ``section`` under ``root``.

        Args:
            root: Parent XML node.
            list_informations: Iterable of ``(section, pointers_offset, text)``
                triples; the first item of each triple is not used here.
            section: Text of the group's ``Section`` node.

        Returns:
            ``root``, for convenience.
        """
        group = etree.SubElement(root, 'Strings')
        title = etree.SubElement(group, 'Section')
        title.text = section

        for _section_name, offsets, string in list_informations:
            self.create_Entry(group, offsets, string)

        return root

        
    def pack_main_archive(self):
        """Rebuild DAT.BIN and patch its file table into the executable.

        Files come from ``<extracted_files>/DAT`` and are overridden, index by
        index, by the files found in the ``patched_temp`` folder. Every file
        is padded to a multiple of 0x40 bytes. The new DAT.BIN and a copy of
        the original executable with the updated table are written to
        ``final_files``.
        """
        sectors: list[int] = [0]
        remainders: list[int] = []
        buffer = 0

        # The executable is copied from the project paths at the end of this
        # method, so the former copy between the hard-coded legacy locations
        # (which fails when those folders do not exist) is not performed.

        print("Packing DAT.BIN files...")
        output_dat_path = self.paths["final_files"] / "DAT.BIN"
        output_dat_path.parent.mkdir(parents=True, exist_ok=True)
        original_files = self.paths["extracted_files"] / "DAT"
        total_files = (self.POINTERS_END - self.POINTERS_BEGIN) // 4

        # Get all original DAT.BIN files (names start with the 5-digit index)
        file_list: dict[int, Path] = {}
        for file in original_files.glob("*/*"):
            file_list[int(file.name[:5])] = file

        # Overlay whatever we have compiled; the mapping is NOT reset here so
        # files that were not patched keep their original version
        for file in self.paths["patched_temp"].glob("*/*"):
            file_list[int(file.name[:5])] = file

        with open(output_dat_path, "wb") as output_dat:
            for i in tqdm(range(total_files)):
                file = file_list.get(i)
                if not file:
                    # Missing index: empty entry at the current position
                    remainders.append(0)
                    sectors.append(buffer)
                    continue

                with open(file, "rb") as f2:
                    data = f2.read()

                # Group 2 of the file-name pattern holds the compression type, if any
                match = re.search(self.VALID_FILE_NAME, file.name)
                comp_type = match.group(2) if match else None
                if comp_type is not None:
                    data = comptolib.compress_data(data, version=int(comp_type))

                output_dat.write(data)
                size = len(data)
                # Padding needed to reach the next multiple of 0x40
                remainder = -size % 0x40
                output_dat.write(b"\x00" * remainder)

                remainders.append(remainder)
                buffer += size + remainder
                sectors.append(buffer)

        # Use the new SLPS updated and update the pointers for the SCPK
        original_slps = self.paths["original_files"] / self.main_exe_name
        patched_slps = self.paths["final_files"] / self.main_exe_name
        with open(original_slps, "rb") as f:
            slps = f.read()

        with open(patched_slps, "wb") as f:
            f.write(slps)
            f.seek(self.POINTERS_BEGIN)
            # Each table value is the file start plus the padding of that file
            for sector, remainder in zip(sectors, remainders):
                f.write(struct.pack("<I", sector + remainder))
        
    
    def pack_all_story(self):
        """Rebuild every story SCPK file from its XML.

        Mirrors ``pack_all_skits``: for each ``*.scpk`` in
        ``<extracted_files>/DAT/SCPK`` the script is rewritten from the
        matching XML in ``story_xml`` (where ``extract_all_story`` writes
        them) and the result is saved to ``<temp_files>/DAT/SCPK``.
        """
        print("Recreating Story files...")

        # Project paths instead of the hard-coded legacy locations, and the
        # output folder is created so the first write cannot fail
        out_path = self.paths["temp_files"] / "DAT" / "SCPK"
        out_path.mkdir(parents=True, exist_ok=True)
        xml_path = self.paths["story_xml"]
        scpk_path = self.paths["extracted_files"] / "DAT" / "SCPK"

        for file in (pbar := tqdm(list(scpk_path.glob("*.scpk")))):
            pbar.set_description_str(file.name)
            curr_scpk = Scpk.from_path(file)
            old_rsce = Theirsce(curr_scpk.rsce)
            new_rsce = self.get_new_theirsce(old_rsce, xml_path / file.with_suffix(".xml").name)
            new_rsce.seek(0)
            curr_scpk.rsce = new_rsce.read()

            with open(out_path / file.name, "wb") as f:
                f.write(curr_scpk.to_bytes())

            
    def insert_All(self):
        """Run the insertion step; at present this only repacks the main archive."""
        self.pack_main_archive()


    def extract_Iso(self, umd_iso: Path) -> None:
        """Extract every file of a disc image into the ``original_files`` folder.

        The folder is emptied first. The ISO ``;version`` suffix is removed
        from the extracted file names.

        Args:
            umd_iso: Path of the ISO image.
        """
        print("Extracting ISO files...")

        iso = pycdlib.PyCdlib()
        iso.open(str(umd_iso))

        # Always release the image, even when extraction fails midway
        try:
            extract_to = self.paths["original_files"]
            self.clean_folder(extract_to)

            files = []
            for dirname, _, filelist in iso.walk(iso_path="/"):
                # Only the root directory name ends with "/"; add the
                # separator for files that live in sub-directories
                prefix = dirname if dirname.endswith("/") else dirname + "/"
                files += [prefix + x for x in filelist]

            for file in files:
                out_path = extract_to / file[1:]
                out_path.parent.mkdir(parents=True, exist_ok=True)
                # Strip the ";1" version suffix from the file name only, so a
                # ";" elsewhere in the destination path is left alone
                out_path = out_path.with_name(out_path.name.split(";")[0])

                with iso.open_file_from_iso(iso_path=file) as f, open(out_path, "wb+") as output:
                    with tqdm(total=f.length(), desc=f"Extracting {file[1:].split(';')[0]}", unit="B", unit_divisor=1024, unit_scale=True) as pbar:
                        while data := f.read(2048):
                            output.write(data)
                            pbar.update(len(data))
        finally:
            iso.close()


    def clean_folder(self, path: Path) -> None:
        """Delete everything inside ``path`` except ``.gitignore`` files.

        Sub-folders are removed recursively. The ``.gitignore`` check ignores
        letter case. Nothing is printed when the folder is already empty.

        Args:
            path: Existing folder to empty.
        """
        entries = list(path.iterdir())
        if not entries:
            return

        print("Cleaning folder...")
        for entry in entries:
            if entry.is_dir():
                shutil.rmtree(entry)
                continue
            if entry.name.lower() == ".gitignore":
                continue
            entry.unlink(missing_ok=False)
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
+								import io
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
+								import json
 								import os
 								import re
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
+								import shutil
 								import struct
 								from dataclasses import dataclass
 								from itertools import tee
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
+								from pathlib import Path
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
 								import lxml.etree as etree
 								import pandas as pd
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								import pycdlib
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
+								from tqdm import tqdm
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								from pythonlib.formats.FileIO import FileIO
 								from pythonlib.formats.pak import Pak
-												Folder structure

Trying to make it more package-y

											
										
										
											2023-05-19 08:07:41 -05:00
+								from pythonlib.formats.scpk import Scpk
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
-												Folder structure

Trying to make it more package-y

											
										
										
											2023-05-19 08:07:41 -05:00
+								import pythonlib.utils.comptolib as comptolib
 								import pythonlib.formats.pak2 as pak2lib
 								from pythonlib.formats.theirsce import Theirsce
 								from pythonlib.formats.theirsce_instructions import (AluOperation, InstructionType,
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
+								                                                     TheirsceBaseInstruction)
 								from .ToolsTales import ToolsTales
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
 								@dataclass
 								class LineEntry:
 								    names: list[str]
 								    text: str
 								    offset: int
 								@dataclass
 								class NameEntry:
 								    index: int
 								    offsets: list[int]
 								VARIABLE_NAME = "[VARIABLE]"
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
 								class ToolsTOR(ToolsTales):
 								    POINTERS_BEGIN = 0xD76B0                                            # Offset to DAT.BIN pointer list start in SLPS_254.50 file
 								    POINTERS_END   = 0xE60C8                                            # Offset to DAT.BIN pointer list end in SLPS_254.50 file
 								    HIGH_BITS      = 0xFFFFFFC0
 								    LOW_BITS       = 0x3F
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
 								    #Path to used
-												Folder structure

Trying to make it more package-y

											
										
										
											2023-05-19 08:07:41 -05:00
+								    # fmt: off
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
+								    dat_bin_original    = '../Data/Tales-Of-Rebirth/Disc/Original/DAT.BIN'
 								    dat_bin_new         = '../Data/Tales-Of-Rebirth/Disc/New/DAT.BIN'
 								    elf_original        = '../Data/Tales-Of-Rebirth/Disc/Original/SLPS_254.50'
 								    elf_new             = '../Data/Tales-Of-Rebirth/Disc/New/SLPS_254.50'
 								    story_XML_new       = '../Tales-Of-Rebirth/Data/TOR/Story/'                        #Story XML files will be extracted here
 								    story_XML_patch     = '../Data/Tales-Of-Rebirth/Story/'               #Story XML files will be extracted here
 								    skit_XML_patch      = '../Data/Tales-Of-Rebirth/Skits/'                        #Skits XML files will be extracted here
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								    menu_XML_patch      = '../Tales-Of-Rebirth/Data/TOR/Menu/'
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
+								    skit_XML_new        = '../Tales-Of-Rebirth/Data/TOR/Skits/'
 								    dat_archive_extract = '../Data/Tales-Of-Rebirth/DAT/'
-												Folder structure

Trying to make it more package-y

											
										
										
											2023-05-19 08:07:41 -05:00
+								    # fmt: on
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								    def __init__(self, project_file: Path) -> None:
 								        base_path = project_file.parent
 								        self.jsonTblTags = {}
 								        self.ijsonTblTags = {}
 								        with open(project_file, encoding="utf-8") as f:
 								            jsonRaw = json.load(f)
 								        self.paths: dict[str, Path] = {k: base_path / v for k, v in jsonRaw["paths"].items()}
 								        self.main_exe_name = jsonRaw["main_exe_name"]
 								        # super().__init__("TOR", str(self.paths["encoding_table"]), "Tales-Of-Rebirth")
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        with open(self.paths["encoding_table"], encoding="utf-8") as f:
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
+								            jsonRaw = json.load(f)
 								        for k, v in jsonRaw.items():
 								            self.jsonTblTags[k] = {int(k2, 16): v2 for k2, v2 in v.items()}
-												Move functions to TOR instead of parent class

											
										
										
											2022-07-16 15:11:15 -04:00
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
+								        for k, v in self.jsonTblTags.items():
 								            self.ijsonTblTags[k] = {v2: k2 for k2, v2 in v.items()}
-												Move functions to TOR instead of parent class

											
										
										
											2022-07-16 15:11:15 -04:00
+								        self.id = 1
-												Formatting changes

											
										
										
											2023-05-19 07:30:53 -05:00
+								        # byteCode
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
+								        self.story_byte_code = b"\xF8"
-												Theirsce specific text extraction, part 1

											
										
										
											2023-01-06 22:39:17 -05:00
+								        self.string_opcode = InstructionType.STRING
-												Move transfer stuff

											
										
										
											2023-06-10 23:38:14 -05:00
+								        self.list_status_insertion: list[str] = ['Done', 'Proofreading', 'Editing']
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
-												Add functions to transfer Lauren translations

											
										
										
											2023-01-06 22:16:30 -05:00
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
+								    # Extract the story files
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
+								    def extract_all_story(self, replace=False) -> None:
 								        print("Extracting Story files...")
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
-												Update ToolsTOR.py

											
										
										
											2023-06-10 20:38:48 -05:00
+								        folder_path = self.paths["story_xml"]
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        folder_path.mkdir(exist_ok=True)
 								        scpk_path = self.paths["extracted_files"] / "DAT" / "SCPK"
-												Fix progress bars

											
										
										
											2023-05-19 10:14:55 -05:00
 								        for file in tqdm(list(scpk_path.glob("*.scpk"))):
-												Update ToolsTOR.py

											
										
										
											2023-05-22 20:49:45 -05:00
+								            theirsce = Theirsce(Scpk.from_path(file).rsce)
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
+								            xml_text = self.get_xml_from_theirsce(theirsce, "Story")
-												Remove Section and Duplicate

											
										
										
											2022-07-04 16:10:43 -04:00
+								            self.id = 1
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
 								            with open(folder_path / file.with_suffix(".xml").name, "wb") as xml:
 								                xml.write(xml_text)
-												Create new function to extract all skits

											
										
										
											2022-08-13 00:13:24 -04:00
 								    # Extract all the skits files
-												Capitalization memes

											
										
										
											2023-05-19 08:23:47 -05:00
+								    def extract_all_skits(self, replace=False) -> None:
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
+								        print("Extracting Skit files...")
-												Update ToolsTOR.py

											
										
										
											2023-06-10 20:38:48 -05:00
+								        folder_path = self.paths["skit_xml"]
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        folder_path.mkdir(exist_ok=True)
 								        pak2_path = self.paths["extracted_files"] / "DAT" / "PAK2"
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
-												Fix progress bars

											
										
										
											2023-05-19 10:14:55 -05:00
+								        for file in tqdm(list(pak2_path.glob("*.pak2"))):
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
+								            with open(file, "rb") as pak:
 								                theirsce = pak2lib.get_theirsce_from_pak2(pak.read())
 								            xml_text = self.get_xml_from_theirsce(Theirsce(theirsce), "Skits")
-												correct path memes

											
										
										
											2023-05-22 22:37:41 -05:00
+								            xml_name = file.name.split(".")[0] + ".xml"
 								            with open(folder_path / xml_name, "wb") as xml:
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
+								                xml.write(xml_text)
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
+								    # Extract THEIRSCE to XML
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
+								    def get_xml_from_theirsce(self, rsce: Theirsce, section: str) -> bytes:
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
 								        #Create the XML file
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
+								        # root = etree.Element('SceneText')
 								        # etree.SubElement(root, "OriginalName").text = file_name
-												Theirsce specific text extraction, part 1

											
										
										
											2023-01-06 22:39:17 -05:00
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
+								        #pointers_offset, texts_offset = self.extract_Story_Pointers(rsce)
 								        names, lines = self.extract_lines_with_speaker(rsce)
 								        for i, (k, v) in enumerate(names.items(), -1):
 								            names[k] = NameEntry(i, v)
-												correct Menu reinsertion of Skits Name

											
										
										
											2022-02-11 21:16:19 -05:00
 								        #Remove duplicates
-												Remove Section and Duplicate

											
										
										
											2022-07-04 16:10:43 -04:00
+								        #list_informations = self.remove_duplicates(["Story"] * len(pointers_offset), pointers_offset, text_list)
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
+								        # list_lines = ( ['Story', line.offset, line.text] for line in lines)
 								        # list_names = ( ['Story', line.offset, line.text] for i, (k, v) in enumerate(found_names.items()))
-												Adjust extract_All_Story_Files

Add Section and Destination parameters

- update Extract_Theirsce_XML
   - Add theirsce file as parameter
   - Add destination and section
- update extract_All_Story_Files so it works with new parameters

											
										
										
											2022-08-12 21:49:23 -04:00
+								        #Build the XML Structure with the information
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
 								        root = etree.Element("SceneText")
 								        speakers_node = etree.SubElement(root, 'Speakers')
-												Fix "Speaker" and voice_id replace

											
										
										
											2023-01-07 22:00:46 -05:00
+								        etree.SubElement(speakers_node, 'Section').text = "Speaker"
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
+								        strings_node = etree.SubElement(root, 'Strings')
 								        etree.SubElement(strings_node, 'Section').text = section
 								        self.make_speakers_section(speakers_node, names)
 								        self.make_strings_section(strings_node, lines, names)
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
-												Rewrite skit and story extraction

No more in-between copies when extracting, also moved the xml saving to the extracting functions and progress bars!

											
										
										
											2023-05-19 07:55:15 -05:00
+								        # Return XML string
 								        return etree.tostring(root, encoding="UTF-8", pretty_print=True)
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
 								    def make_strings_section(self, root, lines: list[LineEntry], names: dict[str, NameEntry]):
 								        pass
 								        for line in lines:
 								            entry_node = etree.SubElement(root, "Entry")
 								            etree.SubElement(entry_node,"PointerOffset").text = str(line.offset)
 								            text_split = list(filter(None, re.split(self.COMMON_TAG, line.text)))
 								            if len(text_split) > 1 and text_split[0].startswith("<voice:"):
 								                etree.SubElement(entry_node,"VoiceId").text  = text_split[0][1:-1].split(":")[1]
 								                etree.SubElement(entry_node, "JapaneseText").text = ''.join(text_split[1:])
 								            else:
 								                etree.SubElement(entry_node, "JapaneseText").text = line.text
 								            etree.SubElement(entry_node,"EnglishText")
 								            etree.SubElement(entry_node,"Notes")
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
+								            if line.names:
 								                etree.SubElement(entry_node,"SpeakerId").text = ','.join([str(names[n].index) for n in line.names])
 								            etree.SubElement(entry_node,"Id").text = str(self.id)
 								            self.id = self.id + 1
 								            if line.text == '':
 								                statusText = 'Done'
 								            else:
 								                statusText = 'To Do'
 								            etree.SubElement(entry_node,"Status").text        = statusText
 								    def make_speakers_section(self, root, names: dict[str, NameEntry]):
 								        for k, v in names.items():
 								            entry_node = etree.SubElement(root, "Entry")
-												Make PointerOffset self-closing

											
										
										
											2023-01-06 23:16:52 -05:00
+								            if v.offsets:
 								                etree.SubElement(entry_node,"PointerOffset").text = ",".join([str(off) for off in v.offsets])
 								            else:
 								                etree.SubElement(entry_node,"PointerOffset")
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
+								            etree.SubElement(entry_node,"JapaneseText").text  = str(k)
 								            etree.SubElement(entry_node,"EnglishText")
 								            etree.SubElement(entry_node,"Notes")
 								            etree.SubElement(entry_node,"Id").text            = str(v.index)
 								            etree.SubElement(entry_node,"Status").text         = "To Do"
 								    def extract_lines_with_speaker(self, theirsce: Theirsce):
 								        # This will do a bit of everything thanks to the "nice"
 								        # architecture of the Theirsce class :)
 								        # Debug
 								        # sections = []
 								        # for _, section in enumerate(theirsce.sections):
 								        #     for _, sub in enumerate(section):
 								        #         sections.append(sub.off)
 								        # Setup three-way opcode generator
 								        d = TheirsceBaseInstruction(); d.type = InstructionType.INVALID
 								        a,b,c = tee(theirsce.walk_code(), 3)
 								        next(a, d)
 								        next(b, d); next(b, d)
 								        next(c, d); next(c, d); next(c, d)
 								        # Helper function, in the future I'll
 								        # just use a list of opcodes
 								        def skip():
 								            next(a, d); next(a, d)
 								            next(b, d); next(b, d)
 								            next(c, d); next(c, d)
 								        names = {VARIABLE_NAME: []}
 								        lines = []
 								        params = []
 								        used = False
 								        for op1, op2, op3 in zip(a,b,c):
 								            # Debug
 								            # if theirsce.tell() in sections:
 								            #     print()
 								            #     print("SECTION: ")
 								            # BREAK marks start of a local function
 								            # so local params are no longer in scope
 								            if op1.type is InstructionType.BREAK:
 								                if used == False:
 								                    for param in params:
 								                        text = self.bytes_to_text(theirsce, param.offset + theirsce.strings_offset)
 								                        lines.append(LineEntry([], text, op1.position + 1))
 								                params.clear()
 								                continue
 								            # This sequence mark the simple act of assigning
 								            # a string to a local variable, so we can detect
 								            # when they are used later in a function call
 								            if (op1.type is InstructionType.REFERENCE
 								                and op2.type is InstructionType.STRING
 								                and op3.type is InstructionType.ALU
 								                and op3.operation == AluOperation.ASSIGNMENT
 								                ):
 								                params.append(op2)
 								                skip()
 								                continue
 								            # This sequence represents the textbox call with
 								            # the name being a variable (NPCs do this)
 								            if (op1.type is InstructionType.REFERENCE
 								                and op2.type is InstructionType.STRING
 								                and op3.type is InstructionType.SYSCALL
 								                and op3.function_index == 0x45
 								                ):
 								                if len(params) >= 1:
 								                    name = [self.bytes_to_text(theirsce, p.offset + theirsce.strings_offset) for p in params]
 								                    [names.setdefault(n, []).append(p.position + 1) for n, p in zip(name, params)]
 								                elif len(params) == 0:
 								                    name = []
 								                text = self.bytes_to_text(theirsce, op2.offset + theirsce.strings_offset)
 								                lines.append(LineEntry(name, text, op2.position + 1))
 								                #print(f"{params}: {text}")
 								                used = True
 								                skip()
 								                continue
 								            # This sequence represents the textbox call with
 								            # the text being a variable (Notice boxes do this)
 								            if (op1.type is InstructionType.STRING
 								                and op2.type is InstructionType.REFERENCE
 								                and op3.type is InstructionType.SYSCALL
 								                and op3.function_index == 0x45
 								                ):
 								                name = [self.bytes_to_text(theirsce, op1.offset + theirsce.strings_offset)]
 								                names.setdefault(name[0], []).append(op1.position + 1)
 								                for param in params:
 								                    text = self.bytes_to_text(theirsce, param.offset + theirsce.strings_offset)
 								                    lines.append(LineEntry(name, text, param.position + 1))
 								                    #print(f"{text}: {name}")
 								                used = True
 								                params.clear()
 								                skip()
 								                continue
 								            # This sequence represents a regular textbox call
 								            # where both fields are an string (everything else, save for skits)
 								            if (op1.type is InstructionType.STRING
 								                and op2.type is InstructionType.STRING
 								                and op3.type is InstructionType.SYSCALL
 								                and op3.function_index == 0x45
 								                ):
 								                name = [self.bytes_to_text(theirsce, op1.offset + theirsce.strings_offset)]
 								                names.setdefault(name[0], []).append(op1.position + 1)
 								                text = self.bytes_to_text(theirsce, op2.offset + theirsce.strings_offset)
 								                lines.append(LineEntry(name, text, op2.position + 1))
 								                #print(f"{name}: {text}")
 								                skip()
 								                continue
 								            # Any other string in assorted code calls
 								            if op1.type is InstructionType.STRING:
 								                #print(theirsce.read_string_at(op1.offset + theirsce.strings_offset))
 								                text = self.bytes_to_text(theirsce, op1.offset + theirsce.strings_offset)
 								                lines.append(LineEntry([], text, op1.position + 1))
 								                continue
 								        return names, lines
 								    def extract_story_pointers_plain(self, theirsce: Theirsce):
-												Theirsce specific text extraction, part 1

											
										
										
											2023-01-06 22:39:17 -05:00
+								        pointers_offset = []; texts_offset = []
 								        for opcode in theirsce.walk_code():
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
+								            if opcode.type == self.string_opcode:
-												Theirsce specific text extraction, part 1

											
										
										
											2023-01-06 22:39:17 -05:00
+								                pointers_offset.append(theirsce.tell() - 2) # Maybe check this later
 								                texts_offset.append(opcode.offset + theirsce.strings_offset)
 								        return pointers_offset, texts_offset
-												Move functions to TOR instead of parent class

											
										
										
											2022-07-16 15:11:15 -04:00
+								    #Convert a bytes object to text using TAGS and TBL in the json file
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								    def bytes_to_text(self, src: FileIO, offset: int = -1) -> str:
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
+								        finalText = ""
 								        tags = self.jsonTblTags['TAGS']
 								        chars = self.jsonTblTags['TBL']
-												Move functions to TOR instead of parent class

											
										
										
											2022-07-16 15:11:15 -04:00
+								        if (offset > 0):
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								            src.seek(offset, 0)
-												Move functions to TOR instead of parent class

											
										
										
											2022-07-16 15:11:15 -04:00
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
+								        while True:
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								            b = src.read(1)
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								            if b == b"\x00": break
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
 								            b = ord(b)
 								            # Custom Encoded Text
 								            if (0x99 <= b <= 0x9F) or (0xE0 <= b <= 0xEB):
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								                c = (b << 8) | src.read_uint8()
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
+								                finalText += chars.get(c, "{%02X}{%02X}" % (c >> 8, c & 0xFF))
 								                continue
 								            if b == 0x1:
 								                finalText += ("\n")
 								                continue
 								            # ASCII text
 								            if chr(b) in self.PRINTABLE_CHARS:
 								                finalText += chr(b)
 								                continue
 								            # cp932 text
 								            if 0xA0 < b < 0xE0:
 								                finalText += struct.pack("B", b).decode("cp932")
 								                continue
 								            if b == 0x81:
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								                next_b = src.read(1)
-												Move functions to TOR instead of parent class

											
										
										
											2022-07-16 15:11:15 -04:00
+								                if next_b == b"\x40":
 								                    finalText += "　"
 								                else:
 								                    finalText += "{%02X}" % b
 								                    finalText += "{%02X}" % ord(next_b)
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
+								                continue
 								            # Simple Tags
 								            if 0x3 <= b <= 0xF:
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								                parameter = src.read_uint32()
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
 								                tag_name = tags.get(b, f"{b:02X}")
 								                tag_param = self.jsonTblTags.get(tag_name.upper(), {}).get(parameter, None)
 								                if tag_param is not None:
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								                    finalText += f"<{tag_param}>"
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
+								                else:
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								                    finalText += f"<{tag_name}:{parameter:X}>"
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
 								                continue
 								            # Variable tags (same as above but using rsce bytecode as parameter)
 								            if 0x13 <= b <= 0x1A:
 								                tag_name = f"unk{b:02X}"
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								                parameter = "".join([f"{c:02X}" for c in Theirsce.read_tag_bytes(src)])
-												Rework tag acquisition and text conversion

											
										
										
											2023-05-16 00:05:37 -05:00
 								                finalText += f"<{tag_name}:{parameter}>"
 								                continue
 								            # None of the above
 								            finalText += "{%02X}" % b
-												Move functions to TOR instead of parent class

											
										
										
											2022-07-16 15:11:15 -04:00
-												Update dump process with speaker nodes

											
										
										
											2023-01-06 22:45:40 -05:00
+								        return finalText
-												Move functions to TOR instead of parent class

											
										
										
											2022-07-16 15:11:15 -04:00
-												Capitalization

											
										
										
											2023-05-22 12:53:18 -05:00
+								    def get_node_bytes(self, entry_node):
-												Create new function get_Node_Bytes

Take a node and return Bytes

											
										
										
											2022-06-28 21:39:01 -04:00
 								        #Grab the fields from the Entry in the XML
 								        status = entry_node.find("Status").text
 								        japanese_text = entry_node.find("JapaneseText").text
 								        english_text = entry_node.find("EnglishText").text
 								        #Use the values only for Status = Done and use English if non empty
 								        final_text = ''
-												Replace previous variable by list_status_insertion

											
										
										
											2022-06-28 21:41:25 -04:00
+								        if (status in self.list_status_insertion):
-												Create new function get_Node_Bytes

Take a node and return Bytes

											
										
										
											2022-06-28 21:39:01 -04:00
+								            final_text = english_text or japanese_text or ''
 								        else:
 								            final_text = japanese_text or ''
-												Update TSS functions

update voiceId

											
										
										
											2022-10-22 21:18:01 -04:00
 								        voiceId_node = entry_node.find("VoiceId")
 								        if (voiceId_node != None):
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
+								            final_text = '<voice:{}>'.format(voiceId_node.text) + final_text
-												Adding destination parameter to the  function

											
										
										
											2022-08-15 12:56:58 -04:00
-												Create new function get_Node_Bytes

Take a node and return Bytes

											
										
										
											2022-06-28 21:39:01 -04:00
+								        #Convert the text values to bytes using TBL, TAGS, COLORS, ...
 								        bytes_entry = self.text_to_bytes(final_text)
-												Display current item in skit and story progress bar

											
										
										
											2023-05-22 21:49:15 -05:00
+								        return bytes_entry
-												Create new function get_Node_Bytes

Take a node and return Bytes

											
										
										
											2022-06-28 21:39:01 -04:00
-												New Story insert code

											
										
										
											2023-05-22 12:53:52 -05:00
+								    def get_new_theirsce(self, theirsce: Theirsce, xml: Path) -> Theirsce:
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
 								        #To store the new text_offset and pointers to update
 								        new_text_offsets = dict()
 								        #Read the XML for the corresponding THEIRSCE
-												Remove Section and Duplicate

											
										
										
											2022-07-04 16:10:43 -04:00
-												New Story insert code

											
										
										
											2023-05-22 12:53:52 -05:00
+								        tree = etree.parse(xml)
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
+								        root = tree.getroot()
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
-												Comments and rename getNewTheirsce

											
										
										
											2022-06-28 21:47:33 -04:00
+								        #Go at the start of the dialog
 								        #Loop on every Entry and reinsert
-												New Story insert code

											
										
										
											2023-05-22 12:53:52 -05:00
+								        theirsce.seek(theirsce.strings_offset + 1)
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
+								        nodes = [ele for ele in root.iter('Entry') if ele.find('Id').text != "-1"]
 								        nodes = [ele for ele in nodes if ele.find('PointerOffset').text != "-1"]
 								        for entry_node in nodes:
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
+								            #Add the PointerOffset and TextOffset
 								            new_text_offsets[entry_node.find("PointerOffset").text] = theirsce.tell()
-												Replace old code by calling get_Node_Bytes

											
										
										
											2022-06-28 21:43:07 -04:00
+								            #Use the node to get the new bytes
-												New Story insert code

											
										
										
											2023-05-22 12:53:52 -05:00
+								            bytes_entry = self.get_node_bytes(entry_node)
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
 								            #Write to the file
-												Replace old code by calling get_Node_Bytes

											
										
										
											2022-06-28 21:43:07 -04:00
+								            theirsce.write(bytes_entry + b'\x00')
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
-												Comments and rename getNewTheirsce

											
										
										
											2022-06-28 21:47:33 -04:00
+								        #Update the pointers based on the new text_offset of  the entries
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
+								        for pointer_offset, text_offset in new_text_offsets.items():
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
+								            pointers_list = pointer_offset.split(",")
-												New Story insert code

											
										
										
											2023-05-22 12:53:52 -05:00
+								            new_value = text_offset - theirsce.strings_offset
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
 								            for pointer in pointers_list:
 								                theirsce.seek(int(pointer))
-												Change pointers to 2 bytes

											
										
										
											2022-06-28 21:31:01 -04:00
+								                theirsce.write( struct.pack("<H", new_value))
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
 								        return theirsce
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
-												New skits insert code

											
										
										
											2023-05-22 13:02:07 -05:00
+								    def pack_all_skits(self):
 								        print("Recreating Skit files...")
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        out_path = self.paths["temp_files"] / "DAT" / "PAK2"
 								        out_path.mkdir(parents=True, exist_ok=True)
-												Update ToolsTOR.py

											
										
										
											2023-06-10 20:38:48 -05:00
+								        xml_path = self.paths["skit_xml"]
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        pak2_path = self.paths["extracted_files"] / "DAT" / "PAK2"
-												New skits insert code

											
										
										
											2023-05-22 13:02:07 -05:00
-												Display current item in skit and story progress bar

											
										
										
											2023-05-22 21:49:15 -05:00
+								        for file in (pbar:= tqdm(list(pak2_path.glob("*.pak2")))):
 								            pbar.set_description_str(file.name)
-												New skits insert code

											
										
										
											2023-05-22 13:02:07 -05:00
+								            with open(file, "rb") as f:
 								                pak2_data = f.read()
 								            pak2_obj = pak2lib.get_data(pak2_data)
 								            old_rsce = Theirsce(pak2_obj.chunks.theirsce)
-												correct path memes

											
										
										
											2023-05-22 22:37:41 -05:00
+								            xml_name = file.name.split(".")[0] + ".xml"
 								            new_rsce = self.get_new_theirsce(old_rsce, xml_path / xml_name)
-												New skits insert code

											
										
										
											2023-05-22 13:02:07 -05:00
+								            new_rsce.seek(0)
-												correct path memes

											
										
										
											2023-05-22 22:37:41 -05:00
+								            pak2_obj.chunks.theirsce = new_rsce.read()
-												New skits insert code

											
										
										
											2023-05-22 13:02:07 -05:00
 								            with open(out_path / file.name, "wb") as f:
 								                f.write(pak2lib.create_pak2(pak2_obj))
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
 								    def debug_Story_Skits(self, section, file_name, text=False):
 								        if section == "Story":
 								            theirsce = self.get_theirsce_from_scpk(self.dat_archive_extract + 'SCPK/' + self.get_file_name(file_name) + '.scpk')
 								        else:
 								            with open(self.dat_archive_extract + "PAK2/" + file_name.split(".")[0] + '.3.pak2', "rb") as pak:
 								                data = pak.read()
 								            theirsce = io.BytesIO(pak2lib.get_theirsce_from_pak2(data))
-												Fix "Speaker" and voice_id replace

											
										
										
											2023-01-07 22:00:46 -05:00
+								        rsce = Theirsce(path=theirsce)
 								        # pointers_offset, texts_offset = self.extract_Story_Pointers(rsce)
 								        names, lines = self.extract_lines_with_speaker(rsce)
 								        for i, (k, v) in enumerate(names.items(), -1):
 								            names[k] = NameEntry(i, v)
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
+								        with open('../{}.theirsce'.format(file_name), 'wb') as f:
 								            f.write(theirsce.getvalue())
 								        text_list = []
 								        if text:
-												Fix "Speaker" and voice_id replace

											
										
										
											2023-01-07 22:00:46 -05:00
+								            text_list = [line.text for line in lines]
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
-												Fix "Speaker" and voice_id replace

											
										
										
											2023-01-07 22:00:46 -05:00
+								        df = pd.DataFrame({"Jap_Text": text_list})
-												Add a replace flag

Add a replace tag

											
										
										
											2022-12-21 19:10:18 -05:00
+								        df['Text_Offset'] = df['Text_Offset'].apply(lambda x: hex(x)[2:])
 								        df['Pointers_Offset'] = df['Pointers_Offset'].apply(lambda x: hex(x)[2:])
 								        df.to_excel('../{}.xlsx'.format(self.get_file_name(file_name)), index=False)
-												Move and tweak get pointers into talesTOR

code seemed TOR specific anyway

											
										
										
											2023-05-19 07:45:20 -05:00
-												Don't skip files when extracting DAT.BIN

											
										
										
											2023-05-23 12:13:58 -05:00
+								    def get_datbin_file_data(self) -> list[tuple[int, int]]:
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        slps_path = self.paths["original_files"] / self.main_exe_name
 								        with open(slps_path, "rb") as elf:
-												Move and tweak get pointers into talesTOR

code seemed TOR specific anyway

											
										
										
											2023-05-19 07:45:20 -05:00
+								            elf.seek(self.POINTERS_BEGIN, 0)
 								            blob = elf.read(self.POINTERS_END-self.POINTERS_BEGIN)
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        pointers = struct.unpack(f"<{len(blob)//4}I", blob)
-												Don't skip files when extracting DAT.BIN

											
										
										
											2023-05-23 12:13:58 -05:00
+								        file_data: list[tuple[int, int]] = []
-												Rewrite DAT.BIN extraction

											
										
										
											2023-05-19 07:48:01 -05:00
+								        for c, n in zip(pointers, pointers[1:]):
 								            remainder = c & self.LOW_BITS
 								            start = c & self.HIGH_BITS
 								            end = (n & self.HIGH_BITS) - remainder
-												Don't skip files when extracting DAT.BIN

											
										
										
											2023-05-23 12:13:58 -05:00
+								            file_data.append((start, end - start))
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
-												Rewrite DAT.BIN extraction

											
										
										
											2023-05-19 07:48:01 -05:00
+								        return file_data
 								    # Extract the file DAT.BIN to the different directorties
 								    def extract_main_archive(self) -> None:
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        dat_bin_path = self.paths["extracted_files"] / "DAT"
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
-												Update ToolsTOR.py

											
										
										
											2023-07-27 22:00:32 -05:00
+								        self.clean_folder(dat_bin_path)
-												Fix wrong start offsets on DAT.BIN extraction

And added cleaning before copy

											
										
										
											2023-05-19 10:15:42 -05:00
 								        print("Extracting DAT.BIN files...")
-												Rewrite DAT.BIN extraction

											
										
										
											2023-05-19 07:48:01 -05:00
+								        with open( self.dat_bin_original, "rb") as f:
-												Don't skip files when extracting DAT.BIN

											
										
										
											2023-05-23 12:13:58 -05:00
+								            for i, (offset, size) in enumerate(tqdm(self.get_datbin_file_data(), desc="Extracting files", unit="file")):
-												Rewrite DAT.BIN extraction

											
										
										
											2023-05-19 07:48:01 -05:00
-												Basic set of files to extract TOR SCPK files

- Basic example in TOR_Test.py to extract the Scenario files to XML

											
										
										
											2022-01-23 08:25:40 -05:00
+								                # Ignore 0 byte files
-												Rewrite DAT.BIN extraction

											
										
										
											2023-05-19 07:48:01 -05:00
+								                if size == 0:
 								                    continue
 								                f.seek(offset, 0)
 								                data = f.read(size)
 								                if comptolib.is_compressed(data):
 								                    c_type = struct.unpack("<b", data[:1])[0]
 								                    data = comptolib.decompress_data(data)
 								                    extension = self.get_extension(data)
 								                    fname = f"{i:05d}.{c_type}.{extension}"
 								                else:
 								                    extension = self.get_extension(data)
 								                    fname = f"{i:05d}.{extension}"
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								                final_path = dat_bin_path / extension.upper()
 								                final_path.mkdir(exist_ok=True)
-												Rewrite DAT.BIN extraction

											
										
										
											2023-05-19 07:48:01 -05:00
 								                with open(final_path / fname, "wb") as output:
 								                    output.write(data)
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
 								    def get_style_pointers(self, text_start, text_max, base_offset, start_offset, style, file: FileIO):
 								        file.seek(0, 2)
 								        f_size = file.tell()
 								        file.seek(start_offset)
 								        pointers_offset = []
 								        pointers_value  = []
 								        split = [ele for ele in re.split(r'(P)|(\d+)', style) if ele]
 								        ok = True
 								        while ok:
 								            for step in split:
 								                if step == "P":
 								                    text_offset = struct.unpack("<I", file.read(4))[0] + base_offset
 								                    if text_offset < f_size and text_offset >= text_start and text_offset < text_max:
 								                        pointers_value.append(text_offset)
 								                        pointers_offset.append(file.tell()-4)
 								                    else:
 								                        ok = False
 								                else:
 								                    file.read(int(step))
 								        return pointers_offset, pointers_value
 								    def extract_all_menu(self) -> None:
 								        print("Extracting Menu Files...")
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
 								        xml_path = self.paths["menu_xml"]
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								        xml_path.mkdir(exist_ok=True)
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        # Read json descriptor file
 								        with open(self.paths["menu_table"], encoding="utf-8") as f:
 								            menu_json = json.load(f)
 								        for entry in tqdm(menu_json):
 								            if entry["file_path"] == "${main_exe}":
 								                file_path = self.paths["original_files"] / self.main_exe_name
 								            else:
 								                file_path = self.paths["extracted_files"] / "DAT" / entry["file_path"]
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								            if entry["is_pak"]:
 								                pak = Pak.from_path(file_path, int(entry["pak_type"]))
 								                for p_file in entry["files"]:
 								                    f_index = int(p_file["file"])
 								                    with FileIO(pak[f_index].data, "rb") as f:
 								                        xml_data = self.extract_menu_file(p_file, f)
 								                    with open(xml_path / f"{file_path.stem}_{f_index:03d}.xml", "wb") as xmlFile:
 								                        xmlFile.write(xml_data)
 								            else:
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								                with FileIO(file_path, "rb") as f:
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								                    xml_data = self.extract_menu_file(entry, f)
 								                with open(xml_path / f"{file_path.stem}.xml", "wb") as xmlFile:
 								                    xmlFile.write(xml_data)
 								    def extract_menu_file(self, file_def, f: FileIO):
 								        section_list = []
 								        pointers_offset_list = []
 								        texts_list = []
 								        base_offset = int(file_def["base_offset"])
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        xml_root = etree.Element("MenuText")
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
+								        # print("BaseOffset:{}".format(base_offset))
 								        for section in file_def['sections']:
 								            text_start = int(section['text_start'])
 								            text_end = int(section['text_end'])
 								            #Extract Pointers of the file
 								            # print("Extract Pointers")
 								            pointers_offset, pointers_value = self.get_style_pointers(text_start, text_end, base_offset, section['pointers_start'], section['style'], f)
 								            # print([hex(pv) for pv in pointers_value])
 								            #Extract Text from the pointers
 								            # print("Extract Text")
 								            texts = [ self.bytes_to_text(f, ele) for ele in pointers_value]
 								            #Make a list
 								            section_list.extend( [section['section']] * len(texts))
 								            pointers_offset_list.extend( pointers_offset)
 								            texts_list.extend( texts )
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								            #Remove duplicates
 								            list_informations = self.remove_duplicates(section_list, pointers_offset_list, texts_list)
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								            #Build the XML Structure with the information
 								            xml_section = self.create_Node_XML(xml_root, list_informations, section['section'])
-												menu stuff

big ugly commit, cuz idc

											
										
										
											2023-05-27 17:10:21 -05:00
 								        #Write to XML file
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        return etree.tostring(xml_root, encoding="UTF-8", pretty_print=True)
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
 								    def create_Node_XML(self, root, list_informations, section):
 								        strings_node = etree.SubElement(root, 'Strings')
 								        etree.SubElement(strings_node, 'Section').text = section
 								        for s, pointers_offset, text in list_informations:
 								            self.create_Entry(strings_node,  pointers_offset, text)
 								        return root
-												fixing 11181.pak3 and adding preparing Menu File function

											
										
										
											2022-03-20 10:10:58 -04:00
-												Capitalization memes

											
										
										
											2023-05-19 08:23:47 -05:00
+								    def pack_main_archive(self):
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        sectors: list[int] = [0]
 								        remainders: list[int] = []
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
+								        buffer = 0
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
 								        # Copy the original SLPS to Disc/New
 								        shutil.copy(self.elf_original, self.elf_new)
-												Remove Section and Duplicate

											
										
										
											2022-07-04 16:10:43 -04:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        print("Packing DAT.BIN files...")
 								        output_dat_path = self.paths["final_files"] / "DAT.BIN"
 								        original_files = self.paths["extracted_files"] / "DAT"
 								        total_files = (self.POINTERS_END - self.POINTERS_BEGIN) // 4
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        # Get all original DAT.BIN files
 								        file_list: dict[int, Path] = {}
 								        for file in original_files.glob("*/*"):
 								            file_index = int(file.name[:5])
 								            file_list[file_index] = file
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        # Overlay whatever we have compiled
 								        file_list: dict[int, Path] = {}
 								        for file in self.paths["patched_temp"].glob("*/*"):
 								            file_index = int(file.name[:5])
 								            file_list[file_index] = file
 								        with open(output_dat_path, "wb") as output_dat:
 								            for i in tqdm(range(total_files)):
 								                file = file_list.get(i)
 								                if not file:
 								                    remainders.append(0); sectors.append(buffer)
 								                    continue
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								                with open(file, "rb") as f2:
-												Fixing different issues during repacking (#105)

* Fix Reinsertion issues with Pointeroffset

* Add batch files

* fix issues with SCPK and PAK2 not being created in folder New

* Adding Editing and Copy SLPS

* Fixing Tags Unkn + VoiceId in Story
											
										
										
											2023-05-14 16:50:41 -04:00
+								                    data = f2.read()
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								                comp_type = re.search(self.VALID_FILE_NAME, file.name).group(2)
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
+								                if comp_type != None:
 								                    data = comptolib.compress_data(data, version=int(comp_type))
 								                output_dat.write(data)
 								                size = len(data)
 								                remainder = 0x40 - (size % 0x40)
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								                if remainder == 0x40: remainder = 0
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
+								                output_dat.write(b"\x00" * remainder)
 								                remainders.append(remainder)
 								                buffer += size + remainder
 								                sectors.append(buffer)
-												Use the SLPS updated for SCPK pointers

											
										
										
											2022-08-05 15:22:45 -04:00
+								        #Use the new SLPS updated and update the pointers for the SCPK
-												move to project.json

forgive me lord for I have sinned and this is a single commit

											
										
										
											2023-06-01 21:54:43 -05:00
+								        original_slps = self.paths["original_files"] / self.main_exe_name
 								        patched_slps = self.paths["final_files"] / self.main_exe_name
 								        with open(original_slps, "rb") as f:
 								            slps = f.read()
 								        with open(patched_slps, "wb") as f:
 								            f.write(slps)
 								            f.seek(self.POINTERS_BEGIN)
 								            for sector, remainder in zip(sectors, remainders):
 								                f.write(struct.pack("<I", sector + remainder))
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
-												Updating Scripts and doing test with TOR

											
										
										
											2022-01-30 19:19:43 -05:00
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
-												New Story insert code

											
										
										
											2023-05-22 12:53:52 -05:00
+								    def pack_all_story(self):
 								        print("Recreating Story files...")
 								        # TODO: use pathlib for everything
 								        out_path = Path(self.story_XML_patch) / "New"
-												correct path memes

											
										
										
											2023-05-22 22:37:41 -05:00
+								        xml_path = Path(self.story_XML_new) / "XML"
-												New Story insert code

											
										
										
											2023-05-22 12:53:52 -05:00
+								        scpk_path = Path(self.dat_archive_extract) / "SCPK"
-												Display current item in skit and story progress bar

											
										
										
											2023-05-22 21:49:15 -05:00
+								        for file in (pbar:= tqdm(list(scpk_path.glob("*.scpk")))):
 								            pbar.set_description_str(file.name)
-												fix SCPK and skit packing typos

											
										
										
											2023-05-22 20:48:10 -05:00
+								            curr_scpk = Scpk.from_path(file)
-												New Story insert code

											
										
										
											2023-05-22 12:53:52 -05:00
+								            old_rsce = Theirsce(curr_scpk.rsce)
 								            new_rsce = self.get_new_theirsce(old_rsce, xml_path / file.with_suffix(".xml").name)
 								            new_rsce.seek(0)
 								            curr_scpk.rsce = new_rsce.read()
 								            with open(out_path / file.name, "wb") as f:
 								                f.write(curr_scpk.to_bytes())
-												Updates some scripts

											
										
										
											2022-02-18 15:42:52 -05:00
 								    def insert_All(self):
 								        """Run the insertion step; it consists solely of ``pack_main_archive()``."""
 								        self.pack_main_archive()
 								    def extract_Iso(self, umd_iso: Path) -> None:
 								        """Extract every file of an ISO image into ``self.paths["original_files"]``.

 								        The destination folder is emptied with ``clean_folder`` first. Each
 								        file is copied in 2048-byte chunks with a progress bar, and anything
 								        from the first ``;`` of its ISO name onward (the version suffix) is
 								        left out of the name written to disk.

 								        Args:
 								            umd_iso: Path of the ISO image to open.
 								        """
 								        print("Extracting ISO files...")
 								        extract_to = self.paths["original_files"]

 								        iso = pycdlib.PyCdlib()
 								        iso.open(str(umd_iso))
 								        try:
 								            self.clean_folder(extract_to)

 								            # walk() yields "/" for the root but "/DIR" (no trailing slash)
 								            # for sub-directories, so the separator is normalised here.
 								            iso_paths = [
 								                f"{dirname.rstrip('/')}/{name}"
 								                for dirname, _, filelist in iso.walk(iso_path="/")
 								                for name in filelist
 								            ]

 								            for iso_path in iso_paths:
 								                # Strip the version suffix from the ISO-relative name only,
 								                # so a ";" in the destination folder cannot truncate the path.
 								                relative_name = iso_path[1:].split(";")[0]
 								                out_path = extract_to / relative_name
 								                out_path.parent.mkdir(parents=True, exist_ok=True)
 								                with iso.open_file_from_iso(iso_path=iso_path) as f, open(out_path, "wb+") as output:
 								                    with tqdm(total=f.length(), desc=f"Extracting {relative_name}", unit="B", unit_divisor=1024, unit_scale=True) as pbar:
 								                        while data := f.read(2048):
 								                            output.write(data)
 								                            pbar.update(len(data))
 								        finally:
 								            # Release the image handle even when extraction fails midway.
 								            iso.close()
 								    def clean_folder(self, path: Path) -> None:
 								        """Empty ``path`` while keeping the folder itself and any ``.gitignore``.

 								        Sub-directories are removed recursively. Other entries are unlinked,
 								        except those named ``.gitignore`` (compared case-insensitively).
 								        A ``path`` that does not exist is treated as already clean.

 								        Args:
 								            path: Directory whose contents should be removed.
 								        """
 								        # The folder may not have been created yet; iterdir() would raise
 								        # FileNotFoundError, although there is simply nothing to remove.
 								        if not path.exists():
 								            return

 								        target_files = list(path.iterdir())
 								        if not target_files:
 								            return

 								        print("Cleaning folder...")
 								        for entry in target_files:
 								            if entry.is_dir():
 								                shutil.rmtree(entry)
 								            elif entry.name.lower() != ".gitignore":
 								                entry.unlink(missing_ok=False)