Updating Scripts and doing test with TOR

2026-02-13 15:25:50 -08:00 · 2022-01-30 19:19:43 -05:00
parent 4f59122bac
commit 3c6c455abb
14 changed files with 400 additions and 69 deletions
--- a/Event.dat
+++ b/Event.dat
--- a/SLPS_254.50
+++ b/SLPS_254.50
--- a/TBL_All.json
+++ b/TBL_All.json
@@ -1917,9 +1917,7 @@
 		"58762": "\u5766",
 		"57527": "\u52ab",
 		"57498": "\u7d05",
-		"39944": "\u3000",
-		"39945": "\u3000",
-		"39947": "\u3000",
+		"33088": "\u3000",
 		"60352": "\u7526",
 		"40158": "\u81c6",
 		"39603": "\u203b",
@@ -1961,7 +1959,7 @@
 		"0xD": "button",
 		"0xE": "font"
 	},
-	"name":
+	"NAMES":
 	{
 		"1": "<Veigue>",
 		"2": "<Mao>",
@@ -1974,7 +1972,7 @@
 		"9": "<Annie (NPC)>",
 		"8191": "<OnScreenChar>"
 	},
-	"color":
+	"COLORS":
 	{
 		"1": "<Blue>",
 		"2": "<Red>",
--- a/TOR_Test.py
+++ b/TOR_Test.py
@@ -9,5 +9,37 @@ import pandas as pd


 tool = ToolsTOR.ToolsTOR("tbl")
+tool.extractMainArchive()
+
+
 tool.extractAllStory()

+tool.insertStoryFile("10247.scpk")
+tool.insertMainArchive()
+
+
+text = '自由青年'
+text = '<Blue><Eugene> is awesome'
+bytesFinal = tool.textToBytes(text)
+
+def is_compressed(data):
+    if len(data) < 0x09:
+        return False
+
+    expected_size = struct.unpack("<L", data[1:5])[0]
+    tail_data = abs(len(data) - (expected_size + 9))
+    if expected_size == len(data) - 9:
+        return True
+    elif tail_data <= 0x10 and data[expected_size + 9 :] == b"#" * tail_data:
+        return True # SCPK files have these trailing "#" bytes :(
+    return False
+        
+
+
+with open("event.dat", "rb") as f:
+    data = f.read()
+  
+
+is_compressed(data)
+
+comptolib.decompress_data(data)
--- a/ToolsTOR.py
+++ b/ToolsTOR.py
@@ -17,6 +17,8 @@ import io

 class ToolsTOR(ToolsTales):
    
+    COMMON_TAG = r"(<\w+:?\w+>)"
+    HEX_TAG    = r"(\{[0-9A-F]{2}\})"
    POINTERS_BEGIN = 0xD76B0                                            # Offset to DAT.BIN pointer list start in SLPS_254.50 file
    POINTERS_END   = 0xE60C8                                            # Offset to DAT.BIN pointer list end in SLPS_254.50 file
    HIGH_BITS      = 0xFFFFFFC0
@@ -24,15 +26,18 @@ class ToolsTOR(ToolsTales):
    PRINTABLE_CHARS = "".join(
            (string.digits, string.ascii_letters, string.punctuation, " ")
        )
+    VALID_FILE_NAME = r"([0-9]{2,5})(?:\.)?([1,3])?\.(\w+)$"
+    
    
    #Path to used
-    datBinPath       = '../Data/Disc/Original/DAT.BIN'
-    elfPathExtract   = '../Data/Disc/Original/SLPS_254.50'
-    storyPathArchives= '../Data/Story/SCPK'                        #Story XML files will be extracted here                      
+    datBinOriginal   = '../Data/Disc/Original/DAT.BIN'
+    datBinNew        = '../Data/Disc/New/DAT.BIN'
+    elfOriginal      = '../Data/Disc/Original/SLPS_254.50'
+    elfNew           = '../Data/Disc/New/SLPS_254.50'
+    storyPathArchives= '../Data/Story/SCPK/'                        #Story XML files will be extracted here                      
    storyPathXML     = '../Data/Story/XML/'                     #SCPK will be repacked here
    skitPathArchives = '../Data//Skits/'                        #Skits XML files will be extracted here              
-    datPathExtract   = '../Data/DAT/'
-    allPathInsert    = '../Data/Disc/PSP_GAME/USRDIR'    
+    datPathExtract   = '../Data/DAT/' 
    
    def __init__(self, tbl):
        
@@ -40,14 +45,18 @@ class ToolsTOR(ToolsTales):
        
        with open("TBL_All.json") as f:
            jsonRaw = json.load(f)
+            jsonTblTags = jsonTblTags ={ k1:{ int(k2,16) if (k1 != "TBL") else k2:v2 for k2,v2 in jsonRaw[k1].items()} for k1,v1 in jsonRaw.items()}
            self.jsonTblTags ={ k1:{ int(k2,16) if (k1 != "TBL") else k2:v2 for k2,v2 in jsonRaw[k1].items()} for k1,v1 in jsonRaw.items()}
                
-     
+        self.itable = dict([[i, struct.pack(">H", int(j))] for j, i in self.jsonTblTags['TBL'].items()])
+        self.itags = dict([[i, j] for j, i in self.jsonTblTags['TAGS'].items()])
+        self.inames = dict([[i, j] for j, i in self.jsonTblTags['NAMES'].items()])
+        self.icolors = dict([[i, j] for j, i in self.jsonTblTags['COLORS'].items()])
        
        
    def get_pointers(self):

-        f = open(self.elfPathExtract , "rb")
+        f = open(self.elfOriginal , "rb")
    
        f.seek(self.POINTERS_BEGIN, 0)
        pointers = []
@@ -101,15 +110,23 @@ class ToolsTOR(ToolsTales):
        pointers_offset = []
        texts_offset = []
        
-        
+        previous_addr = 0
        while theirsce.tell() < strings_offset:
            b = theirsce.read(1)
            if b == b"\xF8":
                addr = struct.unpack("<H", theirsce.read(2))[0]
-                if (addr < fsize - strings_offset) and (addr > 0):
-                    # theirsce_data[name].append(theirsce.tell() - 2)
+                
+                current_pos = theirsce.tell()
+                theirsce.seek( addr + strings_offset-1)
+                bValidation = theirsce.read(1)
+                theirsce.seek(current_pos)
+                
+                if (addr < fsize - strings_offset) and (addr > 0) and (bValidation == b'\x00'):
+                    
                    pointers_offset.append(theirsce.tell() - 2)
                    texts_offset.append(addr + strings_offset)
+                    previous_addr = addr
+                    
        return pointers_offset, texts_offset
        
    
@@ -141,11 +158,14 @@ class ToolsTOR(ToolsTales):
                b2 = struct.unpack("<L", theirsce.read(4))[0]
                if b in TAGS:
                    tag_name = TAGS.get(b)
+                    
                    tag_param = None
-                    if (tag_name.upper() + "S") in globals():
-                        tag_param = eval("%sS.get(b2, None)" % tag_name.upper())
+                    tag_search = tag_name.upper()+'S'
+                    if (tag_search in self.jsonTblTags.keys()):
+                        tags2 = self.jsonTblTags[tag_search]
+                        tag_param = tags2.get(b2, None) 
                    if tag_param != None:
-                        finalText += "<%s>" % tag_param
+                        finalText += tag_param
                    else:
                        finalText += ("<%s:%08X>" % (tag_name, b2))
                else:
@@ -174,6 +194,56 @@ class ToolsTOR(ToolsTales):
            
        return finalText
    
+    #Convert text to Bytes object to reinsert text into THEIRSCE and other files
+    def textToBytes(self, text):
+        
+        
+       
+        unames = []
+        
+        splitLineBreak = text.split('\x0A')
+        nb = len(splitLineBreak)
+        
+        bytesFinal = b''
+        i=0
+        for line in splitLineBreak:
+            string_hex = re.split(self.HEX_TAG, line)
+            string_hex = [sh for sh in string_hex if sh]
+        
+            for s in string_hex:
+                if re.match(self.HEX_TAG, s):
+                    bytesFinal += struct.pack("B", int(s[1:3], 16))
+                else:
+                    s_com = re.split(self.COMMON_TAG, s)
+                    s_com = [sc for sc in s_com if sc]
+                    for c in s_com:
+                        if re.match(self.COMMON_TAG, c):
+                            if ":" in c:
+                                split = c.split(":")
+                                if split[0][1:] in self.itags.keys():
+                                    bytesFinal += struct.pack("B", self.itags[split[0][1:]])
+                                    bytesFinal += struct.pack("<I", int(split[1][:8], 16))
+                                else:
+                                    bytesFinal += struct.pack("B", int(split[0][1:], 16))
+                                    bytesFinal += struct.pack("<I", int(split[1][:8], 16))
+                            if c in self.inames:
+                                bytesFinal += struct.pack("B", 0xB)
+                                bytesFinal += struct.pack("<I", self.inames[c])
+                            if c in self.icolors:
+                                bytesFinal += struct.pack("B", 0x5)
+                                bytesFinal += struct.pack("<I", self.icolors[c])
+                        else:
+                            for c2 in c:
+                                if c2 in self.itable.keys():
+                                    bytesFinal += self.itable[c2]
+                                else:
+                                    bytesFinal += c2.encode("cp932")
+            i=i+1
+            if (nb >=2 and i<nb):
+                bytesFinal += b'\x01'
+        
+        return bytesFinal
+        
    # Extract THEIRSCE to XML
    def extractTheirSceXML(self, scpkFileName):
     
@@ -182,12 +252,15 @@ class ToolsTOR(ToolsTales):
        etree.SubElement(root, "OriginalName").text = scpkFileName
        
        stringsNode = etree.SubElement(root, "Strings")
-        etree.SubElement(stringsNode, "Type").text = "Static"
        
        #Open the SCPK file to grab the THEIRSCE file
        with open(scpkFileName, "rb") as scpk:
            theirsce = self.get_theirsce_from_scpk(scpk)
            
+            if (scpkFileName.endswith(".scpk")):
+                with open("Debug/{}.theirsce".format( self.get_file_name(scpkFileName)), "wb") as f:
+                    f.write(theirsce.read())
+        theirsce.seek(0)
        #Validate the header
        header = theirsce.read(8)
        if header != b"THEIRSCE":
@@ -205,6 +278,7 @@ class ToolsTOR(ToolsTales):
        pointers_offset, texts_offset = self.extraxtStoryPointers(theirsce, strings_offset, fsize)
        
        
+        
        #Extract the text from each pointers
        textList = []
        for i in range(len(texts_offset)):
@@ -233,11 +307,135 @@ class ToolsTOR(ToolsTales):
        with open(os.path.join( self.storyPathXML, self.get_file_name(scpkFileName)+".xml"), "wb") as xmlFile:
            xmlFile.write(txt)
        
+    def getNewTheirsce(self, theirsce, scpkFileName):
+        
+        #To store the new text_offset and pointers to update
+        new_text_offsets = dict()
+        
+        #Grab strings_offset for pointers
+        theirsce.read(12)
+        strings_offset = struct.unpack("<L", theirsce.read(4))[0]
+        print(strings_offset)
+              
+        #Read the XML for the corresponding THEIRSCE
+        file = self.storyPathXML+ self.get_file_name(scpkFileName)+'.xml'
+        print("XML : {}".format(self.get_file_name(scpkFileName)+'.xml'))
+        tree = etree.parse(file)
+        root = tree.getroot()
+        
+        theirsce.seek(strings_offset+1)
+        for entry_node in root.iter("Entry"):
+            
+            #Add the PointerOffset and TextOffset
+            new_text_offsets[entry_node.find("PointerOffset").text] = theirsce.tell()
+            
+            #Grab the fields from the Entry in the XML
+            status = entry_node.find("Status").text
+            japanese_text = entry_node.find("JapaneseText").text
+            english_text = entry_node.find("EnglishText").text
+            
+            #Use the values only for Status = Done and use English if non empty
+            final_text = ''
+            if (status == "Done"):
+                final_text = english_text or japanese_text or ''
+            else:
+                final_text = japanese_text or ''
+            
+
+            #Convert the text values to bytes using TBL, TAGS, COLORS, ...
+            bytesEntry = self.textToBytes(final_text)
+
+            #Write to the file
+            theirsce.write(bytesEntry + b'\x00')
+            
+        #Update the pointers
+        for pointer_offset, text_offset in new_text_offsets.items():
+            
+            theirsce.seek(int(pointer_offset))
+            theirsce.write( struct.pack("<H", text_offset - strings_offset))
+            
+        return theirsce
+            
+    #Repack SCPK files for Story
+    def insertStoryFile(self, scpkFileName):
+        
+        #Copy the original SCPK file to the folder used for the new version
+        shutil.copy( self.datPathExtract + "SCPK/" + scpkFileName, self.storyPathArchives + scpkFileName)
+        
+        #Open the new SCPK file in Read+Write mode
+        with open( self.storyPathArchives + scpkFileName, 'r+b') as scpk:
+              
+            
+            #Get nb_files and files_size
+            scpk.read(4)
+            scpk.read(4)
+            nb_files = struct.unpack("<L", scpk.read(4))[0]
+            scpk.read(4)
+            file_size_dict = dict()
+            for i in range(nb_files):
+                pointer_offset = scpk.tell()
+                file_size_dict[struct.unpack("<L", scpk.read(4))[0]] = pointer_offset
+                         
+            #Extract each files and append to the final data_final
+            dataFinal = b''
+            pos = scpk.tell()
+            for fsize, pointer_offset in file_size_dict.items():
+                
+                data = scpk.read(fsize)
+                
+                data_compressed = data
+                if self.is_compressed(data):
+                    
+                    data_uncompressed = comptolib.decompress_data(data)
+
+                    if data_uncompressed[:8] == b"THEIRSCE":
+                        
+                        #Only for debug to have  the original THEIRSCE
+                        #with open("test_original_comp.theirsce", "wb") as f:
+                        #    print("Size original: {}".format(len(data_uncompressed)))
+                        #    f.write(data)
+                        #with open("test_original.theirsce", "wb") as f:
+                        #    f.write(data_uncompressed)
+                            
+                        #Update THEIRSCE uncompressed file and write to a test file
+                        theirsce = self.getNewTheirsce(io.BytesIO(data_uncompressed), scpkFileName)
+                        
+                        theirsce.seek(0)
+                        data_new_uncompressed = theirsce.read()
+                        print("Size new: {}".format(len(data_new_uncompressed)))
+                        #Only for debug to have  the new THEIRSCE
+                        
+                        
+                        #Compress the new THEIRSCE file
+                        c_type = struct.unpack("<b", data[:1])[0]
+                        print(c_type)
+                        data_compressed = comptolib.compress_data(data_new_uncompressed, version=c_type)
+                    
+                        #with open("test_new_comp.theirsce", "wb") as f:               
+                        #    f.write(data_compressed)
+                            
+                        #with open("test_new.theirsce", "wb") as f:
+                        #    f.write(data_uncompressed)
+                            
+                        #Updating the header of the SCPK file to adjust the size
+                        new_size = len(data_new_uncompressed)
+                        if (new_size > len(data_uncompressed)):
+                            
+                            scpk.seek( pointer_offset)
+                            scpk.write( struct.pack("<I", new_size))
+                            
+                dataFinal += data_compressed
+                
+            
+            scpk.seek(pos)
+            scpk.write(dataFinal)
+            
+    
    # Extract the file DAT.BIn to the different directorties
    def extractMainArchive(self):
        
     
-        f = open( self.datBinPath, "rb")
+        f = open( self.datBinOriginal, "rb")
    
        pointers = self.get_pointers()
        total_files = len(pointers)
@@ -253,7 +451,8 @@ class ToolsTOR(ToolsTales):
                continue
            data = f.read(size)
            file_name = "%05d" % i
-    
+            
+            
            if self.is_compressed(data):
                c_type = struct.unpack("<b", data[:1])[0]
                data = comptolib.decompress_data(data)
@@ -271,7 +470,6 @@ class ToolsTOR(ToolsTales):
                    file_name,
                    extension,
                )
-            
            folderPath = os.path.join( self.datPathExtract, extension.upper())
            self.mkdir( folderPath )
    
@@ -280,4 +478,75 @@ class ToolsTOR(ToolsTales):
            print("Writing file %05d/%05d..." % (i, total_files), end="\r")
    
        print("Writing file %05d/%05d..." % (i, total_files))
-        f.close()
+        f.close()
+        
+    def insertMainArchive(self):
+        sectors = [0]
+        remainders = []
+        buffer = 0
+    
+        output_dat_path = self.datBinNew
+        output_dat = open(output_dat_path, "wb")
+    
+        print("Packing files into %s..." % os.path.basename(output_dat_path))
+        
+        #Make a list with all the files of DAT.bin
+        file_list = []
+        for path, subdir, filenames in os.walk(r"G:\TalesHacking\PythonLib_Playground\Data\DAT"):
+            if len(filenames) > 0:
+                file_list.extend( [os.path.join(path,file) for file in filenames])
+            
+            
+        list_test = [os.path.splitext(os.path.basename(ele))[0] for ele in file_list]
+        previous = -1
+        dummies = 0
+    
+        for file in sorted(file_list, key=self.get_file_name):
+            size = 0
+            remainder = 0
+            current = int(re.search(self.VALID_FILE_NAME, file).group(1))
+    
+            if current != previous + 1:
+                while previous < current - 1:
+                    remainders.append(remainder)
+                    buffer += size + remainder
+                    sectors.append(buffer)
+                    previous += 1
+                    dummies += 1
+    
+            comp_type = re.search(self.VALID_FILE_NAME, file).group(2)
+            with open(file, "rb") as f2:
+                data = f2.read()
+                
+            if comp_type != None:
+                data = comptolib.compress_data(data, version=int(comp_type))
+        
+            output_dat.write(data)
+            size = len(data)
+            print("file: {}   size: {}".format(file, size))
+            remainder = 0x40 - (size % 0x40)
+            if remainder == 0x40:
+                remainder = 0
+            output_dat.write(b"\x00" * remainder)
+          
+    
+            remainders.append(remainder)
+            buffer += size + remainder
+            sectors.append(buffer)
+            previous += 1
+    
+            print(
+                "Writing file %05d/%05d..." % (current - dummies, len(file_list)), end="\r"
+            )
+    
+        print("Writing file %05d/%05d..." % (current - dummies, len(file_list)))
+        
+        shutil.copy( self.elfOriginal, self.elfNew)
+        output_elf = open(self.elfNew, "r+b")
+        output_elf.seek(self.POINTERS_BEGIN)
+    
+        for i in range(len(sectors) - 1):
+            output_elf.write(struct.pack("<L", sectors[i] + remainders[i]))
+    
+        output_dat.close()
+        output_elf.close()
--- a/ToolsTales.py
+++ b/ToolsTales.py
@@ -207,52 +207,7 @@ class ToolsTales:
            yield i
            i = s.find(p, i+1)
    
-    def bytesToText(self, text):
-        print("Converting")
-        
-        
-        def findall(p, s):
-            '''Yields all the positions of
-            the pattern p in the string s.'''
-            i = s.find(p)
-            while i != -1:
-                yield i
-                i = s.find(p, i+1)
-            
-            
-        
-        text = '[Veigue] is a nice guy'
-        textInitial = text
-        dictFound = dict()
-        listFoundPositions = []
-        listKeys = []
-        listValues = []
-        
-        #Loop over all elements of the tbl file
-        #key is in bytes
-        #value is the text
-        tblDict = dict()
-        for key,value in tblDict.items():
-            
-            #Look for all the matches 
-            matches = [i for i in findall(value, textInitial) if i not in listFoundPositions]
-            
-            lenMatches = len(matches)
-            if lenMatches > 0:
-                print(value)
-                text = text.replace(value, '')  
-                
-                lenValue = len(value)
-                x = [listFoundPositions.extend( list(range(posStart, posStart+lenValue))) for posStart in matches]
-                listKeys.extend( matches)
-                listValues.extend( [key] * lenMatches)
-            if text == "":
-                break
-        
-            b''.join([listValues[pos] for pos in sorted( listKeys)])
-                
-  
-    
+
            
        
        
--- a/pycache/ToolsTOR.cpython-38.pyc
+++ b/pycache/ToolsTOR.cpython-38.pyc
--- a/pycache/ToolsTales.cpython-38.pyc
+++ b/pycache/ToolsTales.cpython-38.pyc
--- a/bytes.bin
+++ b/bytes.bin
--- a/createIsoTest.py
+++ b/createIsoTest.py
@@ -0,0 +1,77 @@
+
+import sys
+import os
+try:
+    from cStringIO import StringIO as BytesIO
+except ImportError:
+    from io import BytesIO
+
+# Import pycdlib itself.
+import pycdlib
+
+def get_file_name(path):
+    return os.path.basename(path)
+    
+
+# Create a new PyCdlib object.
+iso = pycdlib.PyCdlib()
+iso.open("Tales of Rebirth (Japan) - Copie.iso")
+outiso = BytesIO()
+
+iso.write_fp(outiso)
+iso.close()
+outiso.seek(0)
+dataOriginal = outiso.read()
+
+
+
+iso = pycdlib.PyCdlib()
+outiso.seek(0)
+iso.open_fp(outiso)
+
+
+with open("Tales of Rebirth (Japan) - Copie.iso", "rb") as f:
+    dataIso = f.read()
+
+
+
+
+#Grab datBin files
+newDatBinPath = "../Data/Disc/New/Dat.bin"
+with open(newDatBinPath, "rb") as datbin:
+    datbin_data = datbin.read()
+
+    
+#Grab SLPS file
+newElfPath = "../Data/Disc/New/SLPS_254.50"
+with open(newElfPath, "rb") as slps:
+    slps_data = slps.read()
+
+
+with open("Tales of Rebirth (Japan) - Copie.iso", "r+b") as f:
+    
+    #DAT.bin
+    f.seek(0x6775E800)
+    f.write(datbin_data)
+    
+    f.seek(0x89000)
+    f.write(slps_data)
+    
+
+    
+originalFilePath = "../Data/Disc/Original"
+listFiles = [os.path.join(originalFilePath, ele) for ele in os.listdir(originalFilePath) if ele not in ['DAT.BIN', 'SLPS_254.50']]
+
+for file in listFiles:
+    with open(file, "rb") as f:
+        data = f.read()
+        iso.add_fp(BytesIO(data), len(data), '/{};1'.format(os.path.basename(file)))
+
+
+# Write out the ISO to the file called 'new.iso'.  This will fully master the
+# ISO, creating a file that can be burned onto a CD.
+iso.write('new.iso')
+
+# Close the ISO object.  After this call, the PyCdlib object has forgotten
+# everything about the previous ISO, and can be re-used.
+iso.close()
--- a/test_new.theirsce
+++ b/test_new.theirsce
--- a/test_new_comp.theirsce
+++ b/test_new_comp.theirsce
--- a/test_original.theirsce
+++ b/test_original.theirsce
--- a/test_original_comp.theirsce
+++ b/test_original_comp.theirsce