Various USM fixes coming from samples in issue #4

mos9527 · mos9527 · commit 902c035cdd24 · 2025-12-23T10:49:50.000+08:00
usm: USM cipher identity fix
usm: Always prepend header data
usm: Allow HCACodec key specification in get_audios
Add `save()` helper methods to builder classes
diff --git a/PyCriCodecsEx/acb.py b/PyCriCodecsEx/acb.py
@@ -320,3 +320,16 @@ def build(self) -> bytes:
         # Check whether all AWB indices are valid
         binary = UTFBuilder(self.acb.dictarray, encoding=self.acb.encoding, table_name=self.acb.table_name)
         return binary.bytes()
+
+    def save(self, filepath: str) -> None:
+        """Saves the built ACB to a file.
+
+        The ACB is built in memory before the destination is opened, so a
+        failing `build()` cannot truncate an existing file.
+
+        Args:
+            filepath (str): The path to save the ACB file to.
+        """
+        data = self.build()
+        with open(filepath, "wb") as f:
+            f.write(data)
diff --git a/PyCriCodecsEx/awb.py b/PyCriCodecsEx/awb.py
@@ -165,4 +165,17 @@ def build(self) -> bytes:
             if len(fl) % self.align != 0 and idx != len(self.infiles) - 1:
                 fl = fl.ljust(len(fl) + (self.align - (len(fl) % self.align)), b"\x00")
             outfile.write(fl)
-        return outfile.getvalue()
+        return outfile.getvalue()
+
+    def save(self, filepath: str) -> None:
+        """Saves the built AWB to a file.
+
+        The AWB is built in memory before the destination is opened, so a
+        failing `build()` cannot truncate an existing file.
+
+        Args:
+            filepath (str): The path to save the AWB file to.
+        """
+        data = self.build()
+        with open(filepath, "wb") as f:
+            f.write(data)
diff --git a/PyCriCodecsEx/usm.py b/PyCriCodecsEx/usm.py
@@ -21,6 +21,7 @@ class USMCrypt:
     videomask2: bytearray
     audiomask: bytearray
     usm_key: int = 0
+
     def init_key(self, key: str):
         if type(key) == str:
             if len(key) <= 16:
@@ -97,13 +98,17 @@ def init_key(self, key: str):
                 self.audiomask[x] = self.videomask2[x]
 
     # Decrypt SFV chunks or ALP chunks, should only be used if the video data is encrypted.
     def VideoMask(self, memObj: bytearray) -> bytearray:
         head = memObj[:0x40]
         memObj = memObj[0x40:]
         size = len(memObj)
         # memObj len is a cached property, very fast to lookup
         if size <= 0x200:
             return head + memObj
+        # The payload is modified through a writable memoryview, so it must be a bytearray.
+        # Validate with an explicit raise: an `assert` would vanish under `python -O`.
+        if not isinstance(memObj, bytearray):
+            raise TypeError("memObj must be a bytearray.")
         data_view = memoryview(memObj).cast("Q")
 
         # mask 2
@@ -112,24 +114,60 @@ def VideoMask(self, memObj: bytearray) -> bytearray:
         vmask = self.videomask2
         vmask_view = memoryview(vmask).cast("Q")
 
-        mask_index = 0
-
         for i in range(32, size // 8):
-            data_view[i] ^= mask_view[mask_index]
-            mask_view[mask_index] = data_view[i] ^ vmask_view[mask_index]
-            mask_index = (mask_index + 1) % 4
-
+            data_view[i] ^= mask_view[i % 4]
+            mask_view[i % 4] = data_view[i] ^ vmask_view[i % 4]
+
         # mask 1
         mask = bytearray(self.videomask1)
         mask_view = memoryview(mask).cast("Q")
-        mask_index = 0
         for i in range(32):
-            mask_view[mask_index] ^= data_view[i + 32]
-            data_view[i] ^= mask_view[mask_index]
-            mask_index = (mask_index + 1) % 4
-
+            mask_view[i % 4] ^= data_view[i + 32]
+            data_view[i] ^= mask_view[i % 4]
         return head + memObj
 
+    # Encrypt SFV chunks or ALP chunks, should only be used if the video data needs to be encrypted.
+    def VideoMaskInv(self, memObj: bytearray) -> bytearray:
+        """Encrypts a video chunk; applies the `VideoMask` passes in reverse order (mask 1, then mask 2).
+
+        Args:
+            memObj (bytearray): The chunk to encrypt. The first 0x40 bytes are kept as-is;
+                the remainder is XOR-masked as 64-bit words, so its length must be a
+                multiple of 8.
+
+        Returns:
+            bytearray: The untouched 0x40-byte head followed by the masked payload. Chunks
+                whose payload is 0x200 bytes or shorter are returned unmodified.
+
+        Raises:
+            TypeError: If the payload is longer than 0x200 bytes and `memObj` is not a bytearray.
+        """
+        head = memObj[:0x40]
+        memObj = memObj[0x40:]
+        size = len(memObj)
+        if size <= 0x200:
+            return head + memObj
+        # The payload is modified through a writable memoryview, so it must be a bytearray.
+        # Validate with an explicit raise: an `assert` would vanish under `python -O`.
+        if not isinstance(memObj, bytearray):
+            raise TypeError("memObj must be a bytearray.")
+        data_view = memoryview(memObj).cast("Q")
+
+        # mask 1: words 0..31 are keyed by words 32..63, which are still plaintext here
+        mask_view = memoryview(bytearray(self.videomask1)).cast("Q")
+        for i in range(32):
+            mask_view[i % 4] ^= data_view[i + 32]
+            data_view[i] ^= mask_view[i % 4]
+
+        # mask 2: the rolling mask is advanced with the plaintext word, so save it first
+        mask_view = memoryview(bytearray(self.videomask2)).cast("Q")
+        vmask_view = memoryview(self.videomask2).cast("Q")
+        for i in range(32, size // 8):
+            plain = data_view[i]
+            data_view[i] ^= mask_view[i % 4]
+            mask_view[i % 4] = plain ^ vmask_view[i % 4]
+        return head + memObj
+
     # Decrypts SFA chunks, should just be used with ADX files.
     def AudioMask(self, memObj: bytearray) -> bytearray:
         head = memObj[:0x140]
@@ -202,7 +228,7 @@ def framerate(self):
         # Lesson learned. Do NOT trust the metadata.
         # num, denom = self.stream["r_frame_rate"].split("/")
         # return int(int(num) / int(denom))
-        return 1 / min((dt for _, _, _, dt in self.frames()))
+        return 1 / min((dt for _, _, _, dt in self.frames() if dt))
 
     @cached_property
     def avg_framerate(self):
@@ -211,7 +237,7 @@ def avg_framerate(self):
         # if avg_frame_rate:
         #     num, denom = avg_frame_rate.split("/")
         #     return int(int(num) / int(denom))
-        return self.frame_count / sum((dt for _, _, _, dt in self.frames()))
+        return self.frame_count / sum((dt for _, _, _, dt in self.frames() if dt))
 
     @property
     def packets(self):
@@ -232,7 +258,8 @@ def frame_count(self):
     def frames(self):
         """Generator of [frame data, frame dict, is keyframe, duration]"""
         offsets = [int(packet["pos"]) for packet in self.packets] + [self.filesize]
-        for i, frame in enumerate(self.packets):
+        offsets[0] = 0 # Includes the metadata packet as well
+        for i, frame in enumerate(self.packets):            
             frame_size = offsets[i + 1] - offsets[i]
             self.file.seek(offsets[i])
             raw_frame = self.file.read(frame_size)
@@ -266,8 +293,9 @@ def generate_SFV(self, builder: "USMBuilder"):
                 0,
                 0,
             )
+            data += b"\x00" * padlen
             if builder.encrypt:
-                data = builder.VideoMask(data)
+                data = builder.VideoMaskInv(bytearray(data))
             SFV_chunk += data
             SFV_chunk = SFV_chunk.ljust(datalen + 0x18 + padlen + 0x8, b"\x00")
             SFV_list.append(SFV_chunk)
@@ -354,7 +382,7 @@ def __init__(self, filename : str | BinaryIO, key: str | int = None):
 
         Args:
             filename (str): The path to the USM file.
-            key (str, optional): The decryption key. Either int64 or a hex string. Defaults to None.
+            key (str | int, optional): The USM decryption key. Either int64 or a hex string. Defaults to None.
         """
         self.filename = filename
         self.decrypt = False
@@ -507,19 +535,19 @@ def get_video(self) -> VP9Codec | H264Codec | MPEG1Codec:
         stream.filename = sfname
         return stream
 
-    def get_audios(self, hca_key = 0, hca_subkey = 0) -> List[ADXCodec | HCACodec]:
+    def get_audios(self, hca_key = -1, hca_subkey = 0) -> List[ADXCodec | HCACodec]:
         """Create a list of audio codecs from the available streams.
         
         Args:
-            hca_key (int, optional): The HCA decryption key. Either int64 or a hex string. Defaults to 0 - in which
+            hca_key (int, optional): The HCA decryption key. Either int64 or a hex string. Defaults to -1, in which
                                      case the key for USM (if used) would also be used for HCA decryption.
             hca_subkey (int, optional): The HCA decryption subkey. Either int64 or a hex string. Defaults to 0.
         """
         match self.audio_codec:
             case ADXCodec.AUDIO_CODEC:
                 return [ADXCodec(s[2], s[1]) for s in self.streams if s[0] == USMChunckHeaderType.SFA.value]
             case HCACodec.AUDIO_CODEC:
-                return [HCACodec(s[2], s[1], key=hca_key or self.usm_key, subkey=hca_subkey) for s in self.streams if s[0] == USMChunckHeaderType.SFA.value] # HCAs are never encrypted in USM
+                return [HCACodec(s[2], s[1], key=hca_key if hca_key != -1 else self.usm_key, subkey=hca_subkey) for s in self.streams if s[0] == USMChunckHeaderType.SFA.value] # HCAs are never encrypted in USM
             case _:
                 return []
 
@@ -530,23 +558,23 @@ class USMBuilder(USMCrypt):
 
     key: int = None
     encrypt: bool = False
-    encrypt_audio: bool = False
 
     def __init__(
         self,
-        key = None,
-        encrypt_audio = False
+        key = None
     ) -> None:
         """Initialize the USMBuilder from set source files.
 
         Args:
-            key (str | int, optional): The encryption key. Either int64 or a hex string. Defaults to None.
-            encrypt_audio (bool, optional): Whether to also encrypt the audio. Defaults to False.
+            key (str | int, optional): The USM encryption key. Either int64 or a hex string. Defaults to None.
+        
+        Note:
+            For a USM built with a key, HCA audio streams *usually* use that same key for encryption.
+            When adding HCA audio streams, make sure each HCACodec is itself initialized with a key.
         """
         if key:
             self.init_key(key)
             self.encrypt = True
-        self.encrypt_audio = encrypt_audio
         self.audio_streams = []
 
     def add_video(self, video : str | H264Codec | VP9Codec | MPEG1Codec):
@@ -624,6 +652,19 @@ def chunk_key_sort(chunk):
         self.usm += chunks
         return self.usm
 
+    def save(self, filepath: str) -> None:
+        """Saves the built USM to a file.
+
+        The USM is built in memory before the destination is opened, so a
+        failing `build()` cannot truncate an existing file.
+
+        Args:
+            filepath (str): The path to save the USM file to.
+        """
+        data = self.build()
+        with open(filepath, "wb") as f:
+            f.write(data)
+
     def _build_header(
         self, SFV_list: list, SFA_chunks: list, SBT_chunks: list  # TODO: Not used
     ) -> bytes:
diff --git a/Tests/issue4.py b/Tests/issue4.py
@@ -1,41 +1,74 @@
 # USM Sample from Digimon Story: Cyber Sleuth (PC)
 # Uses same key for both HCA and USM decryption
-# HCA Key {2897314143465725881}, // 283553DCE3FD5FB9
-# USM Key 2897314143465725881
+USM_KEY = 2897314143465725881  # 0x283553DCE3FD5FB9
 from . import sample_file_path, temp_file_path
-from PyCriCodecsEx.usm import USM, USMBuilder, ADXCodec, HCACodec
-
-def test_usm_decode_and_mux():
-    usm = USM(temp_file_path('S01_B.usm'), 2897314143465725881)
+from PyCriCodecsEx.usm import USM, USMBuilder, ADXCodec, HCACodec, VP9Codec
+import os
+import ffmpeg
+
+
+def mux_av(video_src: str, audio_src: str, output: str, delete: bool = False):
+    """Mux one video and one audio file into `output` with ffmpeg, copying both streams.
+
+    When `delete` is true, the two source files are removed afterwards.
+    """
+    (
+        ffmpeg.output(
+            ffmpeg.input(video_src),
+            ffmpeg.input(audio_src),
+            output,
+            vcodec='copy',
+            acodec='copy',
+        ).overwrite_output()
+    ).run()
+    if delete:
+        print('* Cleaning up temporary files')
+        os.unlink(video_src)
+        os.unlink(audio_src)
+    print(f'* Result available at: {output}')
+
+
+def decode_one(path: str):
+    """Open the USM at `path` with USM_KEY and return (first audio stream or None, video)."""
+    usm = USM(path, USM_KEY)
     audio = usm.get_audios()
     video = usm.get_video()
     audio = audio[0] if audio else None
-    # Mux into MP4
-    import ffmpeg, os
-    def mux_av(video_src: str, audio_src: str, output: str, delete: bool = False):
-        (        
-            ffmpeg.output(
-                ffmpeg.input(video_src), 
-                ffmpeg.input(audio_src),
-                output, 
-                vcodec='copy',
-                acodec='copy',
-            ).overwrite_output()
-        ).run()
-        if delete:
-            print('* Cleaning up temporary files')        
-            os.unlink(video_src)
-            os.unlink(audio_src)
-        print(f'* Result available at: {output}')
-    saved_video = temp_file_path('tmp_video.mp4')
-    saved_audio = temp_file_path('tmp_audio.wav')
-    saved_hca = temp_file_path('tmp_audio.hca')
-    result = temp_file_path('muxed_result1.mp4')
-    open(saved_hca,'wb').write(audio.get_hca())
+    return audio, video
+
+
+def test_usm_decode_and_mux():
+    """Round-trip S01_B.usm: decode and mux it, rebuild a USM from the output, then decode and mux that."""
+    saved_video = temp_file_path('tmp_video.ivf') # <- must be IVF container
+    saved_audio = temp_file_path('tmp_audio.wav')
+    result = temp_file_path('muxed_result1.mp4')
+    # Decode
+    audio, video = decode_one(temp_file_path('S01_B.usm'))
+    # decode_one yields None when the USM has no audio stream; fail here with a clear message
+    assert audio is not None, 'S01_B.usm should contain an audio stream'
     video.save(saved_video)
     audio.save(saved_audio)
+    # Mux
     mux_av(saved_video, saved_audio, result)
     print('Remux Done.')
+    # Rebuild
+    usm_builder = USMBuilder(USM_KEY)
+    usm_builder.add_video(saved_video)
+    usm_builder.add_audio(HCACodec(saved_audio, key=USM_KEY))
+    rebuilt_usm_path = temp_file_path('rebuilt_usm.usm')
+    usm_builder.save(rebuilt_usm_path)
+    print(f'Rebuilt USM saved at: {rebuilt_usm_path}')
+    # Decode again
+    audio2, video2 = decode_one(rebuilt_usm_path)
+    assert audio2 is not None, 'rebuilt USM should contain an audio stream'
+    saved_video2 = temp_file_path('tmp_video2.ivf') # <- must be IVF container
+    saved_audio2 = temp_file_path('tmp_audio2.wav')
+    result2 = temp_file_path('muxed_result2.mp4')
+    video2.save(saved_video2)
+    audio2.save(saved_audio2)
+    # Mux again
+    mux_av(saved_video2, saved_audio2, result2)
+    print('Remux Done (decode-mux).')
 
 if __name__ == "__main__":
     test_usm_decode_and_mux()