pyffi.formats.bsa

Last Built: Mar 06, 2020

Source code for pyffi.formats.bsa

"""
:mod:`pyffi.formats.bsa` --- Bethesda Archive (.bsa)
====================================================

.. warning::

   This module is still a work in progress,
   and is not yet ready for production use.

A .bsa file is an archive format used by Bethesda (Morrowind, Oblivion,
Fallout 3).

Implementation
--------------

.. autoclass:: BsaFormat
   :show-inheritance:
   :members:

Regression tests
----------------

Read a BSA file
^^^^^^^^^^^^^^^
>>> # check and read bsa file
>>> from os.path import dirname
>>> dirpath = __file__
>>> for i in range(4): #recurse up to root repo dir
...     dirpath = dirname(dirpath)
>>> repo_root = dirpath
>>> format_root = os.path.join(repo_root, 'tests', 'formats', 'bsa')
>>> stream = open(os.path.join(format_root, 'test.bsa'), 'rb')
>>> data = BsaFormat.Data()
>>> data.inspect_quick(stream)
>>> data.version
103
>>> data.inspect(stream)
>>> data.folders_offset
36
>>> hex(data.archive_flags.get_attributes_values(data))
'0x703'
>>> data.num_folders
1
>>> data.num_files
7
>>> #data.read(stream)
>>> # TODO check something else...

Parse all BSA files in a directory tree
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
>>> for stream, data in BsaFormat.walkData(format_root):
...     try:
...         # the replace call makes the doctest also pass on windows
...         os_path = stream.name
...         split = (os_path.split(os.sep))[-4:]
...         rejoin = os.path.join(*split).replace(os.sep, "/")
...         print("reading %s" % rejoin)
...         data.read(stream)
...     except Exception:
...         print(
...             "Warning: read failed due corrupt file,"
...             " corrupt format description, or bug.") # doctest: +REPORT_NDIFF
reading tests/formats/bsa/test.bsa

Create an BSA file from scratch and write to file
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^

>>> data = BsaFormat.Data()
>>> # TODO store something...
>>> from tempfile import TemporaryFile
>>> stream = TemporaryFile()
>>> #data.write(stream)
"""

# ***** BEGIN LICENSE BLOCK *****
#
# Copyright (c) 2007-2012, Python File Format Interface
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
#
#    * Redistributions of source code must retain the above copyright
#      notice, this list of conditions and the following disclaimer.
#
#    * Redistributions in binary form must reproduce the above
#      copyright notice, this list of conditions and the following
#      disclaimer in the documentation and/or other materials provided
#      with the distribution.
#
#    * Neither the name of the Python File Format Interface
#      project nor the names of its contributors may be used to endorse
#      or promote products derived from this software without specific
#      prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
# FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
# COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
# INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
# BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
# LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
# ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
# POSSIBILITY OF SUCH DAMAGE.
#
# ***** END LICENSE BLOCK *****


import logging
import struct
import os
import re

import pyffi.object_models.xml
import pyffi.object_models.common
from pyffi.object_models.xml.basic import BasicBase
import pyffi.object_models
from pyffi.utils.graph import EdgeFilter


[docs]class BsaFormat(pyffi.object_models.xml.FileFormat): """This class implements the BSA format.""" xml_file_name = 'bsa.xml' # where to look for bsa.xml and in what order: # BSAXMLPATH env var, or BsaFormat module directory xml_file_path = [os.getenv('BSAXMLPATH'), os.path.dirname(__file__)] # file name regular expression match RE_FILENAME = re.compile(r'^.*\.bsa$', re.IGNORECASE) # basic types UInt32 = pyffi.object_models.common.UInt ZString = pyffi.object_models.common.ZString # implementation of bsa-specific basic types
[docs] class Hash(pyffi.object_models.common.UInt64): def __str__(self): return "0x%016X" % self._value
[docs] def get_detail_display(self): return self.__str__()
[docs] class BZString(pyffi.object_models.common.SizedString):
[docs] def get_size(self, data=None): return 2 + len(self._value)
[docs] def read(self, stream, data=None): length, = struct.unpack('<B', stream.read(1)) self._value = stream.read(length)[:-1] # strip trailing null byte
[docs] def write(self, stream, data=None): stream.write(struct.pack('<B', len(self._value))) stream.write(self._value) stream.write(struct.pack('<B', 0))
[docs] class FileVersion(pyffi.object_models.common.UInt): """Basic type which implements the header of a BSA file.""" def __init__(self, **kwargs): BasicBase.__init__(self, **kwargs)
[docs] def read(self, stream, data): """Read header string from stream and check it. :param stream: The stream to read from. :type stream: file """ hdrstr = stream.read(4) # check if the string is correct if hdrstr == "\x00\x01\x00\x00".encode("ascii"): # morrowind style, set version too! self._value = 0 elif hdrstr == "BSA\x00".encode("ascii"): # oblivion an up: read version self._value, = struct.unpack("<I", stream.read(4)) else: raise ValueError( "invalid BSA header:" " expected '\\x00\\x01\\x00\\x00' or 'BSA\\x00'" " but got '%s'" % hdrstr)
[docs] def write(self, stream, data): """Write the header string to stream. :param stream: The stream to write to. :type stream: file """ if self._value >= 103: stream.write("BSA\x00".encode("ascii")) stream.write(struct.pack("<I", self._value)) else: stream.write("\x00\x01\x00\x00".encode("ascii"))
[docs] def get_size(self, data=None): """Return number of bytes the header string occupies in a file. :return: Number of bytes. """ return 4
[docs] @staticmethod def version_number(version_str): """Converts version string into an integer. :param version_str: The version string. :type version_str: str :return: A version integer. >>> BsaFormat.version_number('103') 103 >>> BsaFormat.version_number('XXX') -1 """ try: return int(version_str) except ValueError: # not supported return -1
[docs] class Header(pyffi.object_models.FileFormat.Data): """A class to contain the actual bsa data."""
[docs] def inspect_quick(self, stream): """Quickly checks if stream contains BSA data, and gets the version, by looking at the first 8 bytes. :param stream: The stream to inspect. :type stream: file """ pos = stream.tell() try: self._version_value_.read(stream, data=self) finally: stream.seek(pos)
# overriding pyffi.object_models.FileFormat.Data methods
[docs] def inspect(self, stream): """Quickly checks if stream contains BSA data, and reads the header. :param stream: The stream to inspect. :type stream: file """ pos = stream.tell() try: self.inspect_quick(stream) BsaFormat._Header.read(self, stream, data=self) finally: stream.seek(pos)
[docs] def read(self, stream): """Read a bsa file. :param stream: The stream from which to read. :type stream: ``file`` """ logger = logging.getLogger("pyffi.bsa.data") # inspect self.inspect_quick(stream) # read file logger.debug("Reading header at 0x%08X." % stream.tell()) BsaFormat._Header.read(self, stream, data=self) if self.version == 0: # morrowind logger.debug("Reading file records at 0x%08X." % stream.tell()) self.old_files.read(stream, data=self) logger.debug( "Reading file name offsets at 0x%08X." % stream.tell()) for old_file in self.old_files: old_file._name_offset_value_.read(stream, data=self) logger.debug("Reading file names at 0x%08X." % stream.tell()) for old_file in self.old_files: old_file._name_value_.read(stream, data=self) logger.debug("Reading file hashes at 0x%08X." % stream.tell()) for old_file in self.old_files: old_file._name_hash_value_.read(stream, data=self) # "read" the files logger.debug( "Seeking end of raw file data at 0x%08X." % stream.tell()) total_num_bytes = 0 for old_file in self.old_files: total_num_bytes += old_file.data_size stream.seek(total_num_bytes, os.SEEK_CUR) else: # oblivion and up logger.debug( "Reading folder records at 0x%08X." % stream.tell()) self.folders.read(stream, data=self) logger.debug( "Reading folder names and file records at 0x%08X." % stream.tell()) for folder in self.folders: folder._name_value_.read(stream, data=self) folder._files_value_.read(stream, data=self) logger.debug("Reading file names at 0x%08X." % stream.tell()) for folder in self.folders: for file_ in folder.files: file_._name_value_.read(stream, data=self) # "read" the files logger.debug( "Seeking end of raw file data at 0x%08X." % stream.tell()) total_num_bytes = 0 for folder in self.folders: for file_ in folder.files: total_num_bytes += file_.file_size.num_bytes stream.seek(total_num_bytes, os.SEEK_CUR) # check if we are at the end of the file if stream.read(1): raise ValueError( 'end of file not reached: corrupt bsa file?')
[docs] def write(self, stream): """Write a bsa file. :param stream: The stream to which to write. :type stream: ``file`` """ # write the file raise NotImplementedError
if __name__ == '__main__': import doctest doctest.testmod()