123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301 |
- #-----------------------------------------------------------------------------
- # Copyright (c) 2005-2021, PyInstaller Development Team.
- #
- # Distributed under the terms of the GNU General Public License (version 2
- # or later) with exception for distributing the bootloader.
- #
- # The full license is in the file COPYING.txt, distributed with this software.
- #
- # SPDX-License-Identifier: (GPL-2.0-or-later WITH Bootloader-exception)
- #-----------------------------------------------------------------------------
- # TODO clean up this module
- # Subclasses may not need marshal or struct, but since they are builtin, importing is safe.
- #
- # While an Archive is really an abstraction for any "filesystem within a file", it is tuned for use with the
- # imputil.FuncImporter. This assumes it contains python code objects, indexed by the the internal name (i.e.,
- # without '.py' suffix).
- # See pyi_carchive.py for a more general archive (contains anything) that can be understood by a C program.
- # **NOTE** This module is used during bootstrap.
- # Import *ONLY* builtin modules.
- import _thread as thread
- import marshal
- import struct
- import sys
- import zlib
- # For decrypting Python modules.
- CRYPT_BLOCK_SIZE = 16
- # content types for PYZ
- PYZ_TYPE_MODULE = 0
- PYZ_TYPE_PKG = 1
- PYZ_TYPE_DATA = 2
- PYZ_TYPE_NSPKG = 3 # PEP-420 namespace package
- class FilePos(object):
- """
- This class keeps track of the file object representing and current position in a file.
- """
- def __init__(self):
- # The file object representing this file.
- self.file = None
- # The position in the file when it was last closed.
- self.pos = 0
- class ArchiveFile(object):
- """
- File class support auto open when access member from file object This class is use to avoid file locking on windows.
- """
- def __init__(self, *args, **kwargs):
- self.args = args
- self.kwargs = kwargs
- self._filePos = {}
- def local(self):
- """
- Return an instance of FilePos for the current thread. This is a crude # re-implementation of threading.local,
- which isn't a built-in module # and therefore isn't available.
- """
- ti = thread.get_ident()
- if ti not in self._filePos:
- self._filePos[ti] = FilePos()
- return self._filePos[ti]
- def __getattr__(self, name):
- """
- Make this class act like a file, by invoking most methods on its underlying file object.
- """
- file = self.local().file
- assert file
- return getattr(file, name)
- def __enter__(self):
- """
- Open file and seek to pos record from last close.
- """
- # The file shouldn't be open yet.
- fp = self.local()
- assert not fp.file
- # Open the file and seek to the last position.
- fp.file = open(*self.args, **self.kwargs)
- fp.file.seek(fp.pos)
- def __exit__(self, type, value, traceback):
- """
- Close file and record pos.
- """
- # The file should still be open.
- fp = self.local()
- assert fp.file
- # Close the file and record its position.
- fp.pos = fp.file.tell()
- fp.file.close()
- fp.file = None
- class ArchiveReadError(RuntimeError):
- pass
- class ArchiveReader(object):
- """
- A base class for a repository of python code objects. The extract method is used by imputil.ArchiveImporter to
- get code objects by name (fully qualified name), so an end-user "import a.b" becomes:
- extract('a.__init__')
- extract('a.b')
- """
- MAGIC = b'PYL\0'
- HDRLEN = 12 # default is MAGIC followed by python's magic, int pos of toc
- TOCPOS = 8
- os = None
- _bincache = None
- def __init__(self, path=None, start=0):
- """
- Initialize an Archive. If path is omitted, it will be an empty Archive.
- """
- self.toc = None
- self.path = path
- self.start = start
- # In Python3, the MAGIC_NUMBER value is available in the importlib module. However, in the bootstrap phase
- # we cannot use importlib directly, but rather its frozen variant.
- import _frozen_importlib
- self.pymagic = _frozen_importlib._bootstrap_external.MAGIC_NUMBER
- if path is not None:
- self.lib = ArchiveFile(self.path, 'rb')
- with self.lib:
- self.checkmagic()
- self.loadtoc()
- def loadtoc(self):
- """
- Overridable. Default: After magic comes an int (4 byte native) giving the position of the TOC within
- self.lib. Default: The TOC is a marshal-able string.
- """
- self.lib.seek(self.start + self.TOCPOS)
- (offset,) = struct.unpack('!i', self.lib.read(4))
- self.lib.seek(self.start + offset)
- # Use marshal.loads() since load() arg must be a file object. Convert the loaded list into a dict for
- # faster access.
- self.toc = dict(marshal.loads(self.lib.read()))
- #------ This is what is called by FuncImporter ------
- def is_package(self, name):
- ispkg, pos = self.toc.get(name, (0, None))
- if pos is None:
- return None
- return bool(ispkg)
- #------ Core method - Override as needed ------
- def extract(self, name):
- """
- Get the object corresponding to name, or None. For use with imputil ArchiveImporter, object is a python code
- object. 'name' is the name as specified in an 'import name'. 'import a.b' becomes:
- extract('a') (return None because 'a' is not a code object)
- extract('a.__init__') (return a code object)
- extract('a.b') (return a code object)
- Default implementation:
- self.toc is a dict
- self.toc[name] is pos
- self.lib has the code object marshal-ed at pos
- """
- ispkg, pos = self.toc.get(name, (0, None))
- if pos is None:
- return None
- with self.lib:
- self.lib.seek(self.start + pos)
- # Use marshal.loads() since load() arg must be a file object.
- obj = marshal.loads(self.lib.read())
- return ispkg, obj
- #------ Informational methods ------
- def contents(self):
- """
- Return a list of the contents Default implementation assumes self.toc is a dict like object. Not required by
- ArchiveImporter.
- """
- return list(self.toc.keys())
- def checkmagic(self):
- """
- Overridable. Check to see if the file object self.lib actually has a file we understand.
- """
- self.lib.seek(self.start) # default - magic is at the start of file
- if self.lib.read(len(self.MAGIC)) != self.MAGIC:
- raise ArchiveReadError("%s is not a valid %s archive file" % (self.path, self.__class__.__name__))
- if self.lib.read(len(self.pymagic)) != self.pymagic:
- raise ArchiveReadError("%s has version mismatch to dll" % self.path)
- self.lib.read(4)
- class Cipher(object):
- """
- This class is used only to decrypt Python modules.
- """
- def __init__(self):
- # At build-time the key is given to us from inside the spec file. At bootstrap-time, we must look for it
- # ourselves, by trying to import the generated 'pyi_crypto_key' module.
- import pyimod00_crypto_key
- key = pyimod00_crypto_key.key
- assert type(key) is str
- if len(key) > CRYPT_BLOCK_SIZE:
- self.key = key[0:CRYPT_BLOCK_SIZE]
- else:
- self.key = key.zfill(CRYPT_BLOCK_SIZE)
- assert len(self.key) == CRYPT_BLOCK_SIZE
- import tinyaes
- self._aesmod = tinyaes
- # Issue #1663: Remove the AES module from sys.modules list. Otherwise it interferes with using 'tinyaes' module
- # in users' code.
- del sys.modules['tinyaes']
- def __create_cipher(self, iv):
- # The 'AES' class is stateful, and this factory method is used to re-initialize the block cipher class with
- # each call to xcrypt().
- return self._aesmod.AES(self.key.encode(), iv)
- def decrypt(self, data):
- cipher = self.__create_cipher(data[:CRYPT_BLOCK_SIZE])
- return cipher.CTR_xcrypt_buffer(data[CRYPT_BLOCK_SIZE:])
- class ZlibArchiveReader(ArchiveReader):
- """
- ZlibArchive - an archive with compressed entries. Archive is read from the executable created by PyInstaller.
- This archive is used for bundling python modules inside the executable.
- NOTE: The whole ZlibArchive (PYZ) is compressed, so it is not necessary to compress individual modules.
- """
- MAGIC = b'PYZ\0'
- TOCPOS = 8
- HDRLEN = ArchiveReader.HDRLEN + 5
- def __init__(self, path=None, offset=None):
- if path is None:
- offset = 0
- elif offset is None:
- for i in range(len(path) - 1, -1, -1):
- if path[i] == '?':
- try:
- offset = int(path[i + 1:])
- except ValueError:
- # Just ignore any spurious "?" in the path (like in Windows UNC \\?\<path>).
- continue
- path = path[:i]
- break
- else:
- offset = 0
- super().__init__(path, offset)
- # Try to import the key module. Its lack of availability indicates that the encryption is disabled.
- try:
- import pyimod00_crypto_key # noqa: F401
- self.cipher = Cipher()
- except ImportError:
- self.cipher = None
- def is_package(self, name):
- (typ, pos, length) = self.toc.get(name, (0, None, 0))
- if pos is None:
- return None
- return typ in (PYZ_TYPE_PKG, PYZ_TYPE_NSPKG)
- def is_pep420_namespace_package(self, name):
- (typ, pos, length) = self.toc.get(name, (0, None, 0))
- if pos is None:
- return None
- return typ == PYZ_TYPE_NSPKG
- def extract(self, name):
- (typ, pos, length) = self.toc.get(name, (0, None, 0))
- if pos is None:
- return None
- with self.lib:
- self.lib.seek(self.start + pos)
- obj = self.lib.read(length)
- try:
- if self.cipher:
- obj = self.cipher.decrypt(obj)
- obj = zlib.decompress(obj)
- if typ in (PYZ_TYPE_MODULE, PYZ_TYPE_PKG, PYZ_TYPE_NSPKG):
- obj = marshal.loads(obj)
- except EOFError as e:
- raise ImportError("PYZ entry '%s' failed to unmarshal" % name) from e
- return typ, obj
|