Initial commit
This commit is contained in:
160
PyAnalyzer-UnpackStealers/.gitignore
vendored
Normal file
160
PyAnalyzer-UnpackStealers/.gitignore
vendored
Normal file
@@ -0,0 +1,160 @@
|
||||
# Byte-compiled / optimized / DLL files
|
||||
__pycache__/
|
||||
*.py[cod]
|
||||
*$py.class
|
||||
|
||||
# C extensions
|
||||
*.so
|
||||
|
||||
# Distribution / packaging
|
||||
.Python
|
||||
build/
|
||||
develop-eggs/
|
||||
dist/
|
||||
downloads/
|
||||
eggs/
|
||||
.eggs/
|
||||
lib/
|
||||
lib64/
|
||||
parts/
|
||||
sdist/
|
||||
var/
|
||||
wheels/
|
||||
share/python-wheels/
|
||||
*.egg-info/
|
||||
.installed.cfg
|
||||
*.egg
|
||||
MANIFEST
|
||||
|
||||
# PyInstaller
|
||||
# Usually these files are written by a python script from a template
|
||||
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
||||
*.manifest
|
||||
*.spec
|
||||
|
||||
# Installer logs
|
||||
pip-log.txt
|
||||
pip-delete-this-directory.txt
|
||||
|
||||
# Unit test / coverage reports
|
||||
htmlcov/
|
||||
.tox/
|
||||
.nox/
|
||||
.coverage
|
||||
.coverage.*
|
||||
.cache
|
||||
nosetests.xml
|
||||
coverage.xml
|
||||
*.cover
|
||||
*.py,cover
|
||||
.hypothesis/
|
||||
.pytest_cache/
|
||||
cover/
|
||||
|
||||
# Translations
|
||||
*.mo
|
||||
*.pot
|
||||
|
||||
# Django stuff:
|
||||
*.log
|
||||
local_settings.py
|
||||
db.sqlite3
|
||||
db.sqlite3-journal
|
||||
|
||||
# Flask stuff:
|
||||
instance/
|
||||
.webassets-cache
|
||||
|
||||
# Scrapy stuff:
|
||||
.scrapy
|
||||
|
||||
# Sphinx documentation
|
||||
docs/_build/
|
||||
|
||||
# PyBuilder
|
||||
.pybuilder/
|
||||
target/
|
||||
|
||||
# Jupyter Notebook
|
||||
.ipynb_checkpoints
|
||||
|
||||
# IPython
|
||||
profile_default/
|
||||
ipython_config.py
|
||||
|
||||
# pyenv
|
||||
# For a library or package, you might want to ignore these files since the code is
|
||||
# intended to run in multiple environments; otherwise, check them in:
|
||||
# .python-version
|
||||
|
||||
# pipenv
|
||||
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
|
||||
# However, in case of collaboration, if having platform-specific dependencies or dependencies
|
||||
# having no cross-platform support, pipenv may install dependencies that don't work, or not
|
||||
# install all needed dependencies.
|
||||
#Pipfile.lock
|
||||
|
||||
# poetry
|
||||
# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
|
||||
# This is especially recommended for binary packages to ensure reproducibility, and is more
|
||||
# commonly ignored for libraries.
|
||||
# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
|
||||
#poetry.lock
|
||||
|
||||
# pdm
|
||||
# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
|
||||
#pdm.lock
|
||||
# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
|
||||
# in version control.
|
||||
# https://pdm.fming.dev/#use-with-ide
|
||||
.pdm.toml
|
||||
|
||||
# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
|
||||
__pypackages__/
|
||||
|
||||
# Celery stuff
|
||||
celerybeat-schedule
|
||||
celerybeat.pid
|
||||
|
||||
# SageMath parsed files
|
||||
*.sage.py
|
||||
|
||||
# Environments
|
||||
.env
|
||||
.venv
|
||||
env/
|
||||
venv/
|
||||
ENV/
|
||||
env.bak/
|
||||
venv.bak/
|
||||
|
||||
# Spyder project settings
|
||||
.spyderproject
|
||||
.spyproject
|
||||
|
||||
# Rope project settings
|
||||
.ropeproject
|
||||
|
||||
# mkdocs documentation
|
||||
/site
|
||||
|
||||
# mypy
|
||||
.mypy_cache/
|
||||
.dmypy.json
|
||||
dmypy.json
|
||||
|
||||
# Pyre type checker
|
||||
.pyre/
|
||||
|
||||
# pytype static type analyzer
|
||||
.pytype/
|
||||
|
||||
# Cython debug symbols
|
||||
cython_debug/
|
||||
|
||||
# PyCharm
|
||||
# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
|
||||
# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
|
||||
# and can be added to the global gitignore or merged into this file. For a more nuclear
|
||||
# option (not recommended) you can uncomment the following to ignore the entire idea folder.
|
||||
#.idea/
|
||||
21
PyAnalyzer-UnpackStealers/LICENSE
Normal file
21
PyAnalyzer-UnpackStealers/LICENSE
Normal file
@@ -0,0 +1,21 @@
|
||||
MIT License
|
||||
|
||||
Copyright (c) 2024 gumbobr0t
|
||||
|
||||
Permission is hereby granted, free of charge, to any person obtaining a copy
|
||||
of this software and associated documentation files (the "Software"), to deal
|
||||
in the Software without restriction, including without limitation the rights
|
||||
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
||||
copies of the Software, and to permit persons to whom the Software is
|
||||
furnished to do so, subject to the following conditions:
|
||||
|
||||
The above copyright notice and this permission notice shall be included in all
|
||||
copies or substantial portions of the Software.
|
||||
|
||||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||||
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||||
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||||
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
||||
SOFTWARE.
|
||||
10
PyAnalyzer-UnpackStealers/README.md
Normal file
10
PyAnalyzer-UnpackStealers/README.md
Normal file
@@ -0,0 +1,10 @@
|
||||
# PyAnalyzer
|
||||
A simple Python script that uses pyinstxtractor and pycdc to unpack and decompile PyInstaller-packed executables.
|
||||
|
||||
⚠️**You might need to build the pycdc executable yourself and place it inside the `resources` folder, because it does not work on every system.**
|
||||
https://github.com/zrax/pycdc
|
||||
|
||||
Example usage:
|
||||
`python main.py FILE_TO_ANALYZE.exe`
|
||||
|
||||
Thanks to zrax and extremecoders for the disassemblers and unpackers.
|
||||
95
PyAnalyzer-UnpackStealers/main.py
Normal file
95
PyAnalyzer-UnpackStealers/main.py
Normal file
@@ -0,0 +1,95 @@
|
||||
import subprocess
|
||||
import os
|
||||
import shutil
|
||||
import sys
|
||||
import logging
|
||||
|
||||
# Send all log records of level INFO and above to "analyzer.log" (a relative
# path, so it is created in the current working directory), prefixing each
# line with a timestamp and the severity.
logging.basicConfig(filename='analyzer.log', level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
|
||||
|
||||
def decompile_pyc(pyc_file, source_dir):
    """Decompile one ``.pyc`` file with pycdc and store the result in *source_dir*.

    pycdc is started as ``resources/pycdc.exe <pyc_file>`` (a path relative to
    the current working directory) and whatever it prints on stdout is written
    to ``<name>.py``.  When that file already exists, ``<name>_2.py``,
    ``<name>_3.py``, ... is used instead so earlier output is never
    overwritten.

    Args:
        pyc_file: Path of the compiled Python file to decompile.
        source_dir: Existing directory that receives the generated ``.py`` file.

    Returns:
        The path of the written ``.py`` file, or ``None`` when pycdc could not
        be started, produced no output, or the file could not be written.
        Failures are logged and printed, never raised.
    """
    pyc_filename = os.path.basename(pyc_file)
    try:
        # Hand the argument list straight to the OS instead of a shell: the
        # file names come from untrusted samples, and a list combined with
        # shell=True does not even pass the arguments on POSIX systems.
        completed = subprocess.run(
            [os.path.join('resources', 'pycdc.exe'), pyc_file],
            stdout=subprocess.PIPE,
            stderr=subprocess.PIPE,
            stdin=subprocess.DEVNULL,
        )

        # Decompiled code may contain bytes that are not valid UTF-8; replace
        # them rather than losing the whole file.  CRLF is normalised because
        # text-mode writing would otherwise turn it into CR CR LF on Windows.
        decoded_code = completed.stdout.decode('utf-8', errors='replace').replace('\r\n', '\n')

        if not decoded_code.strip():
            error_text = completed.stderr.decode('utf-8', errors='replace').strip()
            raise RuntimeError(
                f"pycdc produced no output for {pyc_filename} "
                f"(exit code {completed.returncode}): {error_text}"
            )
        if completed.returncode != 0:
            # NOTE(review): a non-zero exit with some output is treated as a
            # partial decompilation worth keeping - confirm against pycdc.
            logging.warning(
                f"pycdc exited with code {completed.returncode} for {pyc_filename}; keeping partial output"
            )

        base_name = os.path.splitext(pyc_filename)[0]
        py_filename = base_name + '.py'

        # Pick the first free name so modules sharing a base name do not clash.
        count = 2
        while os.path.exists(os.path.join(source_dir, py_filename)):
            py_filename = f'{base_name}_{count}.py'
            count += 1

        py_filepath = os.path.join(source_dir, py_filename)
        with open(py_filepath, 'w', encoding='utf-8') as py_file:
            py_file.write(decoded_code)
    except Exception as e:
        # Best effort: one undecompilable module must not stop the whole run.
        logging.error(f"Error decompiling pyc: {e}")
        print(f"Error decompiling pyc: {e}")
        return None

    logging.info(f"Decompiled {pyc_filename}")
    print(f"Decompiled {pyc_filename}")
    return py_filepath
|
||||
|
||||
def main():
    """Unpack a PyInstaller executable and decompile the ``.pyc`` files inside it.

    Expects exactly one command-line argument, the executable to analyze.
    The steps are:

    1. Run ``resources/pyinstxtractor.py`` on the file and read the
       "Possible entry point" lines from its output.
    2. Decompile the entry-point ``.pyc`` files and move the results into
       ``<file>_source/entry_points``.
    3. Ask whether the remaining ``.pyc`` files should be decompiled too and,
       if so, write them to ``<file>_source``.
    4. Delete the temporary extraction directory.

    Exits with status 1 on a usage error, a missing input file, or a failed
    extraction.
    """
    logging.info("Starting analysis.")
    if len(sys.argv) != 2:
        logging.error("Usage: python script.py FILE_TO_ANALYZE.exe")
        print("Usage: python script.py FILE_TO_ANALYZE.exe")
        sys.exit(1)

    file_to_analyze = sys.argv[1]
    if not os.path.isfile(file_to_analyze):
        # Fail before creating any output directories for a bogus path.
        logging.error(f"File not found: {file_to_analyze}")
        print(f"File not found: {file_to_analyze}")
        sys.exit(1)

    # The extractor writes to "<basename>_extracted" inside the current
    # working directory, wherever the analyzed file itself is located.
    extracted_dir = os.path.basename(file_to_analyze) + '_extracted'
    source_dir = file_to_analyze + '_source'
    entry_points_dir = os.path.join(source_dir, 'entry_points')

    # Creating the nested directory creates source_dir as well.
    os.makedirs(entry_points_dir, exist_ok=True)

    # Run the extractor with the interpreter running this script: it skips
    # the PYZ contents when its Python version differs from the sample's, so
    # the user controls that by choosing the interpreter for this script.
    extractor_cmd = [
        sys.executable or 'python',
        os.path.join('resources', 'pyinstxtractor.py'),
        file_to_analyze,
        '-w',
        extracted_dir,
    ]
    try:
        completed = subprocess.run(
            extractor_cmd,
            stdout=subprocess.PIPE,
            stderr=subprocess.PIPE,
            stdin=subprocess.DEVNULL,
        )
    except OSError as e:
        logging.error(f"Error extracting bytecode: {e}")
        print(f"Error extracting bytecode: {e}")
        sys.exit(1)

    output_lines = completed.stdout.decode('utf-8', errors='replace').splitlines()
    error_text = completed.stderr.decode('utf-8', errors='replace').strip()

    if not os.path.isdir(extracted_dir):
        # The extractor reports most failures only as text, so the missing
        # output directory is the reliable failure signal.
        detail = error_text or (output_lines[-1] if output_lines else 'no output directory was created')
        logging.error(f"Error extracting bytecode: {detail}")
        print(f"Error extracting bytecode: {detail}")
        sys.exit(1)
    if completed.returncode != 0:
        logging.warning(
            f"Extractor exited with code {completed.returncode}; continuing with partial output. {error_text}"
        )

    # Entry points are reported as paths relative to the extraction directory.
    marker = 'Possible entry point: '
    entry_points = {
        line.split(marker, 1)[1].strip().replace('\\', '/')
        for line in output_lines
        if marker in line
    }
    logging.info(f"Possible entry points: {sorted(entry_points)}")

    # Walk the extracted tree once and split it into entry points and the rest.
    # Matching on the relative path keeps a bundled module that merely shares
    # an entry point's file name from being treated as an entry point.
    entry_pycs = []
    other_pycs = []
    for root, _dirs, files in os.walk(extracted_dir):
        for file in files:
            if not file.endswith('.pyc'):
                continue
            pyc_file = os.path.join(root, file)
            relative_name = os.path.relpath(pyc_file, extracted_dir).replace(os.sep, '/')
            if relative_name in entry_points:
                entry_pycs.append(pyc_file)
            else:
                other_pycs.append(pyc_file)

    for pyc_file in entry_pycs:
        pyc_filename = os.path.basename(pyc_file)
        logging.info(f"Decompiling entry point: {pyc_filename}")
        written = decompile_pyc(pyc_file, source_dir)
        # Fall back to the default output name when no path is reported.
        source_file = written or os.path.join(source_dir, pyc_filename[:-4] + '.py')
        if os.path.isfile(source_file):
            entry_point_dest = os.path.join(entry_points_dir, os.path.basename(source_file))
            shutil.move(source_file, entry_point_dest)
        else:
            logging.warning(f"No decompiled output found for entry point: {pyc_filename}")

    continue_with_others = input("Do you want to continue with decompiling other files? (y/n): ").strip().lower()
    if continue_with_others != 'y':
        logging.info("Decompilation of other files cancelled.")
        print("Decompilation of other files cancelled.")
    else:
        for pyc_file in other_pycs:
            logging.info(f"Decompiling: {os.path.basename(pyc_file)}")
            decompile_pyc(pyc_file, source_dir)

    # The extracted tree is only an intermediate product; remove it.
    shutil.rmtree(extracted_dir)
    logging.info("Analysis completed.")
    print("Analysis completed.")
|
||||
|
||||
# Start the analysis only when this file is executed as a script, not when it
# is imported as a module.
if __name__ == '__main__':
    main()
|
||||
1
PyAnalyzer-UnpackStealers/requirements.txt
Normal file
1
PyAnalyzer-UnpackStealers/requirements.txt
Normal file
@@ -0,0 +1 @@
|
||||
# No third-party packages are required: logging is part of the Python standard library.
|
||||
BIN
PyAnalyzer-UnpackStealers/resources/pycdc.exe
Normal file
BIN
PyAnalyzer-UnpackStealers/resources/pycdc.exe
Normal file
Binary file not shown.
468
PyAnalyzer-UnpackStealers/resources/pyinstxtractor.py
Normal file
468
PyAnalyzer-UnpackStealers/resources/pyinstxtractor.py
Normal file
@@ -0,0 +1,468 @@
|
||||
"""
|
||||
PyInstaller Extractor v2.0 (Supports pyinstaller 5.13.0, 5.12.0, 5.11.0, 5.10.1, 5.10.0, 5.9.0, 5.8.0, 5.7.0, 5.6.2, 5.6.1, 5.6, 5.5, 5.4.1, 5.4, 5.3, 5.2, 5.1, 5.0.1, 5.0, 4.10, 4.9, 4.8, 4.7, 4.6, 4.5.1, 4.5, 4.4, 4.3, 4.2, 4.1, 4.0, 3.6, 3.5, 3.4, 3.3, 3.2, 3.1, 3.0, 2.1, 2.0)
|
||||
Author : Extreme Coders
|
||||
E-mail : extremecoders(at)hotmail(dot)com
|
||||
Web : https://0xec.blogspot.com
|
||||
Date : 26-March-2020
|
||||
Url : https://github.com/extremecoders-re/pyinstxtractor
|
||||
|
||||
For any suggestions, leave a comment on
|
||||
https://forum.tuts4you.com/topic/34455-pyinstaller-extractor/
|
||||
|
||||
This script extracts a pyinstaller generated executable file.
|
||||
Pyinstaller installation is not needed. The script has it all.
|
||||
|
||||
For best results, it is recommended to run this script in the
|
||||
same version of python as was used to create the executable.
|
||||
This is just to prevent unmarshalling errors(if any) while
|
||||
extracting the PYZ archive.
|
||||
|
||||
Usage : Just copy this script to the directory where your exe resides
|
||||
and run the script with the exe file name as a parameter
|
||||
|
||||
C:\path\to\exe\>python pyinstxtractor.py <filename>
|
||||
$ /path/to/exe/python pyinstxtractor.py <filename>
|
||||
|
||||
Licensed under GNU General Public License (GPL) v3.
|
||||
You are free to modify this source.
|
||||
|
||||
CHANGELOG
|
||||
================================================
|
||||
|
||||
Version 1.1 (Jan 28, 2014)
|
||||
-------------------------------------------------
|
||||
- First Release
|
||||
- Supports only pyinstaller 2.0
|
||||
|
||||
Version 1.2 (Sept 12, 2015)
|
||||
-------------------------------------------------
|
||||
- Added support for pyinstaller 2.1 and 3.0 dev
|
||||
- Cleaned up code
|
||||
- Script is now more verbose
|
||||
- Executable extracted within a dedicated sub-directory
|
||||
|
||||
(Support for pyinstaller 3.0 dev is experimental)
|
||||
|
||||
Version 1.3 (Dec 12, 2015)
|
||||
-------------------------------------------------
|
||||
- Added support for pyinstaller 3.0 final
|
||||
- Script is compatible with both python 2.x & 3.x (Thanks to Moritz Kroll @ Avira Operations GmbH & Co. KG)
|
||||
|
||||
Version 1.4 (Jan 19, 2016)
|
||||
-------------------------------------------------
|
||||
- Fixed a bug when writing pyc files >= version 3.3 (Thanks to Daniello Alto: https://github.com/Djamana)
|
||||
|
||||
Version 1.5 (March 1, 2016)
|
||||
-------------------------------------------------
|
||||
- Added support for pyinstaller 3.1 (Thanks to Berwyn Hoyt for reporting)
|
||||
|
||||
Version 1.6 (Sept 5, 2016)
|
||||
-------------------------------------------------
|
||||
- Added support for pyinstaller 3.2
|
||||
- Extractor will use a random name while extracting unnamed files.
|
||||
- For encrypted pyz archives it will dump the contents as is. Previously, the tool would fail.
|
||||
|
||||
Version 1.7 (March 13, 2017)
|
||||
-------------------------------------------------
|
||||
- Made the script compatible with python 2.6 (Thanks to Ross for reporting)
|
||||
|
||||
Version 1.8 (April 28, 2017)
|
||||
-------------------------------------------------
|
||||
- Support for sub-directories in .pyz files (Thanks to Moritz Kroll @ Avira Operations GmbH & Co. KG)
|
||||
|
||||
Version 1.9 (November 29, 2017)
|
||||
-------------------------------------------------
|
||||
- Added support for pyinstaller 3.3
|
||||
- Display the scripts which are run at entry (Thanks to Michael Gillespie @ malwarehunterteam for the feature request)
|
||||
|
||||
Version 2.0 (March 26, 2020)
|
||||
-------------------------------------------------
|
||||
- Project migrated to github
|
||||
- Supports pyinstaller 3.6
|
||||
- Added support for Python 3.7, 3.8
|
||||
- The header of all extracted pyc's are now automatically fixed
|
||||
"""
|
||||
|
||||
from __future__ import print_function
|
||||
import os
|
||||
import struct
|
||||
import marshal
|
||||
import zlib
|
||||
import sys
|
||||
from uuid import uuid4 as uniquename
|
||||
|
||||
|
||||
class CTOCEntry:
    """One record of the CArchive table of contents.

    A plain value holder: every constructor argument is stored unchanged
    under an attribute of the same name.
    """

    def __init__(self, position, cmprsdDataSize, uncmprsdDataSize, cmprsFlag, typeCmprsData, name):
        # Location of the entry's data and its stored / unpacked sizes.
        self.position, self.cmprsdDataSize, self.uncmprsdDataSize = (
            position,
            cmprsdDataSize,
            uncmprsdDataSize,
        )
        # Compression flag and the one-character type code of the entry.
        self.cmprsFlag, self.typeCmprsData = cmprsFlag, typeCmprsData
        # Name of the entry inside the archive.
        self.name = name
|
||||
|
||||
|
||||
class PyInstArchive:
    """Reader and extractor for the CArchive appended to a PyInstaller executable.

    The methods are meant to be called in this order: ``open()``,
    ``checkFile()``, ``getCArchiveInfo()``, ``parseTOC()``, ``extractFiles()``
    and finally ``close()``.  The three checking methods return ``False``
    (after printing a message) when the file cannot be processed.

    The input is treated as untrusted: inconsistent metadata produces a
    warning instead of aborting, and archive member names are neutralised
    before they are used as file system paths.
    """

    PYINST20_COOKIE_SIZE = 24           # For pyinstaller 2.0
    PYINST21_COOKIE_SIZE = 24 + 64      # For pyinstaller 2.1+
    MAGIC = b'MEI\014\013\012\013\016'  # Magic number which identifies pyinstaller

    def __init__(self, path):
        """Remember *path*; the file itself is not touched until ``open()``."""
        self.filePath = path
        self.fPtr = None
        self.pycMagic = b'\0' * 4   # All zeros means "pyc magic not known yet"
        self.barePycList = []       # List of pyc's whose headers have to be fixed

    def open(self):
        """Open the executable for reading and record its size.

        Returns:
            True on success, False (after printing an error) otherwise.
        """
        try:
            self.fPtr = open(self.filePath, 'rb')
            self.fileSize = os.stat(self.filePath).st_size
        except (IOError, OSError, ValueError, TypeError):
            # Do not keep a half-initialised handle around if stat() failed.
            self.close()
            print('[!] Error: Could not open {0}'.format(self.filePath))
            return False
        return True

    def close(self):
        """Close the underlying file; safe to call when nothing is open."""
        handle = getattr(self, 'fPtr', None)
        if handle is None:
            return
        try:
            handle.close()
        except (IOError, OSError):
            pass

    def checkFile(self):
        """Locate the archive cookie and detect the cookie layout.

        The file is scanned backwards in 8 KiB chunks for ``MAGIC``; the chunks
        overlap by ``len(MAGIC) - 1`` bytes so a cookie straddling a chunk
        boundary is still found.  Sets ``cookiePos`` and ``pyinstVer``
        (20 or 21).

        Returns:
            True if a cookie was found, False otherwise.
        """
        print('[+] Processing {0}'.format(self.filePath))

        searchChunkSize = 8192
        endPos = self.fileSize
        self.cookiePos = -1

        if endPos < len(self.MAGIC):
            print('[!] Error : File is too short or truncated')
            return False

        while True:
            startPos = endPos - searchChunkSize if endPos >= searchChunkSize else 0
            chunkSize = endPos - startPos

            if chunkSize < len(self.MAGIC):
                break

            self.fPtr.seek(startPos, os.SEEK_SET)
            data = self.fPtr.read(chunkSize)

            # rfind: the cookie closest to the end of the file wins.
            offs = data.rfind(self.MAGIC)

            if offs != -1:
                self.cookiePos = startPos + offs
                break

            endPos = startPos + len(self.MAGIC) - 1

            if startPos == 0:
                break

        if self.cookiePos == -1:
            print('[!] Error : Missing cookie, unsupported pyinstaller version or not a pyinstaller archive')
            return False

        self.fPtr.seek(self.cookiePos + self.PYINST20_COOKIE_SIZE, os.SEEK_SET)

        # The 2.1+ cookie carries the python library name after the 2.0 fields.
        if b'python' in self.fPtr.read(64).lower():
            print('[+] Pyinstaller version: 2.1+')
            self.pyinstVer = 21     # pyinstaller 2.1+
        else:
            self.pyinstVer = 20     # pyinstaller 2.0
            print('[+] Pyinstaller version: 2.0')

        return True

    def getCArchiveInfo(self):
        """Parse the cookie and derive where the overlay and its TOC are.

        Sets ``pymaj``/``pymin``, ``overlaySize``, ``overlayPos``,
        ``tableOfContentsPos`` and ``tableOfContentsSize``.

        Returns:
            True on success, False if the cookie could not be read.
        """
        try:
            self.fPtr.seek(self.cookiePos, os.SEEK_SET)

            # Read CArchive cookie
            if self.pyinstVer == 20:
                (_magic, lengthofPackage, toc, tocLen, pyver) = \
                    struct.unpack('!8siiii', self.fPtr.read(self.PYINST20_COOKIE_SIZE))
            else:
                (_magic, lengthofPackage, toc, tocLen, pyver, _pylibname) = \
                    struct.unpack('!8sIIii64s', self.fPtr.read(self.PYINST21_COOKIE_SIZE))

        except (struct.error, IOError, OSError):
            print('[!] Error : The file is not a pyinstaller archive')
            return False

        # The version is stored as e.g. 27 or 37, or as 310 / 311 for 3.10+.
        self.pymaj, self.pymin = (pyver // 100, pyver % 100) if pyver >= 100 else (pyver // 10, pyver % 10)
        print('[+] Python version: {0}.{1}'.format(self.pymaj, self.pymin))

        # Additional data after the cookie
        cookieSize = self.PYINST20_COOKIE_SIZE if self.pyinstVer == 20 else self.PYINST21_COOKIE_SIZE
        tailBytes = self.fileSize - self.cookiePos - cookieSize

        # Overlay is the data appended at the end of the PE
        self.overlaySize = lengthofPackage + tailBytes
        self.overlayPos = self.fileSize - self.overlaySize
        self.tableOfContentsPos = self.overlayPos + toc
        self.tableOfContentsSize = tocLen

        print('[+] Length of package: {0} bytes'.format(lengthofPackage))
        return True

    def parseTOC(self):
        """Read the table of contents into ``self.tocList`` (``CTOCEntry`` objects).

        Entry names are made safe for use as relative paths: leading slashes
        are stripped and ``..`` is replaced by ``__``.  Names that cannot be
        decoded, or that are empty, are replaced by a random UUID.

        Raises:
            struct.error: if the table of contents is truncated or malformed.
        """
        # Go to the table of contents
        self.fPtr.seek(self.tableOfContentsPos, os.SEEK_SET)

        self.tocList = []
        parsedLen = 0

        # Size of the fixed-width fields of an entry, including its length field.
        fixedLen = struct.calcsize('!iIIIBc')

        # Parse table of contents
        while parsedLen < self.tableOfContentsSize:
            (entrySize, ) = struct.unpack('!i', self.fPtr.read(4))

            (entryPos, cmprsdDataSize, uncmprsdDataSize, cmprsFlag, typeCmprsData, name) = \
                struct.unpack(
                    '!IIIBc{0}s'.format(entrySize - fixedLen),
                    self.fPtr.read(entrySize - 4))

            try:
                name = name.decode("utf-8").rstrip("\0")
            except UnicodeDecodeError:
                newName = str(uniquename())
                print('[!] Warning: File name {0} contains invalid bytes. Using random name {1}'.format(name, newName))
                name = newName

            # Prevent writing outside the extraction directory.  Sanitising
            # here keeps every later use of the name (directory creation, raw
            # and pyc writes, PYZ extraction) consistent.
            name = name.lstrip("/").replace('..', '__')

            if len(name) == 0:
                name = str(uniquename())
                print('[!] Warning: Found an unamed file in CArchive. Using random name {0}'.format(name))

            self.tocList.append(
                CTOCEntry(
                    self.overlayPos + entryPos,
                    cmprsdDataSize,
                    uncmprsdDataSize,
                    cmprsFlag,
                    typeCmprsData,
                    name
                ))

            parsedLen += entrySize
        print('[+] Found {0} files in CArchive'.format(len(self.tocList)))

    def _writeRawData(self, filepath, data):
        """Write *data* to *filepath*, creating parent directories as needed.

        Both slash styles are converted to the local separator and ``..`` is
        replaced by ``__`` so the path cannot climb out of the current
        directory.
        """
        nm = filepath.replace('\\', os.path.sep).replace('/', os.path.sep).replace('..', '__')
        nmDir = os.path.dirname(nm)
        if nmDir != '' and not os.path.exists(nmDir):   # Check if path exists, create if not
            os.makedirs(nmDir)

        with open(nm, 'wb') as f:
            f.write(data)

    def extractFiles(self):
        """Extract every TOC entry into ``<basename>_extracted``.

        The directory is created inside the current working directory and the
        process then *changes into it*; all entry names are written relative
        to it.  Python scripts and modules are written as ``.pyc`` files, PYZ
        archives are additionally unpacked, everything else is dumped as is.
        """
        print('[+] Beginning extraction...please standby')
        extractionDir = os.path.join(os.getcwd(), os.path.basename(self.filePath) + '_extracted')

        if not os.path.exists(extractionDir):
            os.mkdir(extractionDir)

        os.chdir(extractionDir)

        for entry in self.tocList:
            self.fPtr.seek(entry.position, os.SEEK_SET)
            data = self.fPtr.read(entry.cmprsdDataSize)

            if entry.cmprsFlag == 1:
                try:
                    data = zlib.decompress(data)
                except zlib.error:
                    print('[!] Error : Failed to decompress {0}'.format(entry.name))
                    continue
                # Malware may tamper with the uncompressed size, so a mismatch
                # is reported but must not abort the extraction.
                if len(data) != entry.uncmprsdDataSize:
                    print('[!] Warning: Size mismatch for {0} (expected {1} bytes, got {2})'.format(
                        entry.name, entry.uncmprsdDataSize, len(data)))

            if entry.typeCmprsData in (b'd', b'o'):
                # d -> ARCHIVE_ITEM_DEPENDENCY
                # o -> ARCHIVE_ITEM_RUNTIME_OPTION
                # These are runtime options, not files
                continue

            basePath = os.path.dirname(entry.name)
            # Check if path exists, create if not
            if basePath != '' and not os.path.exists(basePath):
                os.makedirs(basePath)

            if entry.typeCmprsData == b's':
                # s -> ARCHIVE_ITEM_PYSOURCE
                # Entry point are expected to be python scripts
                print('[+] Possible entry point: {0}.pyc'.format(entry.name))

                if self.pycMagic == b'\0' * 4:
                    # if we don't have the pyc header yet, fix them in a later pass
                    self.barePycList.append(entry.name + '.pyc')
                self._writePyc(entry.name + '.pyc', data)

            elif entry.typeCmprsData in (b'M', b'm'):
                # M -> ARCHIVE_ITEM_PYPACKAGE
                # m -> ARCHIVE_ITEM_PYMODULE
                # packages and modules are pyc files with their header intact

                # From PyInstaller 5.3 and above pyc headers are no longer stored
                # https://github.com/pyinstaller/pyinstaller/commit/a97fdf
                if data[2:4] == b'\r\n':
                    # < pyinstaller 5.3
                    if self.pycMagic == b'\0' * 4:
                        self.pycMagic = data[0:4]
                    self._writeRawData(entry.name + '.pyc', data)

                else:
                    # >= pyinstaller 5.3
                    if self.pycMagic == b'\0' * 4:
                        # if we don't have the pyc header yet, fix them in a later pass
                        self.barePycList.append(entry.name + '.pyc')

                    self._writePyc(entry.name + '.pyc', data)

            else:
                self._writeRawData(entry.name, data)

                if entry.typeCmprsData in (b'z', b'Z'):
                    self._extractPyz(entry.name)

        # Fix bare pyc's if any
        self._fixBarePycs()

    def _fixBarePycs(self):
        """Patch the pyc magic into files that were written before it was known."""
        for pycPath in self.barePycList:
            with open(pycPath, 'r+b') as pycFile:
                # Overwrite the first four bytes
                pycFile.write(self.pycMagic)

    def _writePyc(self, filename, data):
        """Write *data* (a marshalled code object) to *filename* with a pyc header.

        The header is the current ``pycMagic`` followed by zero-filled fields
        whose layout depends on the Python version of the archive.
        """
        version = (self.pymaj, self.pymin)

        with open(filename, 'wb') as pycFile:
            pycFile.write(self.pycMagic)            # pyc magic

            if version >= (3, 7):                   # PEP 552 -- Deterministic pycs
                pycFile.write(b'\0' * 4)            # Bitfield
                pycFile.write(b'\0' * 8)            # (Timestamp + size) || hash

            else:
                pycFile.write(b'\0' * 4)            # Timestamp
                if version >= (3, 3):
                    pycFile.write(b'\0' * 4)        # Size parameter added in Python 3.3

            pycFile.write(data)

    def _extractPyz(self, name):
        """Unpack the PYZ archive stored in file *name* into ``<name>_extracted``.

        Nothing is unpacked when the running interpreter's version differs
        from the one recorded in the archive.  Members that cannot be
        decompressed are written unchanged with an ``.encrypted`` suffix.
        """
        dirName = name + '_extracted'
        # Create a directory for the contents of the pyz
        if not os.path.exists(dirName):
            os.mkdir(dirName)

        with open(name, 'rb') as f:
            pyzMagic = f.read(4)
            if pyzMagic != b'PYZ\0':
                # Untrusted input: report and carry on with the other files.
                print('[!] Error : {0} is not a valid PYZ archive. Skipping.'.format(name))
                return

            pyzPycMagic = f.read(4)     # Python magic value

            if self.pycMagic == b'\0' * 4:
                self.pycMagic = pyzPycMagic

            elif self.pycMagic != pyzPycMagic:
                self.pycMagic = pyzPycMagic
                print('[!] Warning: pyc magic of files inside PYZ archive are different from those in CArchive')

            # Skip PYZ extraction if not running under the same python version
            if self.pymaj != sys.version_info.major or self.pymin != sys.version_info.minor:
                print('[!] Warning: This script is running in a different Python version than the one used to build the executable.')
                print('[!] Please run this script in Python {0}.{1} to prevent extraction errors during unmarshalling'.format(self.pymaj, self.pymin))
                print('[!] Skipping pyz extraction')
                return

            try:
                (tocPosition, ) = struct.unpack('!i', f.read(4))
                f.seek(tocPosition, os.SEEK_SET)
                # NOTE(review): marshal is not hardened against malicious
                # input; run this tool on untrusted samples only in a sandbox.
                toc = marshal.load(f)
            except Exception:
                print('[!] Unmarshalling FAILED. Cannot extract {0}. Extracting remaining files.'.format(name))
                return

            print('[+] Found {0} files in PYZ archive'.format(len(toc)))

            # From pyinstaller 3.1+ toc is a list of tuples
            if isinstance(toc, list):
                toc = dict(toc)

            for key, (ispkg, pos, length) in toc.items():
                f.seek(pos, os.SEEK_SET)
                fileName = key

                # for Python > 3.3 some keys are bytes object some are str object
                if isinstance(fileName, bytes):
                    fileName = fileName.decode('utf-8', 'replace')

                # Prevent writing outside dirName
                fileName = fileName.replace('..', '__').replace('.', os.path.sep)

                if ispkg == 1:
                    filePath = os.path.join(dirName, fileName, '__init__.pyc')
                else:
                    filePath = os.path.join(dirName, fileName + '.pyc')

                fileDir = os.path.dirname(filePath)
                if not os.path.exists(fileDir):
                    os.makedirs(fileDir)

                data = b''
                try:
                    data = f.read(length)
                    data = zlib.decompress(data)
                except Exception:
                    print('[!] Error: Failed to decompress {0}, probably encrypted. Extracting as is.'.format(filePath))
                    with open(filePath + '.encrypted', 'wb') as rawFile:
                        rawFile.write(data)
                else:
                    self._writePyc(filePath, data)
|
||||
|
||||
|
||||
def main():
    """Command-line entry point: extract the archive named by ``sys.argv[1]``.

    Prints a usage line when no file name is given.  Otherwise the file is
    opened, validated and extracted; each step prints its own diagnostics and
    the first failing step ends the run.  The archive is closed on every
    path, including when parsing or extraction raises.
    """
    if len(sys.argv) < 2:
        print('[+] Usage: pyinstxtractor.py <filename>')
        return

    arch = PyInstArchive(sys.argv[1])
    if not arch.open():
        return

    try:
        if arch.checkFile() and arch.getCArchiveInfo():
            arch.parseTOC()
            arch.extractFiles()
            print('[+] Successfully extracted pyinstaller archive: {0}'.format(sys.argv[1]))
            print('')
            print('You can now use a python decompiler on the pyc files within the extracted directory')
    finally:
        arch.close()
|
||||
|
||||
|
||||
# Run the extractor only when this file is executed as a script, not when it
# is imported as a module.
if __name__ == '__main__':
    main()
|
||||
Reference in New Issue
Block a user