mirror of
https://github.com/SeekyCt/spm-decomp.git
synced 2024-11-27 07:10:33 +00:00
389 lines
9.4 KiB
Python
389 lines
9.4 KiB
Python
"""
|
|
Common functions & definitions
|
|
"""
|
|
|
|
from dataclasses import dataclass
|
|
from enum import Enum
|
|
from hashlib import sha1
|
|
import json
|
|
import os
|
|
from subprocess import PIPE, run
|
|
from sys import executable as PYTHON, platform
|
|
from typing import List, Tuple, Union
|
|
|
|
import yaml
|
|
try:
|
|
from yaml import CLoader as Loader
|
|
except ImportError:
|
|
from yaml import Loader
|
|
|
|
#############
|
|
# Functions #
|
|
#############
|
|
|
|
def get_file_sha1(path: str) -> bytes:
|
|
"""Gets the SHA1 hash of a file"""
|
|
|
|
with open(path, 'rb') as f:
|
|
return sha1(f.read()).digest()
|
|
|
|
def get_cmd_stdout(cmd: str, text=True) -> str:
|
|
"""Run a command and get the stdout output as a string"""
|
|
|
|
ret = run(cmd.split(), stdout=PIPE, text=text)
|
|
assert ret.returncode == 0, f"Command '{cmd}' returned {ret.returncode}"
|
|
return ret.stdout
|
|
|
|
class Binary(Enum):
|
|
DOL = 1
|
|
REL = 2
|
|
|
|
# ppcdis source output
|
|
SourceDesc = Union[str, Tuple[str, int, int]]
|
|
|
|
def get_containing_slice(addr: int) -> Tuple[Binary, SourceDesc]:
|
|
"""Finds the binary containing an address and its source file
|
|
Source file is empty string if not decompiled"""
|
|
|
|
dol_raw = get_cmd_stdout(f"{SLICES} {DOL_YML} {DOL_SLICES} -p {DOL_SRCDIR}/ --containing {addr:x}")
|
|
containing = json.loads(dol_raw)
|
|
if containing is None:
|
|
rel_raw = get_cmd_stdout(
|
|
f"{SLICES} {REL_YML} {REL_SLICES} -p {REL_SRCDIR}/ --containing {addr:x}"
|
|
)
|
|
containing = json.loads(rel_raw)
|
|
assert containing is not None, f"Unknown address {addr:x}"
|
|
return (Binary.REL, containing)
|
|
else:
|
|
return (Binary.DOL, containing)
|
|
|
|
def lookup_sym(sym: str, dol: bool = False, rel: bool = False, source_name: str = None) -> int:
|
|
"""Takes a symbol as a name or address and returns the address"""
|
|
|
|
# Get binary
|
|
if dol:
|
|
binary_name = DOL_YML
|
|
elif rel:
|
|
binary_name = REL_YML
|
|
else:
|
|
binary_name = None
|
|
|
|
# Determine type
|
|
try:
|
|
return int(sym, 16)
|
|
except ValueError:
|
|
return get_address(sym, binary_name, source_name)
|
|
|
|
def lookup_sym_full(sym: str, dol: bool = False, rel: bool = False, source_name: str = None
|
|
) -> int:
|
|
"""Takes a symbol as a name or address and returns both the name and address"""
|
|
|
|
# Get binary
|
|
if dol:
|
|
binary_name = DOL_YML
|
|
elif rel:
|
|
binary_name = REL_YML
|
|
else:
|
|
binary_name = None
|
|
|
|
# Determine type
|
|
try:
|
|
return int(sym, 16), get_name(sym)
|
|
except ValueError:
|
|
return get_address(sym, binary_name, source_name), sym
|
|
|
|
def get_address(name: str, binary: bool = None, source_name: bool = None) -> int:
|
|
"""Finds the address of a symbol"""
|
|
|
|
args = [name]
|
|
if binary is not None:
|
|
args.append(f"-b {binary}")
|
|
if source_name is not None:
|
|
args.append(f"-n {source_name}")
|
|
|
|
raw = get_cmd_stdout(f"{SYMBOLS} {GAME_SYMBOLS} --get-addr {' '.join(args)}")
|
|
return json.loads(raw)
|
|
|
|
def get_name(addr: int, binary: bool = None, source_name: bool = None) -> int:
|
|
"""Finds the name of a symbol"""
|
|
|
|
args = [addr]
|
|
if binary is not None:
|
|
args.append(f"-b {binary}")
|
|
if source_name is not None:
|
|
args.append(f"-n {source_name}")
|
|
|
|
raw = get_cmd_stdout(f"{SYMBOLS} {GAME_SYMBOLS} --get-name {' '.join(args)}")
|
|
return json.loads(raw)
|
|
|
|
def find_headers(dirname: str, base=None) -> List[str]:
|
|
"""Returns a list of all headers in a folder recursively"""
|
|
|
|
if base is None:
|
|
base = dirname
|
|
|
|
ret = []
|
|
for name in os.listdir(dirname):
|
|
path = dirname + '/' + name
|
|
if os.path.isdir(path):
|
|
ret.extend(find_headers(path, base))
|
|
elif name.endswith('.h'):
|
|
ret.append(path[len(base)+1:])
|
|
|
|
return ret
|
|
|
|
def load_from_yaml(path: str, default=None):
|
|
"""Loads an object from a yaml file"""
|
|
|
|
if default is None:
|
|
default = {}
|
|
with open(path) as f:
|
|
ret = yaml.load(f.read(), Loader)
|
|
if ret is None:
|
|
ret = default
|
|
return ret
|
|
|
|
################
|
|
# Project dirs #
|
|
################
|
|
|
|
# Directory for decompiled dol code
|
|
DOL_SRCDIR = "src"
|
|
|
|
# Directory for decompiled rel code
|
|
REL_SRCDIR = "rel"
|
|
|
|
# Build artifacts directory
|
|
BUILDDIR = "build"
|
|
|
|
# Build include directory
|
|
BUILD_INCDIR = f"{BUILDDIR}/include"
|
|
|
|
# Output binaries directory
|
|
OUTDIR = "out"
|
|
|
|
# Original binaries directory
|
|
ORIG = "orig"
|
|
|
|
# Tools directory
|
|
TOOLS = "tools"
|
|
|
|
# Config directory
|
|
CONFIG = "config"
|
|
|
|
# Extracted assets directory
|
|
ASSETS = "assets"
|
|
|
|
#########
|
|
# Tools #
|
|
#########
|
|
|
|
# ppcdis
|
|
PPCDIS = "tools/ppcdis"
|
|
PPCDIS_INCDIR = f"{PPCDIS}/include"
|
|
SPM_HEADERS = "spm-headers"
|
|
RELEXTERN = f"{PYTHON} {PPCDIS}/relextern.py"
|
|
ANALYSER = f"{PYTHON} {PPCDIS}/analyser.py"
|
|
DISASSEMBLER = f"{PYTHON} {PPCDIS}/disassembler.py"
|
|
ORDERSTRINGS = f"{PYTHON} {PPCDIS}/orderstrings.py"
|
|
ORDERFLOATS = f"{PYTHON} {PPCDIS}/orderfloats.py"
|
|
ASSETRIP = f"{PYTHON} {PPCDIS}/assetrip.py"
|
|
ASSETINC = f"{PYTHON} {PPCDIS}/assetinc.py"
|
|
FORCEACTIVEGEN = f"{PYTHON} {PPCDIS}/forceactivegen.py"
|
|
ELF2DOL = f"{PYTHON} {PPCDIS}/elf2dol.py"
|
|
ELF2REL = f"{PYTHON} {PPCDIS}/elf2rel.py"
|
|
SLICES = f"{PYTHON} {PPCDIS}/slices.py"
|
|
PROGRESS = f"{PYTHON} {PPCDIS}/progress.py"
|
|
SYMBOLS = f"{PYTHON} {PPCDIS}/symbols.py"
|
|
MAKESRC = f"{PYTHON} {PPCDIS}/makesrc.py"
|
|
|
|
# Codewarrior
|
|
TOOLS = "tools"
|
|
CODEWARRIOR = os.path.join(TOOLS, "4199_60831")
|
|
CC = os.path.join(CODEWARRIOR, "mwcceppc.exe")
|
|
LD = os.path.join(CODEWARRIOR, "mwldeppc.exe")
|
|
if platform != "win32":
|
|
CC = f"wine {CC}"
|
|
LD = f"wine {LD}"
|
|
|
|
# DevkitPPC
|
|
DEVKITPPC = os.environ.get("DEVKITPPC")
|
|
AS = os.path.join(DEVKITPPC, "bin", "powerpc-eabi-as")
|
|
OBJDUMP = os.path.join(DEVKITPPC, "bin", "powerpc-eabi-objdump")
|
|
CPP = os.path.join(DEVKITPPC, "bin", "powerpc-eabi-cpp")
|
|
|
|
ICONV = f"{PYTHON} tools/sjis.py" # TODO: get actual iconv working(?)
|
|
NLZSS = f"{PYTHON} tools/lzss3.py"
|
|
|
|
#########
|
|
# Files #
|
|
#########
|
|
|
|
# Slices
|
|
DOL_SLICES = f"{CONFIG}/dol_slices.yml"
|
|
REL_SLICES = f"{CONFIG}/rel_slices.yml"
|
|
|
|
# Overrides
|
|
ANALYSIS_OVERRIDES = f"{CONFIG}/analysis_overrides.yml"
|
|
DISASM_OVERRIDES = f"{CONFIG}/disasm_overrides.yml"
|
|
|
|
# Binaries
|
|
DOL = f"{ORIG}/main.dol" # read in python code
|
|
REL = f"{ORIG}/relF.rel" # read in python code
|
|
REL_COMPR = f"{ORIG}/relF.bin" # read in python code
|
|
DOL_YML = f"{CONFIG}/dol.yml"
|
|
REL_YML = f"{CONFIG}/rel.yml"
|
|
DOL_SHA = f"{ORIG}/main.dol.sha1"
|
|
REL_SHA = f"{ORIG}/relF.rel.sha1"
|
|
DOL_OK = f"{BUILDDIR}/main.dol.ok"
|
|
REL_OK = f"{BUILDDIR}/relF.rel.ok"
|
|
DOL_ASM_LIST = f"{BUILDDIR}/main.dol.asml"
|
|
REL_ASM_LIST = f"{BUILDDIR}/relF.rel.asml"
|
|
|
|
# Symbols
|
|
GAME_SYMBOLS = f"{CONFIG}/symbols.yml"
|
|
|
|
# Assets
|
|
ASSETS_YML = f"{CONFIG}/assets.yml"
|
|
|
|
# Analysis outputs
|
|
EXTERNS = f"{BUILDDIR}/externs.pickle"
|
|
DOL_LABELS = f"{BUILDDIR}/labels.pickle"
|
|
DOL_RELOCS = f"{BUILDDIR}/relocs.pickle"
|
|
REL_LABELS = f"{BUILDDIR}/rel_labels.pickle"
|
|
REL_RELOCS = f"{BUILDDIR}/rel_relocs.pickle"
|
|
|
|
# Linker
|
|
DOL_LCF_TEMPLATE = f"{CONFIG}/dol.lcf"
|
|
DOL_LCF = f"{BUILDDIR}/dol.lcf"
|
|
REL_LCF = f"{CONFIG}/rel.lcf"
|
|
|
|
# Outputs
|
|
DOL_ELF = f"{BUILDDIR}/main.elf"
|
|
REL_PLF = f"{BUILDDIR}/relF.plf"
|
|
DOL_OUT = f"{OUTDIR}/main.dol"
|
|
REL_OUT = f"{OUTDIR}/relF.rel"
|
|
DOL_MAP = f"{OUTDIR}/main.map"
|
|
REL_MAP = f"{OUTDIR}/relF.map"
|
|
|
|
# Optional full disassembly
|
|
DOL_FULL = f"{OUTDIR}/dol.s"
|
|
REL_FULL = f"{OUTDIR}/rel.s"
|
|
|
|
##############
|
|
# Tool Flags #
|
|
##############
|
|
|
|
ASFLAGS = ' '.join([
|
|
"-m gekko",
|
|
f"-I {PPCDIS_INCDIR}",
|
|
f"-I orig"
|
|
])
|
|
|
|
INCDIRS = [
|
|
PPCDIS_INCDIR,
|
|
BUILD_INCDIR,
|
|
f"{SPM_HEADERS}/decomp",
|
|
f"{SPM_HEADERS}/include"
|
|
]
|
|
MWCC_INCLUDES = ' '.join(f"-i {d}" for d in INCDIRS)
|
|
GCC_INCLUDES = ' '.join(f"-I {d}" for d in INCDIRS)
|
|
|
|
DEFINES = [
|
|
"DECOMP",
|
|
"SPM_EU0"
|
|
]
|
|
MWCC_DEFINES = ' '.join(f"-d {d}" for d in DEFINES)
|
|
GCC_DEFINES = ' '.join(f"-D {d}" for d in DEFINES)
|
|
|
|
CPPFLAGS = ' '.join([
|
|
"-nostdinc",
|
|
GCC_DEFINES,
|
|
GCC_INCLUDES
|
|
])
|
|
|
|
DOL_SDATA2_SIZE = 4
|
|
REL_SDATA2_SIZE = 0
|
|
|
|
CFLAGS = [
|
|
"-enc SJIS",
|
|
"-lang c99",
|
|
"-W all",
|
|
"-fp fmadd",
|
|
"-Cpp_exceptions off",
|
|
"-O4",
|
|
"-use_lmw_stmw on",
|
|
"-str pool",
|
|
"-rostr",
|
|
"-sym dwarf-2",
|
|
"-ipa file",
|
|
MWCC_DEFINES
|
|
]
|
|
BASE_DOL_CFLAGS = CFLAGS + [
|
|
"-inline all",
|
|
"-sdata 4",
|
|
f"-sdata2 {DOL_SDATA2_SIZE}"
|
|
]
|
|
BASE_REL_CFLAGS = CFLAGS + [
|
|
"-sdata 0",
|
|
f"-sdata2 {REL_SDATA2_SIZE}",
|
|
"-pool off",
|
|
"-ordered-fp-compares"
|
|
]
|
|
|
|
LOCAL_CFLAGS = [
|
|
"-nostdinc",
|
|
"-proc gekko",
|
|
"-maxerrors 1",
|
|
"-I-",
|
|
MWCC_INCLUDES
|
|
]
|
|
DOL_CFLAGS = ' '.join(BASE_DOL_CFLAGS + LOCAL_CFLAGS)
|
|
REL_CFLAGS = ' '.join(BASE_REL_CFLAGS + LOCAL_CFLAGS)
|
|
EXTERNAL_DOL_CFLAGS = ' '.join(BASE_DOL_CFLAGS)
|
|
EXTERNAL_REL_CFLAGS = ' '.join(BASE_REL_CFLAGS)
|
|
|
|
LDFLAGS = ' '.join([
|
|
"-fp hard",
|
|
"-linkmode moreram",
|
|
"-maxerrors 1",
|
|
"-mapunused"
|
|
])
|
|
|
|
PPCDIS_ANALYSIS_FLAGS = ' '.join([
|
|
f"-o {ANALYSIS_OVERRIDES}",
|
|
f"-l {EXTERNS}"
|
|
])
|
|
|
|
PPCDIS_DISASM_FLAGS = ' '.join([
|
|
f"-m {GAME_SYMBOLS}",
|
|
f"-o {DISASM_OVERRIDES}"
|
|
])
|
|
|
|
############
|
|
# Contexts #
|
|
############
|
|
|
|
@dataclass
|
|
class SourceContext:
|
|
srcdir: str
|
|
cflags: str
|
|
binary: str
|
|
labels: str
|
|
relocs: str
|
|
slices: str
|
|
sdata2_threshold: int
|
|
|
|
DOL_CTX = SourceContext(DOL_SRCDIR, DOL_CFLAGS, DOL_YML, DOL_LABELS, DOL_RELOCS, DOL_SLICES,
|
|
DOL_SDATA2_SIZE)
|
|
REL_CTX = SourceContext(REL_SRCDIR, REL_CFLAGS, REL_YML, REL_LABELS, REL_RELOCS, REL_SLICES,
|
|
REL_SDATA2_SIZE)
|
|
|
|
####################
|
|
# diff.py Expected #
|
|
####################
|
|
|
|
EXPECTED = "expected"
|
|
DOL_EXPECTED = f"{EXPECTED}/build/main.elf"
|
|
REL_EXPECTED = f"{EXPECTED}/build/relF.plf"
|