Init version of jmmt_tools

This commit is contained in:
Lily Tsuru 2022-07-08 04:23:46 -05:00
commit 0544a39dc3
14 changed files with 912 additions and 0 deletions

61
.clang-format Executable file
View File

@ -0,0 +1,61 @@
# Clang-Format file
# google style is the closest unfortunately
BasedOnStyle: Google
# force T* or T&
# rather than T * or T &
DerivePointerAlignment: false
PointerAlignment: Left
# I think if these two aren't the same
# it won't indent with tabs even with UseTab set to Always
TabWidth: 4
IndentWidth: 4
UseTab: Always
IndentPPDirectives: BeforeHash
AllowAllParametersOfDeclarationOnNextLine: true
AllowShortBlocksOnASingleLine: false
AllowShortFunctionsOnASingleLine: None
AllowShortIfStatementsOnASingleLine: Never
BinPackArguments: true
BinPackParameters: true
BreakConstructorInitializers: BeforeColon
BreakStringLiterals: false
# 130 columns is good but causes some weird issues I don't quite like
# especially in some codebases
#ColumnLimit: 130
ColumnLimit: 0
CompactNamespaces: false
ConstructorInitializerAllOnOneLineOrOnePerLine: true
ContinuationIndentWidth: 0
# turning this on causes major issues with initalizer lists,
# turn it off
Cpp11BracedListStyle: false
# this is turned on to allow something like:
#
# T MyTValue {
# initalizer list...
# };
SpaceBeforeCpp11BracedList: true
FixNamespaceComments: true
NamespaceIndentation: All
ReflowComments: true
SortIncludes: CaseInsensitive
SortUsingDeclarations: true
SpacesInSquareBrackets: false
SpaceBeforeParens: Never
SpacesBeforeTrailingComments: 1

10
.gitignore vendored Normal file
View File

@ -0,0 +1,10 @@
/.idea
cmake-build-*
build/
# swap
*.kate-swp
*.swp
# TEMPORARY!!!!
/attic

13
CMakeLists.txt Executable file
View File

@ -0,0 +1,13 @@
cmake_minimum_required(VERSION 3.10)
# Prohibit in-source tree builds.
if(" ${CMAKE_SOURCE_DIR}" STREQUAL " ${CMAKE_BINARY_DIR}")
message(FATAL_ERROR "In-source builds are strictly prohibited.")
endif()
include(cmake/Policies.cmake)
project(jmmt_tools)
add_subdirectory(src/libjmmt)
add_subdirectory(src/tools)

30
README.md Normal file
View File

@ -0,0 +1,30 @@
## JMMT tools
Tools to work with files for Jonny Moseley Mad Trix on the PS2.
## The Libraries
### libjmmt
A library which has:
- the CRC32 hash implementation(s) used by the game
- the LZSS decompression implementation used by the game
- Documented package file structures
Used by the following tools.
## The Tools
### `jmmt_renamer`
Renames the .dat files in data/ on the disc to filenames which are actually useful.
### `jmmt_pack_extractor`
Extractor for .pak files. Unlike the BMS script, this extractor takes into account several things about the format.
Currently kind of crashy. Does extract a few archives in full though.
### `jmmt_met_extractor`
TODO

45
cmake/Policies.cmake Executable file
View File

@ -0,0 +1,45 @@
# CMake policy configuration
if(POLICY CMP0026)
cmake_policy(SET CMP0026 NEW)
endif()
if(POLICY CMP0042)
cmake_policy(SET CMP0042 NEW) # CMake 3.0+ (2.8.12): MacOS "@rpath" in target's install name
endif()
if(POLICY CMP0046)
cmake_policy(SET CMP0046 NEW) # warn about non-existed dependencies
endif()
if(POLICY CMP0051)
cmake_policy(SET CMP0051 NEW)
endif()
if(POLICY CMP0054) # CMake 3.1: Only interpret if() arguments as variables or keywords when unquoted.
cmake_policy(SET CMP0054 NEW)
endif()
if(POLICY CMP0056)
cmake_policy(SET CMP0056 NEW) # try_compile(): link flags
endif()
if(POLICY CMP0066)
cmake_policy(SET CMP0066 NEW) # CMake 3.7: try_compile(): use per-config flags, like CMAKE_CXX_FLAGS_RELEASE
endif()
if(POLICY CMP0067)
cmake_policy(SET CMP0067 NEW) # CMake 3.8: try_compile(): honor language standard variables (like C++11)
endif()
if(POLICY CMP0068)
cmake_policy(SET CMP0068 NEW) # CMake 3.9+: `RPATH` settings on macOS do not affect `install_name`.
endif()
if(POLICY CMP0075)
cmake_policy(SET CMP0075 NEW) # CMake 3.12+: Include file check macros honor `CMAKE_REQUIRED_LIBRARIES`
endif()
if(POLICY CMP0077)
cmake_policy(SET CMP0077 NEW) # CMake 3.13+: option() honors normal variables.
endif()

21
include/jmmt/crc.h Normal file
View File

@ -0,0 +1,21 @@
#ifndef JMMT_CRC_H
#define JMMT_CRC_H
#include <cstdint>
namespace jmmt {
/**
* Result type of HashString()/HashStringCase().
*/
using crc32_t = std::uint32_t;
crc32_t HashString(const char* s);
/**
* Hash a case-sensitive string.
*/
crc32_t HashStringCase(const char* s);
} // namespace jmmt
#endif // JMMT_CRC_H

39
include/jmmt/lzss.h Normal file
View File

@ -0,0 +1,39 @@
#ifndef JMMT_LZSS_H
#define JMMT_LZSS_H
#include <cstdint>
namespace jmmt {
struct LzssHeader {
std::uint32_t next; // done to keep data layout consistent with PS2
std::uint8_t cByteId;
std::uint8_t cHdrSize; // should be sizeof(LzssHeader)
std::uint8_t nMaxMatch;
std::uint8_t nFillByte;
std::uint16_t nRingSize;
std::uint16_t nErrorId;
std::uint32_t nUnCompressedBytes;
std::uint32_t nCompressedBytes;
std::uint32_t nCRC;
std::uint32_t nFileId;
std::uint32_t nCompressedDataCRC;
};
static_assert(sizeof(LzssHeader) == 0x20, "LzssHeader doesn't match game expectations, you are CERTAINLY breaking structures");
/**
* Decompress TECH LZSS data.
*
* \param[in,out] header LZSS header. Unused. Set to nullptr for now.
* \param[in] compressedInput LZSS compressed input data.
* \param[in] compressedLength Compressed length.
* \param[out] destBuffer Destination buffer.
*
* \return 0 on success. Non zero value means error.
*/
int DecompressLzss(LzssHeader* header, std::uint8_t* compressedInput, std::int32_t compressedLength, std::uint8_t* destBuffer);
} // namespace jmmt
#endif

92
include/jmmt/package.h Normal file
View File

@ -0,0 +1,92 @@
// JMMT PAK structures
#ifndef JMMT_PACKAGE_H
#define JMMT_PACKAGE_H
#include <cstdint>
// for LzssHeader
#include <jmmt/lzss.h>
namespace jmmt {
template <class TMagic, TMagic ValidMagic>
struct BasicStructureWithMagic {
constexpr static TMagic TypeMagic = ValidMagic;
};
template <uint32_t ValidMagic>
using FourCCMagic = BasicStructureWithMagic<uint32_t, ValidMagic>;
// This is the "file header" of sorts.
struct PackageEofHeader {
std::uint32_t headerSize;
std::uint32_t debugInfoSize;
std::uint32_t headerStartOffset;
};
struct PackageGroup : public FourCCMagic<0x50524750 /* 'PGRP' */> {
uint32_t magic;
uint32_t groupNameCrc;
uint32_t fileCount;
uint32_t padding; // 0xcdcdcdcd - padding to 0x10 bytes
};
struct PackageFile : public FourCCMagic<0x4C494650 /* 'PFIL' */> {
uint32_t magic;
uint32_t unk[2]; // Don't know what these are?
// Sequence number of the chunk.
// This represents the order of each chunk,
// presumably so order can just be whatever.
//
// However, the archives seem to order chunks for files
// in order, and doesn't start/interleave other files
// in between of files.
//
// In other words: this is a nice waste of 16 bits.
uint16_t chunkSequenceNumber;
// Amount of chunks which need to be read
// from to read this file completely.
//
// 1 means this file starts and ends on this chunk.
uint16_t chunkAmount;
// A CRC32 hash of the path of this file.
// Hashed with jmmt::HashString().
uint32_t filenameCrc;
uint32_t unk2[7]; // more unknown stuff I don't know about yet
// Uncompressed size of this file chunk. Has a maximum of 65535 bytes.
uint32_t chunkSize;
// Offset where this file chunk should start,
// inside of a larger buffer.
uint32_t blockOffset;
// Compressed (stored) size of this chunk.
uint32_t compressedChunkSize;
// Offset inside of the package file where
// the compressed data blob starts.
uint32_t dataOffset;
uint32_t fileSize;
// TECH LZSS header.
// Used to (shocker) configure LZSS decompression.
//
// Duplicates a few things in the file.
LzssHeader lzssHeader;
};
static_assert(sizeof(PackageEofHeader) == 0xc, "PackageEofHeader has invalid size. Extractor 100% won't work, good job");
static_assert(sizeof(PackageGroup) == 0x10, "PackageGroup has invalid size, extractor won't work");
static_assert(sizeof(PackageFile) == 0x64, "PackageFile has invalid size, extractor won't work");
} // namespace jmmt
#endif // JMMT_PACKAGE_H

View File

@ -0,0 +1,13 @@
add_library(jmmt
crc.cpp
lzss.cpp
)
target_include_directories(jmmt PUBLIC ${PROJECT_SOURCE_DIR}/include)
set_target_properties(jmmt PROPERTIES
CXX_STANDARD 20
CXX_STANDARD_REQUIRED ON
)

75
src/libjmmt/crc.cpp Normal file
View File

@ -0,0 +1,75 @@
#include <jmmt/crc.h>
namespace jmmt {
// Standard Ethernet-II CRC32 polynominal table.
constinit static crc32_t Crc32Table[] = {
0x00000000, 0x77073096, 0xee0e612c, 0x990951ba, 0x076dc419, 0x706af48f,
0xe963a535, 0x9e6495a3, 0x0edb8832, 0x79dcb8a4, 0xe0d5e91e, 0x97d2d988,
0x09b64c2b, 0x7eb17cbd, 0xe7b82d07, 0x90bf1d91, 0x1db71064, 0x6ab020f2,
0xf3b97148, 0x84be41de, 0x1adad47d, 0x6ddde4eb, 0xf4d4b551, 0x83d385c7,
0x136c9856, 0x646ba8c0, 0xfd62f97a, 0x8a65c9ec, 0x14015c4f, 0x63066cd9,
0xfa0f3d63, 0x8d080df5, 0x3b6e20c8, 0x4c69105e, 0xd56041e4, 0xa2677172,
0x3c03e4d1, 0x4b04d447, 0xd20d85fd, 0xa50ab56b, 0x35b5a8fa, 0x42b2986c,
0xdbbbc9d6, 0xacbcf940, 0x32d86ce3, 0x45df5c75, 0xdcd60dcf, 0xabd13d59,
0x26d930ac, 0x51de003a, 0xc8d75180, 0xbfd06116, 0x21b4f4b5, 0x56b3c423,
0xcfba9599, 0xb8bda50f, 0x2802b89e, 0x5f058808, 0xc60cd9b2, 0xb10be924,
0x2f6f7c87, 0x58684c11, 0xc1611dab, 0xb6662d3d, 0x76dc4190, 0x01db7106,
0x98d220bc, 0xefd5102a, 0x71b18589, 0x06b6b51f, 0x9fbfe4a5, 0xe8b8d433,
0x7807c9a2, 0x0f00f934, 0x9609a88e, 0xe10e9818, 0x7f6a0dbb, 0x086d3d2d,
0x91646c97, 0xe6635c01, 0x6b6b51f4, 0x1c6c6162, 0x856530d8, 0xf262004e,
0x6c0695ed, 0x1b01a57b, 0x8208f4c1, 0xf50fc457, 0x65b0d9c6, 0x12b7e950,
0x8bbeb8ea, 0xfcb9887c, 0x62dd1ddf, 0x15da2d49, 0x8cd37cf3, 0xfbd44c65,
0x4db26158, 0x3ab551ce, 0xa3bc0074, 0xd4bb30e2, 0x4adfa541, 0x3dd895d7,
0xa4d1c46d, 0xd3d6f4fb, 0x4369e96a, 0x346ed9fc, 0xad678846, 0xda60b8d0,
0x44042d73, 0x33031de5, 0xaa0a4c5f, 0xdd0d7cc9, 0x5005713c, 0x270241aa,
0xbe0b1010, 0xc90c2086, 0x5768b525, 0x206f85b3, 0xb966d409, 0xce61e49f,
0x5edef90e, 0x29d9c998, 0xb0d09822, 0xc7d7a8b4, 0x59b33d17, 0x2eb40d81,
0xb7bd5c3b, 0xc0ba6cad, 0xedb88320, 0x9abfb3b6, 0x03b6e20c, 0x74b1d29a,
0xead54739, 0x9dd277af, 0x04db2615, 0x73dc1683, 0xe3630b12, 0x94643b84,
0x0d6d6a3e, 0x7a6a5aa8, 0xe40ecf0b, 0x9309ff9d, 0x0a00ae27, 0x7d079eb1,
0xf00f9344, 0x8708a3d2, 0x1e01f268, 0x6906c2fe, 0xf762575d, 0x806567cb,
0x196c3671, 0x6e6b06e7, 0xfed41b76, 0x89d32be0, 0x10da7a5a, 0x67dd4acc,
0xf9b9df6f, 0x8ebeeff9, 0x17b7be43, 0x60b08ed5, 0xd6d6a3e8, 0xa1d1937e,
0x38d8c2c4, 0x4fdff252, 0xd1bb67f1, 0xa6bc5767, 0x3fb506dd, 0x48b2364b,
0xd80d2bda, 0xaf0a1b4c, 0x36034af6, 0x41047a60, 0xdf60efc3, 0xa867df55,
0x316e8eef, 0x4669be79, 0xcb61b38c, 0xbc66831a, 0x256fd2a0, 0x5268e236,
0xcc0c7795, 0xbb0b4703, 0x220216b9, 0x5505262f, 0xc5ba3bbe, 0xb2bd0b28,
0x2bb45a92, 0x5cb36a04, 0xc2d7ffa7, 0xb5d0cf31, 0x2cd99e8b, 0x5bdeae1d,
0x9b64c2b0, 0xec63f226, 0x756aa39c, 0x026d930a, 0x9c0906a9, 0xeb0e363f,
0x72076785, 0x05005713, 0x95bf4a82, 0xe2b87a14, 0x7bb12bae, 0x0cb61b38,
0x92d28e9b, 0xe5d5be0d, 0x7cdcefb7, 0x0bdbdf21, 0x86d3d2d4, 0xf1d4e242,
0x68ddb3f8, 0x1fda836e, 0x81be16cd, 0xf6b9265b, 0x6fb077e1, 0x18b74777,
0x88085ae6, 0xff0f6a70, 0x66063bca, 0x11010b5c, 0x8f659eff, 0xf862ae69,
0x616bffd3, 0x166ccf45, 0xa00ae278, 0xd70dd2ee, 0x4e048354, 0x3903b3c2,
0xa7672661, 0xd06016f7, 0x4969474d, 0x3e6e77db, 0xaed16a4a, 0xd9d65adc,
0x40df0b66, 0x37d83bf0, 0xa9bcae53, 0xdebb9ec5, 0x47b2cf7f, 0x30b5ffe9,
0xbdbdf21c, 0xcabac28a, 0x53b39330, 0x24b4a3a6, 0xbad03605, 0xcdd70693,
0x54de5729, 0x23d967bf, 0xb3667a2e, 0xc4614ab8, 0x5d681b02, 0x2a6f2b94,
0xb40bbe37, 0xc30c8ea1, 0x5a05df1b, 0x2d02ef8d
};
// TODO:
// - Use string_view, because C++20 (& it's cleaner)
crc32_t HashString(const char* s) {
crc32_t crc = 0;
while(*s) {
crc = Crc32Table[(crc ^ (*s++ & ~0x20)) & 0xff] ^ (crc >> 8);
}
return crc;
}
// Hash a string which is case-sensitive.
crc32_t HashStringCase(const char* s) {
crc32_t crc = 0;
while(*s) {
crc = Crc32Table[(crc ^ (*s++)) & 0xff] ^ (crc >> 8);
}
return crc;
}
}

114
src/libjmmt/lzss.cpp Normal file
View File

@ -0,0 +1,114 @@
#include <jmmt/lzss.h>
#include <cstring>
#include <cstdio>
#define LZSS_DEFAULT_RINGSIZE 512
#define LZSS_DEFAULT_MATCHSIZE 66
#define LZSS_EOF -1
#define LZSS_CHUNKSIZE 256
#define LZSS_RINGBITS 9
#define LZSS_THRESHOLD 2
#define LZSS_STALLBIT (30)
#define LZSS_GETBYTE(in,inb,out) \
do { \
if( (inb) <= (nInputBufferIndex) ) \
(out) = -1; \
else \
{ \
/* std::printf("getting '%c'\n", *((in)+nInputBufferIndex)); */ \
(out) = *((uint8_t*)((in)+nInputBufferIndex)); \
nInputBufferIndex++; \
} \
}while(0)
// this version logs what it's going to put and where.
//#define LZSS_PUTBYTE(outp,outb) std::printf("LZSS_PUTBYTE(%llu, %x)\n", outp - oldptr, outb); \
*(outp)++ = (uint8_t)(outb)
#define LZSS_PUTBYTE(outp,outb) *(outp)++ = (uint8_t)(outb)
#define FileIO_ZeroMemory(dst, size) memset(dst, 0, size)
namespace jmmt {
int DecompressLzss(LzssHeader* header, std::uint8_t* compressedInput, std::int32_t compressedLength, std::uint8_t* destBuffer) {
int32_t nRingIndex, nInSize, nInputBufferIndex, nRingBits, nRingSize;
uint8_t aRingBuffer[LZSS_DEFAULT_RINGSIZE], *pRingBuffer;
uint32_t nBitFlags = 0;
std::int32_t nInByte;
//auto* oldptr = destBuffer; // uncomment for logging version of LZSS_PUTBYTE
// TODO: this is where we might want to place header usage. You know, if we need to.
nBitFlags = 0;
nInputBufferIndex = 0;
nInSize = compressedLength;
nRingSize = LZSS_DEFAULT_RINGSIZE;
nRingBits = LZSS_RINGBITS;
nRingIndex = LZSS_DEFAULT_RINGSIZE - LZSS_DEFAULT_MATCHSIZE;
// Use stack allocated default ring buffer
pRingBuffer = &aRingBuffer[0];
FileIO_ZeroMemory(pRingBuffer, nRingSize);
//memset(pRingBuffer, ' ', nRingSize);
for(;;) { // get next 8 opcodes?
if(((nBitFlags >>= 1) & 256) == 0) {
LZSS_GETBYTE(compressedInput, nInSize, nInByte);
if(nInByte == -1)
break;
//std::printf("LZSS new opcodes\n");
// store 255 in upper word, when zero get next 8 opcodes
nBitFlags = nInByte | 0xff00;
}
// single char
if(nBitFlags & 1) {
LZSS_GETBYTE(compressedInput, nInSize, nInByte);
if(nInByte == -1)
break;
//std::printf("LZSS single char '%c'\n", nInByte);
LZSS_PUTBYTE(destBuffer, nInByte);
pRingBuffer[nRingIndex++] = (uint8_t)nInByte;
nRingIndex &= (nRingSize - 1);
}
// string
else { // get position & length pair (note: 1 bit of position is stored in length word)
int32_t i, j;
LZSS_GETBYTE(compressedInput, nInSize, i);
if(i == -1)
break;
LZSS_GETBYTE(compressedInput, nInSize, j);
i |= ((j >> (16 - nRingBits)) << 8);
j = (j & (0x00FF >> (nRingBits - 8))) + LZSS_THRESHOLD;
// std::printf("LZSS string pos %d len %d\n", i , j);
//LZSS_VALIDATE(j <= LZSS_DEFAULT_MATCHSIZE, "Invalid match size for decompression");
for(int32_t k = 0; k <= j; ++k) {
nInByte = pRingBuffer[(i + k) & (nRingSize - 1)];
//std::printf("LZSS string byte '%c'\n", nInByte);
LZSS_PUTBYTE(destBuffer, nInByte);
pRingBuffer[nRingIndex++] = (uint8_t)nInByte;
nRingIndex &= (nRingSize - 1);
}
}
}
return 0;
}
} // namespace jmmt

17
src/tools/CMakeLists.txt Normal file
View File

@ -0,0 +1,17 @@
add_executable(jmmt_renamer jmmt_renamer.cpp)
target_link_libraries(jmmt_renamer PUBLIC jmmt)
set_target_properties(jmmt_renamer PROPERTIES
CXX_STANDARD 20
CXX_STANDARD_REQUIRED ON
)
add_executable(jmmt_pack_extractor jmmt_pack_extractor.cpp)
target_link_libraries(jmmt_pack_extractor PUBLIC jmmt)
set_target_properties(jmmt_pack_extractor PROPERTIES
CXX_STANDARD 20
CXX_STANDARD_REQUIRED ON
)

View File

@ -0,0 +1,272 @@
// Package file extractor.
// WIP, and a little crashy.
// Yes, this code is messy, but I just wanted it to work after days of it not doing so.
#include <jmmt/crc.h>
#include <jmmt/lzss.h>
#include <jmmt/package.h>
#include <filesystem>
#include <fstream>
#include <iostream>
#include <map>
#include <vector>
namespace fs = std::filesystem;
// This is lame. But it works :)
template <class T>
T LameRead(std::istream& is) {
if(!is)
throw std::runtime_error("stream is bad");
T t {};
is.read(reinterpret_cast<char*>(&t), sizeof(T));
return t;
}
/**
* Reads package files.
*/
struct PackageReader {
/**
* Decompressed and un-split package file.
*/
struct DecompressedFile {
std::string filename;
std::vector<std::uint8_t> data;
};
explicit PackageReader(std::istream& is)
: is(is) {
}
void Init() {
is.seekg(-0xc, std::istream::end);
// Read the eof header
eofHeader = LameRead<jmmt::PackageEofHeader>(is);
// We ideally should be at the end of file after reading the eof header.
auto fileSize = is.tellg();
// Seek to the header start and read the pgrp.
is.seekg(static_cast<std::streamsize>(eofHeader.headerStartOffset), std::istream::beg);
group = LameRead<jmmt::PackageGroup>(is);
if(group.magic != jmmt::PackageGroup::TypeMagic) {
fileInvalid = true;
return;
}
// Read the string table, and hash every string out into a map.
// This is used to build our crc->filename mapping for this archive.
{
is.seekg(static_cast<std::streamsize>(eofHeader.headerStartOffset) + static_cast<std::streamsize>(eofHeader.headerSize), std::istream::beg);
auto ReadString = [&]() {
std::string s;
char c {};
while(true) {
c = is.get();
// std::printf("%c\n", c);
if(c == '\0')
return s;
s.push_back(c);
}
};
auto l = is.tellg();
// seek ahead of the "header" of the debug info/string table,
// since we don't care about it (we read strings until we "stop". though
// it might be smart to trust it? idk.)
is.seekg(sizeof(uint32_t), std::istream::cur);
while(l != fileSize - static_cast<std::streamsize>(sizeof(eofHeader))) {
auto string = ReadString();
crcToFilename[jmmt::HashString(string.c_str())] = string;
l = is.tellg();
// print out the creation of the crc/filename map for debugging
// std::printf("%s -> 0x%x\n", string.c_str(), jmmt::HashString(string.c_str()));
}
}
// Go to the start of the first pfil (skipping the pgrp we just read)
// after we setup our map.
is.seekg(static_cast<std::streamsize>(eofHeader.headerStartOffset) + sizeof(jmmt::PackageGroup), std::istream::beg);
}
/**
*
* \return false if file isn't invalid, true otherwise.
*/
[[nodiscard]] bool Invalid() const {
return fileInvalid;
}
// Read a file chunk.
void ReadFileChunk() {
if(fileInvalid)
return;
currChunk = LameRead<jmmt::PackageFile>(is);
if(currChunk.magic != jmmt::PackageFile::TypeMagic) {
fileInvalid = true;
return;
}
// Setup some variables
// TODO: Implement CRC-based fallback, if required.
// It PROBABLY isn't.
currFileName = crcToFilename[currChunk.filenameCrc];
chunksLeft = currChunk.chunkAmount - 1;
// If we finished a file, the work buffer is empty.
if(fileWorkBuffer.empty())
fileWorkBuffer.resize(currChunk.fileSize);
std::vector<std::uint8_t> compressedBuffer(currChunk.compressedChunkSize);
auto old = is.tellg();
is.seekg(currChunk.dataOffset, std::istream::beg);
// Read and decompress where we need to, taking the block offset into account.
is.read(reinterpret_cast<char*>(compressedBuffer.data()), currChunk.compressedChunkSize);
jmmt::DecompressLzss(nullptr, compressedBuffer.data(), currChunk.compressedChunkSize, fileWorkBuffer.data() + currChunk.blockOffset);
// Seek back to the old place the stream was before reading and decompress
is.seekg(old, std::istream::beg);
}
/**
* Read a file from this package.
* \param[in] cb Called when file is read
*/
template <class DoneCallback>
void ReadFile(DoneCallback&& cb) {
if(fileInvalid)
return;
// Read first file chunk.
// It's perfectly legal for this to be all we need to do.
ReadFileChunk();
// Read additional chunks, if required.
for(auto i = 0; i < chunksLeft; ++i) {
// std::printf("reading additional chunk %d/%d\n", i, chunksLeft);
ReadFileChunk();
}
//std::cout << "Read file \"" << currFileName << "\"\n";
cb(DecompressedFile { .filename = currFileName,
.data = fileWorkBuffer });
// write file data to stdout (debugging!)
// std::cout.write(reinterpret_cast<const char*>(fileWorkBuffer.data()), fileWorkBuffer.size());
fileWorkBuffer.clear();
}
/**
* Read all possible files from this package.
* \param[in] cb Called when file is read
*/
template <class DoneCallback>
void ReadFiles(DoneCallback&& cb) {
if(fileInvalid)
return;
for(auto i = 0; i < group.fileCount; ++i)
ReadFile(cb);
}
jmmt::PackageGroup& GetGroup() {
return group;
}
private:
std::istream& is;
// Set to true on any invalid file data.
bool fileInvalid = false;
jmmt::PackageEofHeader eofHeader {};
jmmt::PackageGroup group {};
/**
* CRC->sensible filename map.
*/
std::map<jmmt::crc32_t, std::string> crcToFilename;
// file stuff
uint32_t chunksLeft {};
// The name of the file we are processing.
std::string currFileName;
// The current chunk the reader is reading.
jmmt::PackageFile currChunk {};
// File-sized work buffer used to store the file
// we're currently working on. Freed when a file is
// finished being extracted.
std::vector<std::uint8_t> fileWorkBuffer;
};
int main(int argc, char** argv) {
// std::ifstream ifs("config.pak", std::ifstream::binary);
if(argc != 2) {
std::cout << "Usage: " << argv[0] << " [path 2 JMMT PAK file]";
return 1;
}
std::ifstream ifs(argv[1], std::ifstream::binary);
if(!ifs) {
std::cout << "Invalid file \"" << argv[1] << "\"\n";
return 1;
}
PackageReader reader(ifs);
reader.Init();
if(reader.Invalid()) {
std::cout << "File \"" << argv[1] << "\" doesn't seem to be a PAK file.\n";
return 1;
}
auto path = fs::path(argv[1]).stem();
reader.ReadFiles([&](const auto& file) {
auto outpath = path / file.filename;
fs::create_directories(outpath.parent_path());
std::ofstream ofs(outpath.string(), std::ofstream::binary);
if(!ofs) {
std::cout << "Could not open \"" << outpath.string() << "\".\n";
std::exit(1);
}
ofs.write(reinterpret_cast<const char*>(file.data.data()), static_cast<std::streampos>(file.data.size()));
ofs.close();
std::cout << "Wrote \"" << outpath.string() << "\".\n";
});
return 0;
}

110
src/tools/jmmt_renamer.cpp Normal file
View File

@ -0,0 +1,110 @@
// JMMT .DAT file renamer utility thingy
//
// Renames the .DAT files in /DATA on the disc to
// the original filenames, for easier identification,
// less pain, and.. well just because a bunch of DAT
// files is really stupid to go through every time.
//
// (C) 2022 modeco80.
//
// Usage:
//
// - Compile the tool (or scream at me for a binary)
// - Run the tool in the DATA directory of the files
// - ...
// - Profit?
#include <array>
#include <cstdint>
#include <cstdio>
#include <filesystem>
#include <string>
#include <string_view>
namespace fs = std::filesystem;
#include <jmmt/crc.h>
// These are the original filenames that the game tries to load,
// extracted from the game binary.
//
// We could brute-force these, but since the game has them in executable,
// it's a whole lot faster to just try every game filename and see
// what sticks (& rename it if it does).
constinit static std::array<std::string_view, 20> OriginalFilenames = {
// First loaded by the game
"package.toc",
// General packs
"config.pak",
// This file is referenced in the game files,
// but doesn't seem to exist anymore in the final build.
//"shell.pak",
"shell_character_select.pak",
"shell_main.pak",
"shell_title.pak",
"shell_venue.pak",
"shell_event.pak",
"shell_option.pak",
"win_screens.pak",
// Game levels
"SF_san_fran.pak",
"DC_washington.pak",
"MK_MT_KILI.pak",
"MP_MACHU_PIHU.pak",
"LV_Las_Vegas.pak",
"AN_ANTARTICA.pak",
"NP_Nepal.pak",
"TH_TAHOE.pak",
"VA_Valdez_alaska.pak",
"RV_Rome.pak",
"TR_training.pak"
};
std::string MakeDatFilename(const char* filename) {
char datFile[13] {};
// .DAT and .MET filenames are formatted like "[hex char * 8].DAT"
// The name component is the CRC32 of the original filename.
//
// The DAT/MET filename can be a max of 13 characters long.
int res = std::snprintf(&datFile[0], 13, "%X.DAT", jmmt::HashString(filename));
// FIXME: probably throw exception
if(res == -1)
return "";
return { &datFile[0], static_cast<std::size_t>(res) };
}
int main() {
int renamedFiles = 0;
for(auto filename : OriginalFilenames) {
auto datFile = MakeDatFilename(filename.data());
if(fs::exists(datFile)) {
// Try to rename the .DAT file to the game filename.
try {
fs::rename(datFile, filename);
} catch(std::exception& ex) {
// If there's an error renaming, we already catch
// if the source .DAT file (that's supposed to exist)
// doesn't exist, so print the exception and exit.
std::printf("Got exception: %s\n", ex.what());
return 1;
}
std::printf("\"%s\" -> \"%s\"\n", datFile.c_str(), filename.data());
renamedFiles++;
} else {
// FIXME: should probably stop here?
std::printf("???? Generated hash filename \"%s\" (for \"%s\") which does not exist on disk\n", datFile.c_str(), filename.data());
}
}
std::printf("Renamed %d files successfully.\n", renamedFiles);
return 0;
}