diff options
Diffstat (limited to 'tools/br_ips/br_ips.c')
-rw-r--r-- | tools/br_ips/br_ips.c | 321 |
1 files changed, 321 insertions, 0 deletions
diff --git a/tools/br_ips/br_ips.c b/tools/br_ips/br_ips.c new file mode 100644 index 0000000..64c454a --- /dev/null +++ b/tools/br_ips/br_ips.c @@ -0,0 +1,321 @@ +#define _POSIX_C_SOURCE 200808L // Don't use GNU getline +#include <stdio.h> +#include <stdint.h> +#include <stdlib.h> +#include <ctype.h> +#include <string.h> +#include "global.h" + +static const char SPLASH[] = "IPS patch creator for undisassembled data\n" + "Created by PikalaxALT on 23 June 2019 All Rights Reserved\n"; + +static const char HELP[] = "br_ips\n" + "This utility is meant to be run with no arguments in the project root of a PRET AGB disassembly.\n" + "baserom.gba and ld_script.txt are required files which must be present in the project root.\n" + "ld_script.txt is a GNU linker script. For more details, see\n" + "https://ftp.gnu.org/old-gnu/Manuals/ld-2.9.1/html_chapter/ld_3.html#SEC6.\n" + "All ELF targets in the linker script with Makefile rules \"%.o: %.s\" must have their sources present\n" + "at the indicated paths relative to the project root.\n" + "\n" + "Options:\n" + " -h - show this message and exit\n"; + +static int getline(char ** lineptr, size_t * n, FILE * stream) { + // Static implementation of GNU getline + int i = 0; + int c; + if (n == NULL || lineptr == NULL || stream == NULL) return -1; + size_t size = *n; + char * buf = *lineptr; + if (buf == NULL || size < 4) { + size = 128; + *lineptr = buf = realloc(buf, 128); + } + if (buf == NULL) return -1; + while (1) { + c = getc(stream); + if (c == EOF) break; + buf[i++] = c; + if (c == '\n') break; + if (i == size - 1) { + size <<= 1; + buf = realloc(buf, size); + if (buf == NULL) return -1; + *lineptr = buf; + *n = size; + } + } + if (i == 0) return -1; + buf[i] = 0; + return i; +} + +static void getIncbinsFromFile(hunk_t ** hunks, size_t * num, size_t * maxnum, const char * fname, char ** strbuf, size_t * buffersize) { + // Recursively find incbinned segments and encode them as hunks. + FILE * file = fopen(fname, "r"); + if (file == NULL) FATAL_ERROR("unable to open file \"%s\" for reading\n", fname); + hunk_t * data = *hunks; + size_t nhunks = *num; + size_t maxnhunks = *maxnum; + int line_n = 0; // for error prints + while (getline(strbuf, buffersize, file) > 0) { + line_n++; + // If another file is included by this one, recurse into it. + char * include = strstr(*strbuf, ".include"); + if (include != NULL) { + char incfname[128]; + include = strchr(include, '"'); + if (include == NULL) FATAL_ERROR("%s:%d: malformed include\n", fname, line_n); + include++; + char * endq_p = strchr(include, '"'); + if (endq_p == NULL) FATAL_ERROR("%s:%d: malformed include\n", fname, line_n); + *endq_p = 0; + strcpy(incfname, include); + getIncbinsFromFile(&data, &nhunks, &maxnhunks, incfname, strbuf, buffersize); + continue; + } + // Check for a .incbin "baserom.gba" directive + char * line = strstr(*strbuf, ".incbin"); + if (line == NULL) continue; + line = strstr(line + sizeof(".incbin"), "\"baserom.gba\","); + if (line == NULL) continue; + line += sizeof("\"baserom.gba\",") - 1; + uint32_t incbinOffset; + // Enforce the structure .incbin "baserom.gba", offset, size + // Data cannot be located at offset 0, as that is the entry + // point (ARM code). + do { + if (*line == 0) FATAL_ERROR("%s:%d: malformed incbin\n", fname, line_n); + incbinOffset = strtoul(line, &line, 0); + line++; + } while (incbinOffset == 0); + size_t incbinSize; + do { + if (*line == 0) FATAL_ERROR("%s:%d: malformed incbin\n", fname, line_n); + incbinSize = strtoul(line, &line, 0); + line++; + } while (incbinSize == 0); + // Offset must fit in three bytes + if (incbinOffset >= 0x01000000) FATAL_ERROR("%s:%d: offset exceeds encodable limit\n", fname, line_n); + // Avoid confusion with the end sentinel + if (incbinOffset == 0x454F46) { // "EOF" + incbinOffset--; + incbinSize++; + } + // Cannot read past a certain point due to format restrictions + if (incbinOffset + incbinSize > 0xFFFFFF + 0xFFFF) FATAL_ERROR("%s:%d: size exceeds encodable limit\n", fname, line_n); + // Break up the incbin into hunks of maximum size 0xFFFF + do { + size_t trueSize = incbinSize <= 0xFFFF ? incbinSize : 0xFFFF; + if (nhunks >= maxnhunks) { + maxnhunks <<= 1; + data = realloc(data, maxnhunks * sizeof(hunk_t)); + if (data == NULL) FATAL_ERROR("unable to reallocate hunks buffer\n"); + } + data[nhunks].offset = incbinOffset; + data[nhunks].size = trueSize; + incbinOffset += trueSize; + incbinSize -= trueSize; + if (incbinOffset == 0x454F46) { + incbinOffset--; + data[nhunks].size--; + incbinSize++; + } + nhunks++; + } while (incbinSize > 0); + } + // Error check + if (!feof(file)) FATAL_ERROR("getline\n"); + fclose(file); + *hunks = data; + *num = nhunks; + *maxnum = maxnhunks; +} + +static hunk_t * getAllIncbins(FILE * ld_script, size_t * num_p) { + // Parse the ld script. + // Strict adherence to syntax is expected. + char * line = NULL; + size_t linesiz = 0; + char fname_buf[128]; + size_t maxnum = 256; + size_t num = 0; + // Allocate the hunks array. + hunk_t * hunks = malloc(256 * sizeof(hunk_t)); + if (hunks == NULL) FATAL_ERROR("failed to allocate hunks buffer\n"); + while (getline(&line, &linesiz, ld_script) > 0) { + char * endptr; + // We only expect hunks in rodata, script_data, and gfx_data sections. + if ((endptr = strstr(line, ".o(.rodata);")) == NULL + && (endptr = strstr(line, ".o(script_data);")) == NULL + && (endptr = strstr(line, ".o(gfx_data);")) == NULL) continue; + char * startptr = line; + // Skip whitespace. + while (isspace(*startptr)) startptr++; + if (strstr(startptr, ".a:") != NULL) continue; // no hunks in libs + if (strstr(startptr, "src/") == startptr) continue; // no hunks in src/ + // Replace the extension with .s and truncate the string + endptr[1] = 's'; + endptr[2] = 0; + // We're reusing the already-allocated string buffer, so + // copy the filename to the stack for use in error prints. + strcpy(fname_buf, startptr); + getIncbinsFromFile(&hunks, &num, &maxnum, fname_buf, &line, &linesiz); + } + // Error check + if (!feof(ld_script)) FATAL_ERROR("getline\n"); + free(line); + *num_p = num; + return hunks; +} + +static int cmp_baserom(const void * a, const void * b) { + // Comparison function for sorting Hunk structs. + // For more details, please refer to the qsort man pages. + // See also the function "collapseIncbins" below. + const hunk_t * aa = (const hunk_t *)a; + const hunk_t * bb = (const hunk_t *)b; + return (aa->offset > bb->offset) - (aa->offset < bb->offset); +} + +static void collapseIncbins(hunk_t * hunks, size_t * num_p) { + // This function merges adjacent hunks where possible. + size_t num = *num_p; + // Sort the array by offset increasing. + qsort(hunks, num, sizeof(hunk_t), cmp_baserom); + // We stop at num - 1 because we need to be able to look one + // entry ahead in the hunks array. + for (int i = 0; i < num - 1; i++) { + // Loop until the next hunk is not adjacent to the current. + while (hunks[i].offset + hunks[i].size == hunks[i + 1].offset) { + // If this hunk cannot be merged with the next, proceed to the next. + if (hunks[i].size == 0xFFFF || (hunks[i].size == 0xFFFE && hunks[i + 1].offset == 0x454F45)) break; + // If this hunk is empty, remove it. + if (hunks[i].size == 0) { + int j; + // Find the next non-empty hunk + for (j = i + 1; j < num; j++) { + if (hunks[j].size != 0) break; + } + if (j == num) { + // All remaining hunks are empty + num = i; + break; + } + // Compaction + // Use a for loop instead of memcpy to avoid UB from + // overlapping buffers. + for (int k = 0; k < num - j; k++) hunks[i + k] = hunks[j + k]; + num -= j - i; + if (i >= num - 1) break; + } + else + { + // Combine this hunk with the next + hunks[i].size += hunks[i + 1].size; + if (hunks[i].size > 0xFFFF) { + // Split the hunk back up, it's too big to encode. + // Set the earlier hunk to the maximum permitted size, + // and the following hunk to the remainder. + hunks[i + 1].size = hunks[i].size - 0xFFFF; + hunks[i].size = 0xFFFF; + hunks[i + 1].offset = hunks[i].offset + 0xFFFF; + // If this operation would confuse the hunk with the + // EOF sentinel, fix that. + if (hunks[i + 1].offset == 0x454F46) { + hunks[i].size--; + hunks[i + 1].offset--; + hunks[i + 1].size++; + } + break; + } else { + // Compaction + // Use a for loop instead of memcpy to avoid UB from + // overlapping buffers. + for (int j = i + 1; j < num - 1; j++) hunks[j] = hunks[j + 1]; + num--; + if (i >= num - 1) break; + } + } + } + } + *num_p = num; +} + +static void writePatch(const char * filename, const hunk_t * hunks, size_t num, FILE * rom) { + // Create an IPS patch. + // The file is headed with a magic code which is "PATCH" in ASCII. + // Following that are the "hunks": 3-byte offset, 2-byte size, and + // the literal data. The file is ended with "EOF", again in ASCII. + // For that reason, an offset of 0x454F46 cannot be encoded directly. + // Offset and size are encoded big-endian. + FILE * file = fopen(filename, "wb"); + if (file == NULL) FATAL_ERROR("unable to open file \"%s\" for writing\n", filename); + // Maximum hunk size is 65535 bytes. For convenience, we allocate a + // round 65536 (0x10000). This has no effect on memory consumption, + // as malloc will round this up anyway. + char * readbuf = malloc(0x10000); + if (readbuf == NULL) FATAL_ERROR("failed to allocate write buffer\n"); + fwrite("PATCH", 1, 5, file); // magic + for (int i = 0; i < num; i++) { + // Encode the offset + uint32_t offset = hunks[i].offset; + putc(offset >> 16, file); + putc(offset >> 8, file); + putc(offset >> 0, file); + // Encode the size + size_t size = hunks[i].size; + putc(size >> 8, file); + putc(size >> 0, file); + // Yank the data straight from the ROM + if (fseek(rom, offset, SEEK_SET)) FATAL_ERROR("seek\n"); + if (fread(readbuf, 1, size, rom) != size) FATAL_ERROR("read\n"); + if (fwrite(readbuf, 1, size, file) != size) FATAL_ERROR("write\n"); + } + free(readbuf); + // Write the EOF magic + fwrite("EOF", 1, 3, file); + fclose(file); +} + +// This script takes no arguments. +int main(int argc, char ** argv) { + // Show a friendly message + puts(SPLASH); + // If requested, show help message + if (argc >= 2 && strcmp(argv[1], "-h") == 0) { + puts(HELP); + return 0; + } + // This script expects to be in a PRET AGB disassembly project root. + // Required files include baserom.gba, ld_script.txt, and all paths + // referenced in ld_script.txt relative to the project root. + FILE * rom = fopen("baserom.gba", "rb"); + if (rom == NULL) FATAL_ERROR("unable to open \"baserom.gba\" for reading\n"); + FILE * ld_script = fopen("ld_script.txt", "r"); + if (ld_script == NULL) FATAL_ERROR("unable to open \"ld_script.txt\" for reading\n"); + // Find all instances where segments of baserom.gba are incbinned literaly. + size_t num = 0; + hunk_t * hunks = getAllIncbins(ld_script, &num); + fclose(ld_script); + if (num == 0) { + // If this line is printed, the script was unable to find any + // `.incbin "baserom.gba"` lines. + // If this is incorrect, please contact the developer. + puts("No baserom.gba hunks found!\n" + "If there are baserom.gba hunks in this project,\n" + "please ping PikalaxALT on the pret discord,\n" + "channel #gen-3-help.\n"); + } else { + // Merge neighboring hunks to reduce the number of hunks. + collapseIncbins(hunks, &num); + // Encode the hunks in the IPS patch. + writePatch("baserom.ips", hunks, num, rom); + // Communicate status to the user. + puts("IPS file created at baserom.ips\n"); + } + // Clean up and return. + fclose(rom); + free(hunks); + return 0; +} |