/* SPDX-License-Identifier: Unlicense */ #include "disasm.h" #include "data_buffer.h" #include "common.h" #define OPTPARSE_IMPLEMENTATION #define OPTPARSE_API static #include "optparse/optparse.h" #include #include #include #include #include #include #include #include class DisasmMap { DisasmNode *_map[kDisasmMapSizeElements]{}; DisasmNode *findNodeByOffset(uint32_t offset) const; DisasmNode *insertTracedNode(uint32_t offset, TracedNodeType); public: const DisasmNode *FindNodeByOffset(uint32_t offset) const { return findNodeByOffset(offset); }; // Returns true if node inserted, false if node already exist and has not // been changed bool InsertTracedNode(uint32_t offset, TracedNodeType type) { return nullptr != insertTracedNode(offset, type); } // This function disassembles everything that has been traced void DisasmAll(const DataBuffer &code, const Settings &); ~DisasmMap(); }; DisasmNode *DisasmMap::findNodeByOffset(uint32_t offset) const { if (offset < kRomSizeBytes) return _map[offset / kInstructionSizeStepBytes]; return nullptr; } DisasmNode *DisasmMap::insertTracedNode(uint32_t offset, TracedNodeType type) { auto *node = findNodeByOffset(offset); if (node) { return node; } node = new DisasmNode(DisasmNode{type, offset}); assert(node); _map[offset / kInstructionSizeStepBytes] = node; return node; } void DisasmMap::DisasmAll(const DataBuffer &code, const Settings & s) { for (size_t i = 0; i < kDisasmMapSizeElements; i++) { auto *node = _map[i]; if (!node) { continue; } node->Disasm(code, s); if (node->has_branch_addr && node->branch_addr < code.occupied_size) { auto *ref_node = insertTracedNode( node->branch_addr, TracedNodeType::kInstruction); ref_node->Disasm(code, s); ref_node->AddReferencedBy( node->offset, node->is_call ? ReferenceType::kCall : ReferenceType::kBranch); } } } DisasmMap::~DisasmMap() { for (size_t i = 0; i < kDisasmMapSizeElements; i++) { delete _map[i]; _map[i] = nullptr; } } static size_t RenderRawDataComment( char *out, size_t out_sz, uint32_t offset, size_t instr_sz, const DataBuffer &code) { size_t overall_sz{}; for (size_t i = 0; i < instr_sz; i += kInstructionSizeStepBytes) { overall_sz += Min( out_sz - overall_sz, snprintf( out + overall_sz, out_sz - overall_sz, " %04x", GetU16BE(code.buffer + offset + i))); } overall_sz += Min( out_sz - overall_sz, snprintf(out + overall_sz, out_sz - overall_sz, " @%08x", offset)); return overall_sz; } static const char *ReferenceTypeToString(ReferenceType type) { switch (type) { case ReferenceType::kUnknown: return "UNKN"; case ReferenceType::kBranch: return "BRANCH"; case ReferenceType::kCall: return "CALL"; } return "UNKN"; } static void RenderDisassembly( FILE *output, const DisasmMap &disasm_map, const DataBuffer &code, const Settings &s) { for (size_t i = 0; i < code.occupied_size;) { const DisasmNode *node = disasm_map.FindNodeByOffset(i); if (node) { if (node->ref_by) { if (s.xrefs_from) { fprintf(output, "| XREFS:\n"); for (ReferenceNode *ref{node->ref_by}; ref; ref = ref->next) { if (ref->refs_count == 0) { continue; } fprintf(output, "|"); for (size_t i = 0; i < ref->refs_count; i++) { const ReferenceRecord r = ref->refs[i]; fprintf(output, " %s @%08x", ReferenceTypeToString(r.type), r.address); } fprintf(output, "\n"); } } if (s.marks) { fprintf(output, ".L%08x:\n", node->offset); } } const char *const delimiter = node->arguments[0] != '\0' ? " " : ""; fprintf(output, " %s%s%s", node->mnemonic, delimiter, node->arguments); if (node->has_branch_addr && s.xrefs_to) { char branch_addr[12]{}; snprintf(branch_addr, sizeof(branch_addr), " .L%08x", node->branch_addr); fprintf(output, " |%s", branch_addr); } if (s.raw_data_comment) { char raw_data_comment[100]{}; RenderRawDataComment(raw_data_comment, sizeof(raw_data_comment) - 1, node->offset, node->size, code); fprintf(output, " |%s", raw_data_comment); } fprintf(output, "\n"); i += node->size; } else { fprintf(output, " .short 0x%02x%02x\n", code.buffer[i], code.buffer[i + 1]); i += kInstructionSizeStepBytes; } } } static void ParseTraceData(DisasmMap &disasm_map, const DataBuffer &trace_data) { // FIXME make a full blown parser with various radixes support and different // trace types support bool parse = true; for (size_t i = 0; i < trace_data.occupied_size; i++) { if (trace_data.buffer[i] == '\n' || trace_data.buffer[i] == '\r') { parse = true; } else if (parse) { errno = 0; char *startptr = reinterpret_cast(trace_data.buffer + i); char *endptr = startptr; const long offset = strtol(startptr, &endptr, 10); if ((offset == LONG_MAX || offset == LONG_MIN) && errno == ERANGE) { // Error, just skip } else if (startptr == endptr) { // Error, just skip } else { // Valid value disasm_map.InsertTracedNode(offset, TracedNodeType::kInstruction); } if (startptr != endptr) { i += endptr - startptr - 1; } parse = false; } } } static size_t ReadFromStream(DataBuffer &db, FILE *stream) { assert(db.buffer && db.buffer_size >= db.kInitialSize); while (1) { const size_t read_size = db.buffer_size - db.occupied_size; const size_t fread_ret = fread( db.buffer + db.occupied_size, sizeof(*db.buffer), read_size, stream); db.occupied_size += fread_ret; if (fread_ret >= db.buffer_size) { assert(fread_ret == db.buffer_size); db.Expand(db.buffer_size * 2); } else { const int err = errno; if (feof(stream)) { break; } else if (ferror(stream)) { fprintf(stderr, "ReadFromStream: fread(%zu): Error (%d): \"%s\"\n", read_size, err, strerror(err)); return EXIT_FAILURE; } else if (db.buffer_size == db.occupied_size) { db.Expand(db.buffer_size * 2); } else { assert(false); } } } return db.occupied_size; } static int M68kDisasmByTrace(FILE *input_stream, FILE *output_stream, FILE *trace_stream, const Settings &s) { // Read machine code into buffer DataBuffer code{}; const size_t input_size = ReadFromStream(code, input_stream); if (input_size == 0) { fprintf(stderr, "ReadFromStream(code, input_stream): Error: No data has been read\n"); return EXIT_FAILURE; } // Expand a little just in case there is truncated instruction in the end of // the buffer so it will not fall out of buffer trying to fetch arguments // from additional extension words. if (code.occupied_size + 100 > code.buffer_size) { code.Expand(code.occupied_size + 100); } // Read trace file into buffer DataBuffer trace_data{}; const size_t trace_size = ReadFromStream(trace_data, trace_stream); if (trace_size == 0) { fprintf(stderr, "ReadFromStream(trace_data, trace_stream): Error: No data has been read\n"); return EXIT_FAILURE; } // Parse trace file into map DisasmMap *disasm_map = new DisasmMap{}; assert(disasm_map); ParseTraceData(*disasm_map, trace_data); // Disasm into output map disasm_map->DisasmAll(code, s); // Print output into output_stream RenderDisassembly(output_stream, *disasm_map, code, s); delete disasm_map; return 0; } static int M68kDisasmAll(FILE *input_stream, FILE *output_stream, const Settings &) { uint8_t instruction[kInstructionSizeStepBytes]{}; const size_t read_size = kInstructionSizeStepBytes; while (1) { const size_t fread_ret = fread(instruction, 1, read_size, input_stream); if (fread_ret == 0) { const int err = errno; if (feof(input_stream)) { break; } else { fprintf(stderr, "ReadFromStream: fread(%zu): Error (%d): \"%s\"\n", read_size, err, strerror(err)); return EXIT_FAILURE; } } fprintf(output_stream, " .short 0x%02x%02x\n", instruction[0], instruction[1]); } return 0; } static bool IsValidFeature(const char *feature) { constexpr size_t sizeof_no_prefix = strlen("no-"); if (0 == memcmp(feature, "no-", sizeof_no_prefix)) { feature += sizeof_no_prefix; } if (0 == strcmp(feature, "rdc")) { return true; } else if (0 == strcmp(feature, "marks")) { return true; } else if (0 == strcmp(feature, "rel-marks")) { return true; } else if (0 == strcmp(feature, "abs-marks")) { return true; } else if (0 == strcmp(feature, "xrefs-from")) { return true; } else if (0 == strcmp(feature, "xrefs-to")) { return true; } return false; } static void ApplyFeature(Settings& s, const char *feature) { bool disable{}; constexpr size_t sizeof_no_prefix = strlen("no-"); if (0 == memcmp(feature, "no-", sizeof_no_prefix)) { disable = true; feature += sizeof_no_prefix; } if (0 == strcmp(feature, "rdc")) { s.raw_data_comment = !disable; } else if (0 == strcmp(feature, "marks")) { s.marks = !disable; } else if (0 == strcmp(feature, "rel-marks")) { s.rel_marks = !disable; } else if (0 == strcmp(feature, "abs-marks")) { s.abs_marks = !disable; } else if (0 == strcmp(feature, "xrefs-from")) { s.xrefs_from = !disable; } else if (0 == strcmp(feature, "xrefs-to")) { s.xrefs_to = !disable; } } static void PrintUsage(FILE *s, const char *argv0) { fprintf(s, "Usage: %s [options] []\n", argv0); fprintf(s, "Options:\n"); fprintf(s, " -h, --help, Show this message\n"); fprintf(s, " -o, --output, Where to write disassembly to (stdout if not set)\n"); fprintf(s, " -t, --pc-trace, File containing PC trace\n"); fprintf(s, " -f, --feature=[no-]\n"); fprintf(s, " Enable or disable (with \"no-\" prefix) a feature\n"); fprintf(s, " Available features:\n"); fprintf(s, " rdc print raw data comment\n"); fprintf(s, " marks print marks above all places that have jumps\n"); fprintf(s, " from somewhere\n"); fprintf(s, " rel-marks use mark instead of number on relative\n"); fprintf(s, " branch or call\n"); fprintf(s, " abs-marks use mark instead of number on absolute\n"); fprintf(s, " branch or call\n"); fprintf(s, " xrefs-from print xrefs comments above all places that\n"); fprintf(s, " have xrefs\n"); fprintf(s, " xrefs-to print xrefs comments after all branch \n"); fprintf(s, " instructions\n"); fprintf(s, " Binary file with machine code (stdin if not set)\n"); } int main(int, char* argv[]) { struct optparse_long longopts[] = { {"help", 'h', OPTPARSE_NONE}, {"output", 'o', OPTPARSE_REQUIRED}, {"pc-trace", 't', OPTPARSE_REQUIRED}, {"feature", 'f', OPTPARSE_OPTIONAL}, {}, }; const char *trace_file_name = nullptr; const char *output_file_name = nullptr; const char *input_file_name = nullptr; Settings s{}; struct optparse options; optparse_init(&options, argv); // Parse opts int option; while ((option = optparse_long(&options, longopts, NULL)) != -1) { switch (option) { case 'h': PrintUsage(stdout, argv[0]); return EXIT_SUCCESS; break; case 'o': output_file_name = options.optarg; break; case 't': trace_file_name = options.optarg; break; case 'f': if (!IsValidFeature(options.optarg)) { fprintf(stderr, "main: Error: Unknown feature \"%s\", exiting\n", options.optarg); return EXIT_FAILURE; } ApplyFeature(s, options.optarg); break; case '?': fprintf(stderr, "main: optparse_long: Error: \"%s\"\n", options.errmsg); return EXIT_FAILURE; } } // Parse input file name char *arg; while ((arg = optparse_arg(&options))) { if (input_file_name == nullptr) { input_file_name = arg; } else { fprintf(stderr, "error: too many free arguments provided\n"); return EXIT_FAILURE; } } // Open the files FILE *input_stream = stdin; FILE *output_stream = stdout; FILE *trace_stream = nullptr; if (input_file_name) { input_stream = fopen(input_file_name, "r"); if (input_stream == nullptr) { const int err = errno; fprintf(stderr, "main: fopen(\"%s\", \"r\"): Error (%d): \"%s\"\n", input_file_name, err, strerror(err)); return EXIT_FAILURE; } } if (output_file_name) { output_stream = fopen(output_file_name, "w"); if (output_stream == nullptr) { const int err = errno; fprintf(stderr, "main: fopen(\"%s\", \"w\"): Error (%d): \"%s\"\n", output_file_name, err, strerror(err)); return EXIT_FAILURE; } } if (trace_file_name) { trace_stream = fopen(trace_file_name, "r"); if (trace_stream == nullptr) { const int err = errno; fprintf(stderr, "main: fopen(\"%s\", \"r\"): Error (%d): \"%s\"\n", trace_file_name, err, strerror(err)); return EXIT_FAILURE; } } // Run the program const int ret = trace_stream ? M68kDisasmByTrace(input_stream, output_stream, trace_stream, s) : M68kDisasmAll(input_stream, output_stream, s); if (trace_stream != nullptr) { fclose(trace_stream); } if (output_stream != stdout) { fclose(output_stream); } if (input_stream != stdin) { fclose(input_stream); } return ret; }