jak-project/decompiler/config.cpp

410 lines
17 KiB
C++
Raw Permalink Normal View History

2020-08-22 23:30:17 -04:00
#include "config.h"
#include "common/log/log.h"
#include "common/util/FileUtil.h"
#include "common/util/json_util.h"
#include "decompiler/util/config_parsers.h"
2020-08-22 23:30:17 -04:00
#include "fmt/core.h"
namespace decompiler {
2020-08-22 23:30:17 -04:00
void from_json(const nlohmann::json& j, TexInfo& info) {
j.at("name").get_to(info.name);
j.at("tpage_name").get_to(info.tpage_name);
j.at("idx").get_to(info.idx);
}
void to_json(nlohmann::json& j, const TexInfo& info) {
j = {
{"name", info.name},
{"tpage_name", info.tpage_name},
{"idx", info.idx},
};
}
namespace {
/*!
* Read an entry from cfg containing the name of a json file, and parse that file.
* Relative to jak-project directory.
*/
nlohmann::json read_json_file_from_config(const nlohmann::json& json, const std::string& file_key) {
auto file_name = json.at(file_key).get<std::string>();
auto file_txt = file_util::read_text_file(file_util::get_file_path({file_name}));
return parse_commented_json(file_txt, file_name);
}
Config make_config_via_json(nlohmann::json& json) {
Config config;
int version_int = json.at("game_version").get<int>();
ASSERT(version_int == 1 || version_int == 2 || version_int == 3);
config.game_version = (GameVersion)version_int;
config.text_version = json.at("text_version").get<GameTextVersion>();
config.game_name = json.at("game_name").get<std::string>();
if (json.contains("expected_elf_name")) {
config.expected_elf_name = json.at("expected_elf_name").get<std::string>();
}
config.all_types_file = json.at("all_types_file").get<std::string>();
2020-08-22 23:30:17 -04:00
auto inputs_json = read_json_file_from_config(json, "inputs_file");
config.dgo_names = json.contains("dgo_names")
? json.at("dgo_names").get<std::vector<std::string>>()
: inputs_json.at("dgo_names").get<std::vector<std::string>>();
config.object_file_names = inputs_json.at("object_file_names").get<std::vector<std::string>>();
config.str_file_names = inputs_json.at("str_file_names").get<std::vector<std::string>>();
if (inputs_json.contains("str_texture_file_names")) {
config.str_texture_file_names =
inputs_json.at("str_texture_file_names").get<std::vector<std::string>>();
}
if (inputs_json.contains("str_art_file_names")) {
config.str_art_file_names =
inputs_json.at("str_art_file_names").get<std::vector<std::string>>();
}
config.streamed_audio_file_names =
inputs_json.at("streamed_audio_file_names").get<std::vector<std::string>>();
if (json.contains("art_group_dump_file")) {
auto json_data = file_util::read_text_file(
file_util::get_file_path({json.at("art_group_dump_file").get<std::string>()}));
std::unordered_map<std::string, std::unordered_map<int, std::string>> serialized =
parse_commented_json(json_data, "art_group_dump_file");
config.art_group_info_dump = serialized;
}
if (json.contains("joint_node_dump_file")) {
auto json_data = file_util::read_text_file(
file_util::get_file_path({json.at("joint_node_dump_file").get<std::string>()}));
std::unordered_map<std::string, std::unordered_map<int, std::string>> serialized =
parse_commented_json(json_data, "joint_node_dump_file");
config.jg_info_dump = serialized;
}
if (json.contains("tex_dump_file")) {
auto json_data = file_util::read_text_file(
file_util::get_file_path({json.at("tex_dump_file").get<std::string>()}));
std::unordered_map<u32, TexInfo> serialized = parse_commented_json(json_data, "tex_dump_file");
config.texture_info_dump = serialized;
}
if (json.contains("obj_file_name_map_file")) {
config.obj_file_name_map_file = json.at("obj_file_name_map_file").get<std::string>();
}
config.disassemble_code = json.at("disassemble_code").get<bool>();
config.decompile_code = json.at("decompile_code").get<bool>();
g/j1: Cleanup all main issues in the formatter and format all of `goal_src/jak1` (#3535) This PR does two main things: 1. Work through the main low-hanging fruit issues in the formatter keeping it from feeling mature and usable 2. Iterate and prove that point by formatting all of the Jak 1 code base. **This has removed around 100K lines in total.** - The decompiler will now format it's results for jak 1 to keep things from drifting back to where they were. This is controlled by a new config flag `format_code`. How am I confident this hasn't broken anything?: - I compiled the entire project and stored it's `out/jak1/obj` files separately - I then recompiled the project after formatting and wrote a script that md5's each file and compares it (`compare-compilation-outputs.py` - The results (eventually) were the same: ![Screenshot 2024-05-25 132900](https://github.com/open-goal/jak-project/assets/13153231/015e6f20-8d19-49b7-9951-97fa88ddc6c2) > This proves that the only difference before and after is non-critical whitespace for all code/macros that is actually in use. I'm still aware of improvements that could be made to the formatter, as well as general optimization of it's performance. But in general these are for rare or non-critical situations in my opinion and I'll work through them before doing Jak 2. The vast majority looks great and is working properly at this point. Those known issues are the following if you are curious: ![image](https://github.com/open-goal/jak-project/assets/13153231/0edfaba1-6d36-40f5-ab23-0642209867c4)
2024-06-05 22:17:31 -04:00
if (json.contains("format_code")) {
config.format_code = json.at("format_code").get<bool>();
}
config.write_hex_near_instructions = json.at("write_hex_near_instructions").get<bool>();
config.write_scripts = json.at("write_scripts").get<bool>();
config.disassemble_data = json.at("disassemble_data").get<bool>();
config.process_tpages = json.at("process_tpages").get<bool>();
config.write_tpage_imports = json.at("write_tpage_imports").get<bool>();
config.process_game_text = json.at("process_game_text").get<bool>();
config.process_game_count = json.at("process_game_count").get<bool>();
config.process_art_groups = json.at("process_art_groups").get<bool>();
if (json.contains("process_subtitle_text")) {
config.process_subtitle_text = json.at("process_subtitle_text").get<bool>();
}
if (json.contains("process_subtitle_images")) {
config.process_subtitle_images = json.at("process_subtitle_images").get<bool>();
}
config.dump_art_group_info = json.at("dump_art_group_info").get<bool>();
config.dump_joint_geo_info = json.at("dump_joint_geo_info").get<bool>();
config.dump_tex_info = json.at("dump_tex_info").get<bool>();
config.hexdump_code = json.at("hexdump_code").get<bool>();
config.hexdump_data = json.at("hexdump_data").get<bool>();
config.find_functions = json.at("find_functions").get<bool>();
config.dump_objs = json.at("dump_objs").get<bool>();
config.print_cfgs = json.at("print_cfgs").get<bool>();
config.generate_symbol_definition_map = json.at("generate_symbol_definition_map").get<bool>();
config.is_pal = json.at("is_pal").get<bool>();
config.rip_levels = json.at("rip_levels").get<bool>();
config.extract_collision = json.at("extract_collision").get<bool>();
config.generate_all_types = json.at("generate_all_types").get<bool>();
if (json.contains("read_spools")) {
config.read_spools = json.at("read_spools").get<bool>();
}
if (json.contains("ignore_var_name_casts")) {
config.ignore_var_name_casts = json.at("ignore_var_name_casts").get<bool>();
}
if (json.contains("old_all_types_file")) {
config.old_all_types_file = json.at("old_all_types_file").get<std::string>();
}
auto allowed = json.at("allowed_objects").get<std::vector<std::string>>();
for (const auto& x : allowed) {
config.allowed_objects.insert(x);
}
auto banned = json.at("banned_objects").get<std::vector<std::string>>();
for (const auto& x : banned) {
config.banned_objects.insert(x);
}
auto type_casts_json = read_json_file_from_config(json, "type_casts_file");
if (json.contains("type_casts_merge_file")) {
type_casts_json.update(read_json_file_from_config(json, "type_casts_merge_file"));
}
for (auto& kv : type_casts_json.items()) {
auto& function_name = kv.key();
auto& casts = kv.value();
for (auto& cast : casts) {
if (cast.at(0).is_string()) {
auto cast_name = cast.at(0).get<std::string>();
if (cast_name == "_stack_") {
// it's a stack var cast
StackTypeCast stack_cast;
stack_cast.stack_offset = cast.at(1).get<int>();
stack_cast.type_name = cast.at(2).get<std::string>();
config.stack_type_casts_by_function_by_stack_offset[function_name]
[stack_cast.stack_offset] = stack_cast;
} else {
throw std::runtime_error(fmt::format("Unknown cast type: {}", cast_name));
}
} else {
auto idx_range = parse_json_optional_integer_range(cast.at(0));
for (auto idx : idx_range) {
RegisterTypeCast type_cast;
type_cast.atomic_op_idx = idx;
type_cast.reg = Register(cast.at(1).get<std::string>());
type_cast.type_name = cast.at(2).get<std::string>();
config.register_type_casts_by_function_by_atomic_op_idx[function_name][idx].push_back(
type_cast);
}
}
}
}
auto anon_func_json = read_json_file_from_config(json, "anonymous_function_types_file");
if (json.contains("anonymous_function_types_merge_file")) {
anon_func_json.update(read_json_file_from_config(json, "anonymous_function_types_merge_file"));
}
for (auto& kv : anon_func_json.items()) {
auto& obj_file_name = kv.key();
auto& anon_types = kv.value();
for (auto& anon_type : anon_types) {
auto id = anon_type.at(0).get<int>();
const auto& type_name = anon_type.at(1).get<std::string>();
config.anon_function_types_by_obj_by_id[obj_file_name][id] = type_name;
}
}
if (!config.ignore_var_name_casts) {
auto var_names_json = read_json_file_from_config(json, "var_names_file");
for (auto& kv : var_names_json.items()) {
auto& function_name = kv.key();
auto arg = kv.value().find("args");
if (arg != kv.value().end()) {
for (auto& x : arg.value()) {
config.function_arg_names[function_name].push_back(x);
}
}
auto var = kv.value().find("vars");
if (var != kv.value().end()) {
for (auto& vkv : var->get<std::unordered_map<std::string, nlohmann::json>>()) {
LocalVarOverride override;
if (vkv.second.is_string()) {
override.name = vkv.second.get<std::string>();
} else if (vkv.second.is_array()) {
override.name = vkv.second[0].get<std::string>();
override.type = vkv.second[1].get<std::string>();
} else {
throw std::runtime_error("Invalid function var override.");
}
config.function_var_overrides[function_name][vkv.first] = override;
}
}
}
}
auto label_types_json = read_json_file_from_config(json, "label_types_file");
if (json.contains("label_types_merge_file")) {
label_types_json.update(read_json_file_from_config(json, "label_types_merge_file"));
}
for (auto& kv : label_types_json.items()) {
auto& obj_name = kv.key();
auto& types = kv.value();
for (auto& x : types) {
const auto& name = x.at(0).get<std::string>();
const auto& type_name = x.at(1).get<std::string>();
bool is_val = false;
std::optional<int> array_size;
if (x.size() > 2) {
if (x.at(2).is_boolean()) {
is_val = x.at(2).get<bool>();
} else {
array_size = x.at(2).get<int>();
}
}
auto& config_entry = config.label_types[obj_name][name];
config_entry = {is_val, type_name, array_size};
}
}
auto stack_structures_json = read_json_file_from_config(json, "stack_structures_file");
if (json.contains("stack_structures_merge_file")) {
stack_structures_json.update(read_json_file_from_config(json, "stack_structures_merge_file"));
}
for (auto& kv : stack_structures_json.items()) {
auto& func_name = kv.key();
auto& stack_structures = kv.value();
config.stack_structure_hints_by_function[func_name] =
parse_stack_structure_hints(stack_structures);
}
auto hacks_json = read_json_file_from_config(json, "hacks_file");
if (json.contains("hacks_merge_file")) {
// NOTE - here we merge one level deeper because it's worth doing here
// - chances are you just need to override a few individual hacks
const auto hack_overrides = read_json_file_from_config(json, "hacks_merge_file");
for (const auto& entry : hack_overrides.items()) {
if (hacks_json.contains(entry.key())) {
// If the parent json file has this, update it
hacks_json.at(entry.key()).update(entry.value());
} else {
// Otherwise, we append it
hacks_json[entry.key()] = entry.value();
}
}
}
config.hacks.hint_inline_assembly_functions =
hacks_json.at("hint_inline_assembly_functions").get<std::unordered_set<std::string>>();
config.hacks.asm_functions_by_name =
hacks_json.at("asm_functions_by_name").get<std::unordered_set<std::string>>();
config.hacks.pair_functions_by_name =
hacks_json.at("pair_functions_by_name").get<std::unordered_set<std::string>>();
config.hacks.no_type_analysis_functions_by_name =
hacks_json.at("no_type_analysis_functions_by_name").get<std::unordered_set<std::string>>();
config.hacks.types_with_bad_inspect_methods =
hacks_json.at("types_with_bad_inspect_methods").get<std::unordered_set<std::string>>();
config.hacks.reject_cond_to_value = hacks_json.at("aggressively_reject_cond_to_value_rewrite")
.get<std::unordered_set<std::string>>();
config.hacks.blocks_ending_in_asm_branch_by_func_name =
hacks_json.at("blocks_ending_in_asm_branch")
.get<std::unordered_map<std::string, std::unordered_set<int>>>();
config.hacks.format_ops_with_dynamic_string_by_func_name =
hacks_json.at("dynamic_format_arg_counts")
.get<std::unordered_map<std::string, std::vector<std::vector<int>>>>();
config.hacks.mips2c_functions_by_name =
hacks_json.at("mips2c_functions_by_name").get<std::unordered_set<std::string>>();
config.hacks.mips2c_jump_table_functions =
hacks_json.at("mips2c_jump_table_functions")
.get<std::unordered_map<std::string, std::vector<int>>>();
for (auto& entry : hacks_json.at("cond_with_else_max_lengths")) {
auto func_name = entry.at(0).get<std::string>();
auto cond_name = entry.at(1).get<std::string>();
auto max_len = entry.at(2).get<int>();
config.hacks.cond_with_else_len_by_func_name[func_name].max_length_by_start_block[cond_name] =
max_len;
}
for (auto& entry : hacks_json.at("missing_textures")) {
int tpage = entry.at(1).get<int>();
int idx = entry.at(2).get<int>();
config.hacks.missing_textures_by_level[entry.at(0).get<std::string>()].emplace_back(tpage, idx);
}
config.bad_format_strings =
hacks_json.at("bad_format_strings").get<std::unordered_map<std::string, int>>();
auto merged = hacks_json.at("expected_merged_objs").get<std::vector<std::string>>();
for (const auto& x : merged) {
config.merged_objects.insert(x);
}
config.levels_to_extract = inputs_json.at("levels_to_extract").get<std::vector<std::string>>();
config.levels_extract = json.at("levels_extract").get<bool>();
if (json.contains("save_texture_pngs")) {
config.save_texture_pngs = json.at("save_texture_pngs").get<bool>();
}
if (json.contains("rip_streamed_audio")) {
config.rip_streamed_audio = json.at("rip_streamed_audio").get<bool>();
}
if (inputs_json.contains("animated_textures")) {
config.animated_textures =
inputs_json.at("animated_textures").get<std::unordered_set<std::string>>();
}
if (inputs_json.contains("common_tpages")) {
config.common_tpages = inputs_json.at("common_tpages").get<std::unordered_set<int>>();
}
auto art_info_json = read_json_file_from_config(json, "art_info_file");
config.art_group_type_remap =
art_info_json.at("type_remap").get<std::unordered_map<std::string, std::string>>();
if (art_info_json.contains("file_override")) {
config.art_group_file_override =
art_info_json.at("file_override")
.get<std::unordered_map<std::string, std::unordered_map<std::string, std::string>>>();
}
config.joint_node_hacks =
art_info_json.at("joint_node_hacks").get<std::unordered_map<std::string, std::string>>();
auto import_deps = read_json_file_from_config(json, "import_deps_file");
config.import_deps_by_file =
import_deps.get<std::unordered_map<std::string, std::vector<std::string>>>();
if (json.contains("rip_collision")) {
config.rip_collision = json.at("rip_collision").get<bool>();
}
config.write_patches = json.at("write_patches").get<bool>();
config.apply_patches = json.at("apply_patches").get<bool>();
const auto& object_patches = json.at("object_patches");
for (auto& [obj, pch] : object_patches.items()) {
ObjectPatchInfo new_pch;
new_pch.crc = (u32)std::stoull(pch.at("crc32").get<std::string>(), nullptr, 16);
new_pch.target_file = pch.at("in").get<std::string>();
new_pch.patch_file = pch.at("out").get<std::string>();
config.object_patches.insert({obj, new_pch});
}
decomp3: more engine stuff, detect non-virtual state inheritance (#3377) - `speech` - `ambient` - `water-h` - `vol-h` - `generic-obs` - `carry-h` - `pilot-h` - `board-h` - `gun-h` - `flut-h` - `indax-h` - `lightjak-h` - `darkjak-h` - `target-util` - `history` - `collide-reaction-target` - `logic-target` - `sidekick` - `projectile` - `voicebox` - `ragdoll-edit` - most of `ragdoll` (not added to gsrc yet) - `curves` - `find-nearest` - `lightjak-wings` - `target-handler` - `target-anim` - `target` - `target2` - `target-swim` - `target-lightjak` - `target-invisible` - `target-death` - `target-gun` - `gun-util` - `board-util` - `target-board` - `board-states` - `mech-h` - `vol` - `vent` - `viewer` - `gem-pool` - `collectables` - `crates` - `secrets-menu` Additionally: - Detection of non-virtual state inheritance - Added a config file that allows overriding the process stack size set by `stack-size-set!` calls - Fix for integer multiplication with `r0` - Fixed detection for the following macros: - `static-attack-info` - `defpart` and `defpartgroup` (probably still needs adjustments, uses Jak 2 implementation at the moment) - `sound-play` (Jak 3 seems to always call `sound-play-by-name` with a `sound-group` of 0, so the macro has been temporarily defaulted to use that) One somewhat significant change made here that should be noted is that the return type of `process::init-from-entity!` was changed to `object`. I've been thinking about this for a while, since it looks a bit nicer without the `(none)` at the end and I have recently encountered init methods that early return `0`.
2024-03-03 15:15:27 -05:00
auto process_stack_size_json = read_json_file_from_config(json, "process_stack_size_file");
config.process_stack_size_overrides =
process_stack_size_json.get<std::unordered_map<std::string, int>>();
return config;
}
} // namespace
/*!
* Parse the main config file and return decompiler config.
*/
Config read_config_file(const fs::path& path_to_config_file,
const std::string& config_game_version,
const std::string& override_json) {
Config config;
auto config_str = file_util::read_text_file(path_to_config_file);
auto json = parse_commented_json(config_str, path_to_config_file.string());
// First, check if we need to update the JSON from the game versions overrides
if (json.contains("version_overrides")) {
if (!json.at("version_overrides").contains(config_game_version)) {
throw std::runtime_error(fmt::format(
"'{}' provided which doesn't correspond with a 'version_overrides", config_game_version));
}
lg::info("Game Config Overide: '{}'", config_game_version);
json.update(json.at("version_overrides").at(config_game_version));
}
// Then, update any config overrides
if (override_json != "{}" && !override_json.empty()) {
lg::info("Config Override: '{}'", override_json);
auto cfg_override = parse_commented_json(override_json, "");
json.update(cfg_override, true);
}
// debugging, dump the JSON config to a file
// fs::path debug_path = path_to_config_file.parent_path() / "config-debug.jsonc";
// file_util::write_text_file(debug_path, json.dump(2));
// Lastly, update the struct via the JSON
return make_config_via_json(json);
}
} // namespace decompiler