// Copyright 2014 Citra Emulator Project // Licensed under GPLv2 // Refer to the license.txt file included. #include #include #include #include #include "video_core/pica.h" #include "debug_utils.h" namespace Pica { namespace DebugUtils { void GeometryDumper::AddVertex(std::array pos, TriangleTopology topology) { vertices.push_back({pos[0], pos[1], pos[2]}); int num_vertices = vertices.size(); switch (topology) { case TriangleTopology::List: case TriangleTopology::ListIndexed: if (0 == (num_vertices % 3)) faces.push_back({ num_vertices-3, num_vertices-2, num_vertices-1 }); break; default: ERROR_LOG(GPU, "Unknown triangle topology %x", (int)topology); exit(0); break; } } void GeometryDumper::Dump() { // NOTE: Permanently enabling this just trashes hard disks for no reason. // Hence, this is currently disabled. return; static int index = 0; std::string filename = std::string("geometry_dump") + std::to_string(++index) + ".obj"; std::ofstream file(filename); for (const auto& vertex : vertices) { file << "v " << vertex.pos[0] << " " << vertex.pos[1] << " " << vertex.pos[2] << std::endl; } for (const Face& face : faces) { file << "f " << 1+face.index[0] << " " << 1+face.index[1] << " " << 1+face.index[2] << std::endl; } } #pragma pack(1) struct DVLBHeader { enum : u32 { MAGIC_WORD = 0x424C5644, // "DVLB" }; u32 magic_word; u32 num_programs; // u32 dvle_offset_table[]; }; static_assert(sizeof(DVLBHeader) == 0x8, "Incorrect structure size"); struct DVLPHeader { enum : u32 { MAGIC_WORD = 0x504C5644, // "DVLP" }; u32 magic_word; u32 version; u32 binary_offset; // relative to DVLP start u32 binary_size_words; u32 swizzle_patterns_offset; u32 swizzle_patterns_num_entries; u32 unk2; }; static_assert(sizeof(DVLPHeader) == 0x1C, "Incorrect structure size"); struct DVLEHeader { enum : u32 { MAGIC_WORD = 0x454c5644, // "DVLE" }; enum class ShaderType : u8 { VERTEX = 0, GEOMETRY = 1, }; u32 magic_word; u16 pad1; ShaderType type; u8 pad2; u32 main_offset_words; // offset within binary blob u32 endmain_offset_words; u32 pad3; u32 pad4; u32 constant_table_offset; u32 constant_table_size; // number of entries u32 label_table_offset; u32 label_table_size; u32 output_register_table_offset; u32 output_register_table_size; u32 uniform_table_offset; u32 uniform_table_size; u32 symbol_table_offset; u32 symbol_table_size; }; static_assert(sizeof(DVLEHeader) == 0x40, "Incorrect structure size"); #pragma pack() void DumpShader(const u32* binary_data, u32 binary_size, const u32* swizzle_data, u32 swizzle_size, u32 main_offset, const Regs::VSOutputAttributes* output_attributes) { // NOTE: Permanently enabling this just trashes hard disks for no reason. // Hence, this is currently disabled. return; struct StuffToWrite { u8* pointer; u32 size; }; std::vector writing_queue; u32 write_offset = 0; auto QueueForWriting = [&writing_queue,&write_offset](u8* pointer, u32 size) { writing_queue.push_back({pointer, size}); u32 old_write_offset = write_offset; write_offset += size; return old_write_offset; }; // First off, try to translate Pica state (one enum for output attribute type and component) // into shbin format (separate type and component mask). union OutputRegisterInfo { enum Type : u64 { POSITION = 0, COLOR = 2, TEXCOORD0 = 3, TEXCOORD1 = 5, TEXCOORD2 = 6, }; BitField< 0, 64, u64> hex; BitField< 0, 16, Type> type; BitField<16, 16, u64> id; BitField<32, 4, u64> component_mask; }; // This is put into a try-catch block to make sure we notice unknown configurations. std::vector output_info_table; for (int i = 0; i < 7; ++i) { using OutputAttributes = Pica::Regs::VSOutputAttributes; // TODO: It's still unclear how the attribute components map to the register! // Once we know that, this code probably will not make much sense anymore. std::map > map = { { OutputAttributes::POSITION_X, { OutputRegisterInfo::POSITION, 1} }, { OutputAttributes::POSITION_Y, { OutputRegisterInfo::POSITION, 2} }, { OutputAttributes::POSITION_Z, { OutputRegisterInfo::POSITION, 4} }, { OutputAttributes::POSITION_W, { OutputRegisterInfo::POSITION, 8} }, { OutputAttributes::COLOR_R, { OutputRegisterInfo::COLOR, 1} }, { OutputAttributes::COLOR_G, { OutputRegisterInfo::COLOR, 2} }, { OutputAttributes::COLOR_B, { OutputRegisterInfo::COLOR, 4} }, { OutputAttributes::COLOR_A, { OutputRegisterInfo::COLOR, 8} }, { OutputAttributes::TEXCOORD0_U, { OutputRegisterInfo::TEXCOORD0, 1} }, { OutputAttributes::TEXCOORD0_V, { OutputRegisterInfo::TEXCOORD0, 2} }, { OutputAttributes::TEXCOORD1_U, { OutputRegisterInfo::TEXCOORD1, 1} }, { OutputAttributes::TEXCOORD1_V, { OutputRegisterInfo::TEXCOORD1, 2} }, { OutputAttributes::TEXCOORD2_U, { OutputRegisterInfo::TEXCOORD2, 1} }, { OutputAttributes::TEXCOORD2_V, { OutputRegisterInfo::TEXCOORD2, 2} } }; for (const auto& semantic : std::vector{ output_attributes[i].map_x, output_attributes[i].map_y, output_attributes[i].map_z, output_attributes[i].map_w }) { if (semantic == OutputAttributes::INVALID) continue; try { OutputRegisterInfo::Type type = map.at(semantic).first; u32 component_mask = map.at(semantic).second; auto it = std::find_if(output_info_table.begin(), output_info_table.end(), [&i, &type](const OutputRegisterInfo& info) { return info.id == i && info.type == type; } ); if (it == output_info_table.end()) { output_info_table.push_back({}); output_info_table.back().type = type; output_info_table.back().component_mask = component_mask; output_info_table.back().id = i; } else { it->component_mask = it->component_mask | component_mask; } } catch (const std::out_of_range& oor) { _dbg_assert_msg_(GPU, 0, "Unknown output attribute mapping"); ERROR_LOG(GPU, "Unknown output attribute mapping: %03x, %03x, %03x, %03x", (int)output_attributes[i].map_x.Value(), (int)output_attributes[i].map_y.Value(), (int)output_attributes[i].map_z.Value(), (int)output_attributes[i].map_w.Value()); } } } struct { DVLBHeader header; u32 dvle_offset; } dvlb{ {DVLBHeader::MAGIC_WORD, 1 } }; // 1 DVLE DVLPHeader dvlp{ DVLPHeader::MAGIC_WORD }; DVLEHeader dvle{ DVLEHeader::MAGIC_WORD }; QueueForWriting((u8*)&dvlb, sizeof(dvlb)); u32 dvlp_offset = QueueForWriting((u8*)&dvlp, sizeof(dvlp)); dvlb.dvle_offset = QueueForWriting((u8*)&dvle, sizeof(dvle)); // TODO: Reduce the amount of binary code written to relevant portions dvlp.binary_offset = write_offset - dvlp_offset; dvlp.binary_size_words = binary_size; QueueForWriting((u8*)binary_data, binary_size * sizeof(u32)); dvlp.swizzle_patterns_offset = write_offset - dvlp_offset; dvlp.swizzle_patterns_num_entries = swizzle_size; u32 dummy = 0; for (int i = 0; i < swizzle_size; ++i) { QueueForWriting((u8*)&swizzle_data[i], sizeof(swizzle_data[i])); QueueForWriting((u8*)&dummy, sizeof(dummy)); } dvle.main_offset_words = main_offset; dvle.output_register_table_offset = write_offset - dvlb.dvle_offset; dvle.output_register_table_size = output_info_table.size(); QueueForWriting((u8*)output_info_table.data(), output_info_table.size() * sizeof(OutputRegisterInfo)); // TODO: Create a label table for "main" // Write data to file static int dump_index = 0; std::string filename = std::string("shader_dump") + std::to_string(++dump_index) + std::string(".shbin"); std::ofstream file(filename, std::ios_base::out | std::ios_base::binary); for (auto& chunk : writing_queue) { file.write((char*)chunk.pointer, chunk.size); } } static std::unique_ptr pica_trace; static std::mutex pica_trace_mutex; static int is_pica_tracing = false; void StartPicaTracing() { if (is_pica_tracing) { ERROR_LOG(GPU, "StartPicaTracing called even though tracing already running!"); return; } pica_trace_mutex.lock(); pica_trace = std::unique_ptr(new PicaTrace); is_pica_tracing = true; pica_trace_mutex.unlock(); } bool IsPicaTracing() { return is_pica_tracing; } void OnPicaRegWrite(u32 id, u32 value) { // Double check for is_pica_tracing to avoid pointless locking overhead if (!is_pica_tracing) return; std::unique_lock lock(pica_trace_mutex); if (!is_pica_tracing) return; pica_trace->writes.push_back({id, value}); } std::unique_ptr FinishPicaTracing() { if (!is_pica_tracing) { ERROR_LOG(GPU, "FinishPicaTracing called even though tracing already running!"); return {}; } // signalize that no further tracing should be performed is_pica_tracing = false; // Wait until running tracing is finished pica_trace_mutex.lock(); std::unique_ptr ret(std::move(pica_trace)); pica_trace_mutex.unlock(); return std::move(ret); } } // namespace } // namespace