// Copyright 2014 Citra Emulator Project // Licensed under GPLv2 or any later version // Refer to the license.txt file included. #include #include #include #include #include #include #include #include #include #include #include #include #include "citra_qt/debugger/graphics/graphics_vertex_shader.h" #include "citra_qt/util/util.h" #include "core/core.h" #include "video_core/gpu.h" #include "video_core/pica/pica_core.h" #include "video_core/shader/shader_interpreter.h" using nihstro::Instruction; using nihstro::OpCode; using nihstro::SourceRegister; using nihstro::SwizzlePattern; GraphicsVertexShaderModel::GraphicsVertexShaderModel(GraphicsVertexShaderWidget* parent) : QAbstractTableModel(parent), par(parent) {} int GraphicsVertexShaderModel::columnCount([[maybe_unused]] const QModelIndex& parent) const { return 3; } int GraphicsVertexShaderModel::rowCount([[maybe_unused]] const QModelIndex& parent) const { return static_cast(par->info.code.size()); } QVariant GraphicsVertexShaderModel::headerData(int section, [[maybe_unused]] Qt::Orientation orientation, int role) const { switch (role) { case Qt::DisplayRole: { if (section == 0) { return tr("Offset"); } else if (section == 1) { return tr("Raw"); } else if (section == 2) { return tr("Disassembly"); } break; } } return QVariant(); } static std::string SelectorToString(u32 selector) { std::string ret; for (int i = 0; i < 4; ++i) { int component = (selector >> ((3 - i) * 2)) & 3; ret += "xyzw"[component]; } return ret; } // e.g. "-c92[a0.x].xyzw" static void print_input(std::ostringstream& output, const SourceRegister& input, bool negate, const std::string& swizzle_mask, bool align = true, const std::string& address_register_name = std::string()) { if (align) output << std::setw(4) << std::right; output << ((negate ? "-" : "") + input.GetName()); if (!address_register_name.empty()) output << '[' << address_register_name << ']'; output << '.' << swizzle_mask; }; QVariant GraphicsVertexShaderModel::data(const QModelIndex& index, int role) const { switch (role) { case Qt::DisplayRole: { switch (index.column()) { case 0: if (par->info.HasLabel(index.row())) return QString::fromStdString(par->info.GetLabel(index.row())); return QStringLiteral("%1").arg(4 * index.row(), 4, 16, QLatin1Char('0')); case 1: return QStringLiteral("%1").arg(par->info.code[index.row()].hex, 8, 16, QLatin1Char('0')); case 2: { std::ostringstream output; output.flags(std::ios::uppercase); // To make the code aligning columns of assembly easier to keep track of, this function // keeps track of the start of the start of the previous column, allowing alignment // based on desired field widths. int current_column = 0; auto AlignToColumn = [&](int col_width) { // Prints spaces to the output to pad previous column to size and advances the // column marker. current_column += col_width; int to_add = std::max(1, current_column - (int)output.tellp()); for (int i = 0; i < to_add; ++i) { output << ' '; } }; const Instruction& instr = par->info.code[index.row()]; const OpCode opcode = instr.opcode; const OpCode::Info opcode_info = opcode.GetInfo(); const u32 operand_desc_id = opcode_info.type == OpCode::Type::MultiplyAdd ? instr.mad.operand_desc_id.Value() : instr.common.operand_desc_id.Value(); const SwizzlePattern& swizzle = par->info.swizzle_info[operand_desc_id].pattern; // longest known instruction name: "setemit " int kOpcodeColumnWidth = 8; // "rXX.xyzw " int kOutputColumnWidth = 10; // "-rXX.xyzw ", no attempt is made to align indexed inputs int kInputOperandColumnWidth = 11; output << opcode_info.name; switch (opcode_info.type) { case OpCode::Type::Trivial: // Nothing to do here break; case OpCode::Type::Arithmetic: case OpCode::Type::MultiplyAdd: { // Use custom code for special instructions switch (opcode.EffectiveOpCode()) { case OpCode::Id::CMP: { AlignToColumn(kOpcodeColumnWidth); // NOTE: CMP always writes both cc components, so we do not consider the dest // mask here. output << " cc.xy"; AlignToColumn(kOutputColumnWidth); SourceRegister src1 = instr.common.GetSrc1(false); SourceRegister src2 = instr.common.GetSrc2(false); output << ' '; print_input(output, src1, swizzle.negate_src1, swizzle.SelectorToString(false).substr(0, 1), false, instr.common.AddressRegisterName()); output << ' ' << instr.common.compare_op.ToString(instr.common.compare_op.x) << ' '; print_input(output, src2, swizzle.negate_src2, swizzle.SelectorToString(true).substr(0, 1), false); output << ", "; print_input(output, src1, swizzle.negate_src1, swizzle.SelectorToString(false).substr(1, 1), false, instr.common.AddressRegisterName()); output << ' ' << instr.common.compare_op.ToString(instr.common.compare_op.y) << ' '; print_input(output, src2, swizzle.negate_src2, swizzle.SelectorToString(true).substr(1, 1), false); break; } case OpCode::Id::MAD: case OpCode::Id::MADI: { AlignToColumn(kOpcodeColumnWidth); bool src_is_inverted = 0 != (opcode_info.subtype & OpCode::Info::SrcInversed); SourceRegister src1 = instr.mad.GetSrc1(src_is_inverted); SourceRegister src2 = instr.mad.GetSrc2(src_is_inverted); SourceRegister src3 = instr.mad.GetSrc3(src_is_inverted); output << std::setw(3) << std::right << instr.mad.dest.Value().GetName() << '.' << swizzle.DestMaskToString(); AlignToColumn(kOutputColumnWidth); print_input(output, src1, swizzle.negate_src1, SelectorToString(swizzle.src1_selector)); AlignToColumn(kInputOperandColumnWidth); print_input(output, src2, swizzle.negate_src2, SelectorToString(swizzle.src2_selector), true, src_is_inverted ? "" : instr.mad.AddressRegisterName()); AlignToColumn(kInputOperandColumnWidth); print_input(output, src3, swizzle.negate_src3, SelectorToString(swizzle.src3_selector), true, src_is_inverted ? instr.mad.AddressRegisterName() : ""); AlignToColumn(kInputOperandColumnWidth); break; } default: { AlignToColumn(kOpcodeColumnWidth); bool src_is_inverted = 0 != (opcode_info.subtype & OpCode::Info::SrcInversed); if (opcode_info.subtype & OpCode::Info::Dest) { // e.g. "r12.xy__" output << std::setw(3) << std::right << instr.common.dest.Value().GetName() << '.' << swizzle.DestMaskToString(); } else if (opcode_info.subtype == OpCode::Info::MOVA) { output << " a0." << swizzle.DestMaskToString(); } AlignToColumn(kOutputColumnWidth); if (opcode_info.subtype & OpCode::Info::Src1) { SourceRegister src1 = instr.common.GetSrc1(src_is_inverted); print_input(output, src1, swizzle.negate_src1, swizzle.SelectorToString(false), true, src_is_inverted ? "" : instr.common.AddressRegisterName()); AlignToColumn(kInputOperandColumnWidth); } if (opcode_info.subtype & OpCode::Info::Src2) { SourceRegister src2 = instr.common.GetSrc2(src_is_inverted); print_input(output, src2, swizzle.negate_src2, swizzle.SelectorToString(true), true, src_is_inverted ? instr.common.AddressRegisterName() : ""); AlignToColumn(kInputOperandColumnWidth); } break; } } break; } case OpCode::Type::Conditional: case OpCode::Type::UniformFlowControl: { output << ' '; switch (opcode.EffectiveOpCode()) { case OpCode::Id::LOOP: output << 'i' << instr.flow_control.int_uniform_id << " (end on 0x" << std::setw(4) << std::right << std::setfill('0') << std::hex << (4 * instr.flow_control.dest_offset) << ")"; break; default: if (opcode_info.subtype & OpCode::Info::HasCondition) { output << '('; if (instr.flow_control.op != instr.flow_control.JustY) { if (!instr.flow_control.refx) output << '!'; output << "cc.x"; } if (instr.flow_control.op == instr.flow_control.Or) { output << " || "; } else if (instr.flow_control.op == instr.flow_control.And) { output << " && "; } if (instr.flow_control.op != instr.flow_control.JustX) { if (!instr.flow_control.refy) output << '!'; output << "cc.y"; } output << ") "; } else if (opcode_info.subtype & OpCode::Info::HasUniformIndex) { if (opcode.EffectiveOpCode() == OpCode::Id::JMPU && (instr.flow_control.num_instructions & 1) == 1) { output << '!'; } output << 'b' << instr.flow_control.bool_uniform_id << ' '; } if (opcode_info.subtype & OpCode::Info::HasAlternative) { output << "else jump to 0x" << std::setw(4) << std::right << std::setfill('0') << std::hex << (4 * instr.flow_control.dest_offset); } else if (opcode_info.subtype & OpCode::Info::HasExplicitDest) { output << "jump to 0x" << std::setw(4) << std::right << std::setfill('0') << std::hex << (4 * instr.flow_control.dest_offset); } else { // TODO: Handle other cases output << "(unknown destination)"; } if (opcode_info.subtype & OpCode::Info::HasFinishPoint) { output << " (return on 0x" << std::setw(4) << std::right << std::setfill('0') << std::hex << (4 * instr.flow_control.dest_offset + 4 * instr.flow_control.num_instructions) << ')'; } break; } break; } default: output << " (unknown instruction format)"; break; } return QString::fromLatin1(output.str().c_str()); } default: break; } } case Qt::FontRole: return GetMonospaceFont(); case Qt::BackgroundRole: { // Highlight current instruction int current_record_index = par->cycle_index->value(); if (current_record_index < static_cast(par->debug_data.records.size())) { const auto& current_record = par->debug_data.records[current_record_index]; if (index.row() == static_cast(current_record.instruction_offset)) { return QColor(255, 255, 63); } } // Use a grey background for instructions which have no debug data associated to them for (const auto& record : par->debug_data.records) if (index.row() == static_cast(record.instruction_offset)) return QVariant(); return QBrush(QColor(192, 192, 192)); } // TODO: Draw arrows for each "reachable" instruction to visualize control flow default: break; } return QVariant(); } void GraphicsVertexShaderWidget::DumpShader() { QString filename = QFileDialog::getSaveFileName(this, tr("Save Shader Dump"), QStringLiteral("shader_dump.shbin"), tr("Shader Binary (*.shbin)")); if (filename.isEmpty()) { // If the user canceled the dialog, don't dump anything. return; } auto& pica = system.GPU().PicaCore(); Pica::DebugUtils::DumpShader(filename.toStdString(), pica.regs.internal.vs, pica.vs_setup, pica.regs.internal.rasterizer.vs_output_attributes); } GraphicsVertexShaderWidget::GraphicsVertexShaderWidget( Core::System& system_, std::shared_ptr debug_context, QWidget* parent) : BreakPointObserverDock(debug_context, tr("Pica Vertex Shader"), parent), system{system_} { setObjectName(QStringLiteral("PicaVertexShader")); // Clear input vertex data so that it contains valid float values in case a debug shader // execution happens before the first Vertex Loaded breakpoint. // TODO: This makes a crash in the interpreter much less likely, but not impossible. The // interpreter should guard against out-of-bounds accesses to ensure crashes in it aren't // possible. std::memset(&input_vertex, 0, sizeof(input_vertex)); auto input_data_mapper = new QSignalMapper(this); // TODO: Support inputting data in hexadecimal raw format for (std::size_t i = 0; i < input_data.size(); ++i) { input_data[i] = new QLineEdit; input_data[i]->setValidator(new QDoubleValidator(input_data[i])); } breakpoint_warning = new QLabel(tr("(data only available at vertex shader invocation breakpoints)")); // TODO: Add some button for jumping to the shader entry point model = new GraphicsVertexShaderModel(this); binary_list = new QTreeView; binary_list->setModel(model); binary_list->setRootIsDecorated(false); binary_list->setAlternatingRowColors(true); auto dump_shader = new QPushButton(QIcon::fromTheme(QStringLiteral("document-save")), tr("Dump")); instruction_description = new QLabel; cycle_index = new QSpinBox; connect(dump_shader, &QPushButton::clicked, this, &GraphicsVertexShaderWidget::DumpShader); connect(cycle_index, static_cast(&QSpinBox::valueChanged), this, &GraphicsVertexShaderWidget::OnCycleIndexChanged); for (u32 i = 0; i < input_data.size(); ++i) { connect(input_data[i], &QLineEdit::textEdited, input_data_mapper, static_cast(&QSignalMapper::map)); input_data_mapper->setMapping(input_data[i], i); } connect(input_data_mapper, &QSignalMapper::mappedInt, this, &GraphicsVertexShaderWidget::OnInputAttributeChanged); auto main_widget = new QWidget; auto main_layout = new QVBoxLayout; { auto input_data_group = new QGroupBox(tr("Input Data")); // For each vertex attribute, add a QHBoxLayout consisting of: // - A QLabel denoting the source attribute index // - Four QLineEdits for showing and manipulating attribute data // - A QLabel denoting the shader input attribute index auto sub_layout = new QVBoxLayout; for (unsigned i = 0; i < 16; ++i) { // Create an HBoxLayout to store the widgets used to specify a particular attribute // and store it in a QWidget to allow for easy hiding and unhiding. auto row_layout = new QHBoxLayout; // Remove unnecessary padding between rows row_layout->setContentsMargins(0, 0, 0, 0); row_layout->addWidget(new QLabel(tr("Attribute %1").arg(i, 2))); for (unsigned comp = 0; comp < 4; ++comp) row_layout->addWidget(input_data[4 * i + comp]); row_layout->addWidget(input_data_mapping[i] = new QLabel); input_data_container[i] = new QWidget; input_data_container[i]->setLayout(row_layout); input_data_container[i]->hide(); sub_layout->addWidget(input_data_container[i]); } sub_layout->addWidget(breakpoint_warning); breakpoint_warning->hide(); input_data_group->setLayout(sub_layout); main_layout->addWidget(input_data_group); } // Make program listing expand to fill available space in the dialog binary_list->setSizePolicy(QSizePolicy::Preferred, QSizePolicy::MinimumExpanding); main_layout->addWidget(binary_list); main_layout->addWidget(dump_shader); { auto sub_layout = new QFormLayout; sub_layout->addRow(tr("Cycle Index:"), cycle_index); main_layout->addLayout(sub_layout); } // Set a minimum height so that the size of this label doesn't cause the rest of the bottom // part of the UI to keep jumping up and down when cycling through instructions. instruction_description->setMinimumHeight(instruction_description->fontMetrics().lineSpacing() * 6); instruction_description->setAlignment(Qt::AlignLeft | Qt::AlignTop); main_layout->addWidget(instruction_description); main_widget->setLayout(main_layout); setWidget(main_widget); widget()->setEnabled(false); } void GraphicsVertexShaderWidget::OnBreakPointHit(Pica::DebugContext::Event event, const void* data) { if (event == Pica::DebugContext::Event::VertexShaderInvocation) { Reload(true, data); } else { // No vertex data is retrievable => invalidate currently stored vertex data Reload(true, nullptr); } widget()->setEnabled(true); } void GraphicsVertexShaderWidget::Reload(bool replace_vertex_data, const void* vertex_data) { model->beginResetModel(); if (replace_vertex_data) { if (vertex_data) { std::memcpy(&input_vertex, vertex_data, sizeof(input_vertex)); for (unsigned attr = 0; attr < 16; ++attr) { for (unsigned comp = 0; comp < 4; ++comp) { input_data[4 * attr + comp]->setText( QStringLiteral("%1").arg(input_vertex[attr][comp].ToFloat32())); } } breakpoint_warning->hide(); } else { for (unsigned attr = 0; attr < 16; ++attr) { for (unsigned comp = 0; comp < 4; ++comp) { input_data[4 * attr + comp]->setText(QStringLiteral("???")); } } breakpoint_warning->show(); } } // Reload shader code info.Clear(); auto& pica = system.GPU().PicaCore(); for (auto instr : pica.vs_setup.program_code) info.code.push_back({instr}); int num_attributes = pica.regs.internal.vs.max_input_attribute_index + 1; for (auto pattern : pica.vs_setup.swizzle_data) { const nihstro::SwizzleInfo swizzle_info = {.pattern = nihstro::SwizzlePattern{pattern}}; info.swizzle_info.push_back(swizzle_info); } u32 entry_point = pica.regs.internal.vs.main_offset; info.labels.insert({entry_point, "main"}); // Generate debug information Pica::Shader::InterpreterEngine shader_engine; shader_engine.SetupBatch(pica.vs_setup, entry_point); debug_data = shader_engine.ProduceDebugInfo(pica.vs_setup, input_vertex, pica.regs.internal.vs); // Reload widget state for (int attr = 0; attr < num_attributes; ++attr) { unsigned source_attr = pica.regs.internal.vs.GetRegisterForAttribute(attr); input_data_mapping[attr]->setText(QStringLiteral("-> v%1").arg(source_attr)); input_data_container[attr]->setVisible(true); } // Only show input attributes which are used as input to the shader for (unsigned int attr = num_attributes; attr < 16; ++attr) { input_data_container[attr]->setVisible(false); } // Initialize debug info text for current cycle count cycle_index->setMaximum(static_cast(debug_data.records.size() - 1)); OnCycleIndexChanged(cycle_index->value()); model->endResetModel(); } void GraphicsVertexShaderWidget::OnResumed() { widget()->setEnabled(false); } void GraphicsVertexShaderWidget::OnInputAttributeChanged(int index) { const f32 value = input_data[index]->text().toFloat(); input_vertex[index / 4][index % 4] = Pica::f24::FromFloat32(value); // Re-execute shader with updated value Reload(); } void GraphicsVertexShaderWidget::OnCycleIndexChanged(int index) { QString text; const QString true_string = QStringLiteral("true"); const QString false_string = QStringLiteral("false"); auto& record = debug_data.records[index]; if (record.mask & Pica::Shader::DebugDataRecord::SRC1) text += tr("SRC1: %1, %2, %3, %4\n") .arg(record.src1.x.ToFloat32()) .arg(record.src1.y.ToFloat32()) .arg(record.src1.z.ToFloat32()) .arg(record.src1.w.ToFloat32()); if (record.mask & Pica::Shader::DebugDataRecord::SRC2) text += tr("SRC2: %1, %2, %3, %4\n") .arg(record.src2.x.ToFloat32()) .arg(record.src2.y.ToFloat32()) .arg(record.src2.z.ToFloat32()) .arg(record.src2.w.ToFloat32()); if (record.mask & Pica::Shader::DebugDataRecord::SRC3) text += tr("SRC3: %1, %2, %3, %4\n") .arg(record.src3.x.ToFloat32()) .arg(record.src3.y.ToFloat32()) .arg(record.src3.z.ToFloat32()) .arg(record.src3.w.ToFloat32()); if (record.mask & Pica::Shader::DebugDataRecord::DEST_IN) text += tr("DEST_IN: %1, %2, %3, %4\n") .arg(record.dest_in.x.ToFloat32()) .arg(record.dest_in.y.ToFloat32()) .arg(record.dest_in.z.ToFloat32()) .arg(record.dest_in.w.ToFloat32()); if (record.mask & Pica::Shader::DebugDataRecord::DEST_OUT) text += tr("DEST_OUT: %1, %2, %3, %4\n") .arg(record.dest_out.x.ToFloat32()) .arg(record.dest_out.y.ToFloat32()) .arg(record.dest_out.z.ToFloat32()) .arg(record.dest_out.w.ToFloat32()); if (record.mask & Pica::Shader::DebugDataRecord::ADDR_REG_OUT) text += tr("Address Registers: %1, %2\n") .arg(record.address_registers[0]) .arg(record.address_registers[1]); if (record.mask & Pica::Shader::DebugDataRecord::CMP_RESULT) text += tr("Compare Result: %1, %2\n") .arg(record.conditional_code[0] ? true_string : false_string) .arg(record.conditional_code[1] ? true_string : false_string); if (record.mask & Pica::Shader::DebugDataRecord::COND_BOOL_IN) text += tr("Static Condition: %1\n").arg(record.cond_bool ? true_string : false_string); if (record.mask & Pica::Shader::DebugDataRecord::COND_CMP_IN) text += tr("Dynamic Conditions: %1, %2\n") .arg(record.cond_cmp[0] ? true_string : false_string) .arg(record.cond_cmp[1] ? true_string : false_string); if (record.mask & Pica::Shader::DebugDataRecord::LOOP_INT_IN) text += tr("Loop Parameters: %1 (repeats), %2 (initializer), %3 (increment), %4\n") .arg(record.loop_int.x) .arg(record.loop_int.y) .arg(record.loop_int.z) .arg(record.loop_int.w); text += tr("Instruction offset: 0x%1").arg(4 * record.instruction_offset, 4, 16, QLatin1Char('0')); if (record.mask & Pica::Shader::DebugDataRecord::NEXT_INSTR) { text += tr(" -> 0x%2").arg(4 * record.next_instruction, 4, 16, QLatin1Char('0')); } else { text += tr(" (last instruction)"); } instruction_description->setText(text); // Emit model update notification and scroll to current instruction QModelIndex instr_index = model->index(record.instruction_offset, 0); emit model->dataChanged(instr_index, model->index(record.instruction_offset, model->columnCount())); binary_list->scrollTo(instr_index, QAbstractItemView::EnsureVisible); }