summaryrefslogtreecommitdiffstats
path: root/src/video_core/macro/macro_hle.cpp
blob: da988cc0d5d332e18f883d7bc8e8ab53f19e31e4 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
// SPDX-FileCopyrightText: Copyright 2020 yuzu Emulator Project
// SPDX-License-Identifier: GPL-2.0-or-later

#include <array>
#include <vector>
#include "common/scope_exit.h"
#include "video_core/dirty_flags.h"
#include "video_core/engines/draw_manager.h"
#include "video_core/engines/maxwell_3d.h"
#include "video_core/macro/macro.h"
#include "video_core/macro/macro_hle.h"
#include "video_core/memory_manager.h"
#include "video_core/rasterizer_interface.h"

namespace Tegra {
namespace {

// Signature shared by every HLE handler in this file: a handler receives the 3D engine it acts on
// and the parameter words that HLEMacroImpl::Execute forwards to it.
using HLEFunction = void (*)(Engines::Maxwell3D& maxwell3d, const std::vector<u32>& parameters);

// HLE'd functions
// HLE handler registered in hle_funcs under key 0x771BB18C62444DA0.
//
// Issues a single DrawIndex call on the draw manager:
//   - the topology is the low 26 bits of parameters[0];
//   - the instance count is parameters[2] ANDed with the current value of register 0xD1B;
//   - parameters[4], [1], [3] and [5] are forwarded unchanged, in that order.
// NOTE(review): parameters is indexed up to [5] without a size check.
void HLE_771BB18C62444DA0(Engines::Maxwell3D& maxwell3d, const std::vector<u32>& parameters) {
    using PrimitiveTopology = Tegra::Engines::Maxwell3D::Regs::PrimitiveTopology;

    const auto reg_d1b = maxwell3d.GetRegisterValue(0xD1B);
    const u32 instance_count = parameters[2] & reg_d1b;
    const auto topology = static_cast<PrimitiveTopology>(parameters[0] & 0x3ffffff);

    // Argument order follows the DrawIndex declaration, which lives outside this file.
    maxwell3d.draw_manager->DrawIndex(topology, parameters[4], parameters[1], parameters[3],
                                      parameters[5], instance_count);
}

// HLE handler for the "draw arrays indirect" macro.
//
// Issues a single DrawArray call on the draw manager:
//   - the topology is parameters[0], used as-is;
//   - the instance count is parameters[2] ANDed with the current value of register 0xD1B;
//   - parameters[3], [1] and [4] are forwarded unchanged, in that order.
// NOTE(review): parameters is indexed up to [4] without a size check.
void HLE_DrawArraysIndirect(Engines::Maxwell3D& maxwell3d, const std::vector<u32>& parameters) {
    using PrimitiveTopology = Tegra::Engines::Maxwell3D::Regs::PrimitiveTopology;

    const auto reg_d1b = maxwell3d.GetRegisterValue(0xD1B);
    const u32 instance_count = reg_d1b & parameters[2];
    const auto topology = static_cast<PrimitiveTopology>(parameters[0]);

    // Argument order follows the DrawArray declaration, which lives outside this file.
    maxwell3d.draw_manager->DrawArray(topology, parameters[3], parameters[1], parameters[4],
                                      instance_count);
}

// HLE handler for the "draw indexed indirect" macro.
//
// Steps, in order:
//   1. Store parameters[4] in regs.vertex_id_base, flag the index buffer dirty, and send
//      parameters[4] / parameters[5] through methods 0x8e4 / 0x8e5 (preceded by 0x8e3 <- 0x640).
//   2. Fill the draw manager's indirect parameters for one indexed draw without a count buffer,
//      reading from macro_addresses[1].
//   3. Issue DrawIndexedIndirect with parameters[0] as topology.
//   4. Reset regs.vertex_id_base and resend the same method sequence with zeros.
// NOTE(review): parameters is indexed up to [5] without a size check.
void HLE_DrawIndexedIndirect(Engines::Maxwell3D& maxwell3d, const std::vector<u32>& parameters) {
    using PrimitiveTopology = Tegra::Engines::Maxwell3D::Regs::PrimitiveTopology;

    // The same three-method sequence is used to publish the base values and later to clear them.
    const auto send_bases = [&maxwell3d](u32 vertex_base, u32 instance_base) {
        maxwell3d.CallMethod(0x8e3, 0x640, true);
        maxwell3d.CallMethod(0x8e4, vertex_base, true);
        maxwell3d.CallMethod(0x8e5, instance_base, true);
    };

    const u32 vertex_base = parameters[4];
    const u32 instance_base = parameters[5];

    maxwell3d.regs.vertex_id_base = vertex_base;
    maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true;
    send_bases(vertex_base, instance_base);

    auto& indirect = maxwell3d.draw_manager->GetIndirectParams();
    indirect.is_indexed = true;
    indirect.include_count = false;
    indirect.count_start_address = 0;
    indirect.indirect_start_address = maxwell3d.macro_addresses[1];
    indirect.buffer_size = 5 * sizeof(u32);
    indirect.max_draw_counts = 1;
    indirect.stride = 0;

    maxwell3d.draw_manager->DrawIndexedIndirect(static_cast<PrimitiveTopology>(parameters[0]), 0,
                                                1U << 18);

    // Leave the engine with zeroed base values once the draw has been issued.
    maxwell3d.regs.vertex_id_base = 0x0;
    send_bases(0x0, 0x0);
}

// Multidraw Indexed Indirect
//
// Parameter layout as read by this function:
//   parameters[0] / parameters[1]  start / end of the indirect range; nothing is drawn unless
//                                  start < end, and the draw count is end - start
//   parameters[2]                  primitive topology
//   parameters[3]                  padding, in words, that follows each 5-word draw record
//   parameters[5 + i * (5 + padding)] onwards: draw record i, where word 0 is the index count
//                                  and word 2 the first index
//   parameters[8] / parameters[9]  base vertex / base instance (words 3 and 4 of record 0)
//
// The records are scanned to find the largest `first_index + count`; that value is handed to
// DrawIndexedIndirect as its last argument.
// NOTE(review): parameters is indexed without a size check, and `first_index + count` wraps on
// u32 overflow - confirm callers guarantee well-formed input.
void HLE_MultiDrawIndexedIndirect(Engines::Maxwell3D& maxwell3d,
                                  const std::vector<u32>& parameters) {
    const u32 start_indirect = parameters[0];
    const u32 end_indirect = parameters[1];
    if (start_indirect >= end_indirect) {
        // Nothing to do.
        return;
    }
    const auto topology =
        static_cast<Tegra::Engines::Maxwell3D::Regs::PrimitiveTopology>(parameters[2]);
    const u32 padding = parameters[3]; // padding is in words

    // size of each indirect segment
    const u32 indirect_words = 5 + padding;
    const u32 stride = indirect_words * sizeof(u32);
    const std::size_t draw_count = end_indirect - start_indirect;

    // Highest index (exclusive) touched by any of the draws.
    u32 highest_limit = 0;
    for (std::size_t index = 0; index < draw_count; index++) {
        const std::size_t base = index * indirect_words + 5;
        const u32 count = parameters[base];
        const u32 first_index = parameters[base + 2];
        highest_limit = std::max(highest_limit, first_index + count);
    }

    const u32 base_vertex = parameters[8];
    const u32 base_instance = parameters[9];
    maxwell3d.regs.vertex_id_base = base_vertex;
    maxwell3d.CallMethod(0x8e3, 0x640, true);
    maxwell3d.CallMethod(0x8e4, base_vertex, true);
    maxwell3d.CallMethod(0x8e5, base_instance, true);
    auto& params = maxwell3d.draw_manager->GetIndirectParams();
    params.is_indexed = true;
    params.include_count = true;
    params.count_start_address = maxwell3d.macro_addresses[4];
    params.indirect_start_address = maxwell3d.macro_addresses[5];
    params.buffer_size = stride * draw_count;
    params.max_draw_counts = draw_count;
    params.stride = stride;
    maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true;
    maxwell3d.draw_manager->DrawIndexedIndirect(topology, 0, highest_limit);
}

// Multi-layer Clear
//
// Expects exactly one parameter word, interpreted as a ClearSurface register value whose layer
// field must be zero. That value is written to regs.clear_surface, and Clear is invoked with the
// depth of the regs.rt entry selected by the value's RT field.
void HLE_MultiLayerClear(Engines::Maxwell3D& maxwell3d, const std::vector<u32>& parameters) {
    using ClearSurface = Engines::Maxwell3D::Regs::ClearSurface;

    ASSERT(parameters.size() == 1);
    const ClearSurface clear_params{parameters[0]};

    // The number of layers to clear is taken from the selected regs.rt entry.
    const u32 target = clear_params.RT;
    const u32 layer_total = maxwell3d.regs.rt[target].depth;
    ASSERT(clear_params.layer == 0);

    maxwell3d.regs.clear_surface.raw = clear_params.raw;
    maxwell3d.draw_manager->Clear(layer_total);
}

// Table of available HLE handlers, keyed by a 64-bit hash.
// HLEMacro::GetHLEProgram searches it for an entry whose key equals the requested hash.
constexpr std::array<std::pair<u64, HLEFunction>, 5> hle_funcs{{
    std::pair<u64, HLEFunction>{0x771BB18C62444DA0ULL, &HLE_771BB18C62444DA0},
    std::pair<u64, HLEFunction>{0x0D61FC9FAAC9FCADULL, &HLE_DrawArraysIndirect},
    std::pair<u64, HLEFunction>{0x0217920100488FF7ULL, &HLE_DrawIndexedIndirect},
    std::pair<u64, HLEFunction>{0x3F5E74B9C9A50164ULL, &HLE_MultiDrawIndexedIndirect},
    std::pair<u64, HLEFunction>{0xEAD26C3E2109B06BULL, &HLE_MultiLayerClear},
}};

// CachedMacro implementation that forwards execution to a plain HLE function.
class HLEMacroImpl final : public CachedMacro {
public:
    // maxwell3d_: engine handed to the HLE function on every Execute call.
    // func_: HLE function to run.
    explicit HLEMacroImpl(Engines::Maxwell3D& maxwell3d_, HLEFunction func_)
        : maxwell3d{maxwell3d_}, func{func_} {}

    // Calls the wrapped HLE function with the stored engine and the given parameters.
    // `method` is part of the CachedMacro interface but is not needed by the HLE functions.
    void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override {
        func(maxwell3d, parameters);
    }

private:
    Engines::Maxwell3D& maxwell3d; // Engine passed to func; not owned.
    HLEFunction func;              // HLE function invoked by Execute.
};

} // Anonymous namespace

// Initializes the maxwell3d member from the engine that HLE programs created by this object
// will operate on.
HLEMacro::HLEMacro(Engines::Maxwell3D& maxwell3d_) : maxwell3d{maxwell3d_} {}
// Defaulted destructor, defined out of line in this translation unit.
HLEMacro::~HLEMacro() = default;

// Looks up `hash` in hle_funcs.
// Returns a newly created HLEMacroImpl wrapping the first handler whose key equals `hash`, or
// nullptr when the table has no such entry.
std::unique_ptr<CachedMacro> HLEMacro::GetHLEProgram(u64 hash) const {
    for (const auto& entry : hle_funcs) {
        if (entry.first == hash) {
            return std::make_unique<HLEMacroImpl>(maxwell3d, entry.second);
        }
    }
    return nullptr;
}

} // namespace Tegra