diff options
| author | bunnei <bunneidev@gmail.com> | 2021-01-07 12:42:28 -0800 | 
|---|---|---|
| committer | GitHub <noreply@github.com> | 2021-01-07 12:42:28 -0800 | 
| commit | aaf9e39f5624abee7457e8d81048516beaf43c4f (patch) | |
| tree | 7039db82d3a5b08b2f7d437bb572f818645a8e7d /src/video_core | |
| parent | bcb702fa3e9d3f11748082f2ae9a5c1986b1ad8a (diff) | |
| parent | 16392a23cc864ef0fa8a768584fbcc64fec40f2a (diff) | |
Merge pull request #5237 from ameerj/nvdec-syncpt
nvdec: Incorporate syncpoint manager
Diffstat (limited to 'src/video_core')
| -rw-r--r-- | src/video_core/cdma_pusher.cpp | 15 | ||||
| -rw-r--r-- | src/video_core/cdma_pusher.h | 10 | ||||
| -rw-r--r-- | src/video_core/command_classes/host1x.cpp | 19 | ||||
| -rw-r--r-- | src/video_core/command_classes/host1x.h | 49 | 
4 files changed, 20 insertions, 73 deletions
| diff --git a/src/video_core/cdma_pusher.cpp b/src/video_core/cdma_pusher.cpp index e3e7432f7..94679d5d1 100644 --- a/src/video_core/cdma_pusher.cpp +++ b/src/video_core/cdma_pusher.cpp @@ -33,8 +33,7 @@ CDmaPusher::CDmaPusher(GPU& gpu_)      : gpu{gpu_}, nvdec_processor(std::make_shared<Nvdec>(gpu)),        vic_processor(std::make_unique<Vic>(gpu, nvdec_processor)),        host1x_processor(std::make_unique<Host1x>(gpu)), -      nvdec_sync(std::make_unique<SyncptIncrManager>(gpu)), -      vic_sync(std::make_unique<SyncptIncrManager>(gpu)) {} +      sync_manager(std::make_unique<SyncptIncrManager>(gpu)) {}  CDmaPusher::~CDmaPusher() = default; @@ -110,10 +109,10 @@ void CDmaPusher::ExecuteCommand(u32 state_offset, u32 data) {              const auto syncpoint_id = static_cast<u32>(data & 0xFF);              const auto cond = static_cast<u32>((data >> 8) & 0xFF);              if (cond == 0) { -                nvdec_sync->Increment(syncpoint_id); +                sync_manager->Increment(syncpoint_id);              } else { -                nvdec_sync->IncrementWhenDone(static_cast<u32>(current_class), syncpoint_id); -                nvdec_sync->SignalDone(syncpoint_id); +                sync_manager->SignalDone( +                    sync_manager->IncrementWhenDone(static_cast<u32>(current_class), syncpoint_id));              }              break;          } @@ -135,10 +134,10 @@ void CDmaPusher::ExecuteCommand(u32 state_offset, u32 data) {              const auto syncpoint_id = static_cast<u32>(data & 0xFF);              const auto cond = static_cast<u32>((data >> 8) & 0xFF);              if (cond == 0) { -                vic_sync->Increment(syncpoint_id); +                sync_manager->Increment(syncpoint_id);              } else { -                vic_sync->IncrementWhenDone(static_cast<u32>(current_class), syncpoint_id); -                vic_sync->SignalDone(syncpoint_id); +                sync_manager->SignalDone( +                    sync_manager->IncrementWhenDone(static_cast<u32>(current_class), syncpoint_id));              }              break;          } diff --git a/src/video_core/cdma_pusher.h b/src/video_core/cdma_pusher.h index 0db1cd646..8ca70b6dd 100644 --- a/src/video_core/cdma_pusher.h +++ b/src/video_core/cdma_pusher.h @@ -116,12 +116,10 @@ private:      void ThiStateWrite(ThiRegisters& state, u32 state_offset, const std::vector<u32>& arguments);      GPU& gpu; - -    std::shared_ptr<Nvdec> nvdec_processor; -    std::unique_ptr<Vic> vic_processor; -    std::unique_ptr<Host1x> host1x_processor; -    std::unique_ptr<SyncptIncrManager> nvdec_sync; -    std::unique_ptr<SyncptIncrManager> vic_sync; +    std::shared_ptr<Tegra::Nvdec> nvdec_processor; +    std::unique_ptr<Tegra::Vic> vic_processor; +    std::unique_ptr<Tegra::Host1x> host1x_processor; +    std::unique_ptr<SyncptIncrManager> sync_manager;      ChClassId current_class{};      ThiRegisters vic_thi_state{};      ThiRegisters nvdec_thi_state{}; diff --git a/src/video_core/command_classes/host1x.cpp b/src/video_core/command_classes/host1x.cpp index c4dd4881a..b12494528 100644 --- a/src/video_core/command_classes/host1x.cpp +++ b/src/video_core/command_classes/host1x.cpp @@ -10,22 +10,14 @@ Tegra::Host1x::Host1x(GPU& gpu_) : gpu(gpu_) {}  Tegra::Host1x::~Host1x() = default; -void Tegra::Host1x::StateWrite(u32 offset, u32 arguments) { -    u8* const state_offset = reinterpret_cast<u8*>(&state) + offset * sizeof(u32); -    std::memcpy(state_offset, &arguments, sizeof(u32)); -} - -void Tegra::Host1x::ProcessMethod(Method method, const std::vector<u32>& arguments) { -    StateWrite(static_cast<u32>(method), arguments[0]); +void Tegra::Host1x::ProcessMethod(Method method, u32 argument) {      switch (method) { -    case Method::WaitSyncpt: -        Execute(arguments[0]); -        break;      case Method::LoadSyncptPayload32: -        syncpoint_value = arguments[0]; +        syncpoint_value = argument;          break; +    case Method::WaitSyncpt:      case Method::WaitSyncpt32: -        Execute(arguments[0]); +        Execute(argument);          break;      default:          UNIMPLEMENTED_MSG("Host1x method 0x{:X}", static_cast<u32>(method)); @@ -34,6 +26,5 @@ void Tegra::Host1x::ProcessMethod(Method method, const std::vector<u32>& argumen  }  void Tegra::Host1x::Execute(u32 data) { -    // This method waits on a valid syncpoint. -    // TODO: Implement when proper Async is in place +    gpu.WaitFence(data, syncpoint_value);  } diff --git a/src/video_core/command_classes/host1x.h b/src/video_core/command_classes/host1x.h index 013eaa0c1..7e94799dd 100644 --- a/src/video_core/command_classes/host1x.h +++ b/src/video_core/command_classes/host1x.h @@ -14,64 +14,23 @@ class Nvdec;  class Host1x {  public: -    struct Host1xClassRegisters { -        u32 incr_syncpt{}; -        u32 incr_syncpt_ctrl{}; -        u32 incr_syncpt_error{}; -        INSERT_PADDING_WORDS(5); -        u32 wait_syncpt{}; -        u32 wait_syncpt_base{}; -        u32 wait_syncpt_incr{}; -        u32 load_syncpt_base{}; -        u32 incr_syncpt_base{}; -        u32 clear{}; -        u32 wait{}; -        u32 wait_with_interrupt{}; -        u32 delay_use{}; -        u32 tick_count_high{}; -        u32 tick_count_low{}; -        u32 tick_ctrl{}; -        INSERT_PADDING_WORDS(23); -        u32 ind_ctrl{}; -        u32 ind_off2{}; -        u32 ind_off{}; -        std::array<u32, 31> ind_data{}; -        INSERT_PADDING_WORDS(1); -        u32 load_syncpoint_payload32{}; -        u32 stall_ctrl{}; -        u32 wait_syncpt32{}; -        u32 wait_syncpt_base32{}; -        u32 load_syncpt_base32{}; -        u32 incr_syncpt_base32{}; -        u32 stall_count_high{}; -        u32 stall_count_low{}; -        u32 xref_ctrl{}; -        u32 channel_xref_high{}; -        u32 channel_xref_low{}; -    }; -    static_assert(sizeof(Host1xClassRegisters) == 0x164, "Host1xClassRegisters is an invalid size"); -      enum class Method : u32 { -        WaitSyncpt = offsetof(Host1xClassRegisters, wait_syncpt) / 4, -        LoadSyncptPayload32 = offsetof(Host1xClassRegisters, load_syncpoint_payload32) / 4, -        WaitSyncpt32 = offsetof(Host1xClassRegisters, wait_syncpt32) / 4, +        WaitSyncpt = 0x8, +        LoadSyncptPayload32 = 0x4e, +        WaitSyncpt32 = 0x50,      };      explicit Host1x(GPU& gpu);      ~Host1x();      /// Writes the method into the state, Invoke Execute() if encountered -    void ProcessMethod(Method method, const std::vector<u32>& arguments); +    void ProcessMethod(Method method, u32 argument);  private:      /// For Host1x, execute is waiting on a syncpoint previously written into the state      void Execute(u32 data); -    /// Write argument into the provided offset -    void StateWrite(u32 offset, u32 arguments); -      u32 syncpoint_value{}; -    Host1xClassRegisters state{};      GPU& gpu;  }; | 
