diff options
| author | bunnei <bunneidev@gmail.com> | 2019-04-07 17:44:59 -0400 | 
|---|---|---|
| committer | GitHub <noreply@github.com> | 2019-04-07 17:44:59 -0400 | 
| commit | 80162888e6cf30722f71fbdc94b818ae8eae27ee (patch) | |
| tree | a5c498512d256c6f8bc7a63e709fdb8a8010cdc6 | |
| parent | 864280fabcb4b9d97a5a171d0100694d9f2d4ec4 (diff) | |
| parent | 20be92d5e623a348560dd9f764a9208a99cbc758 (diff) | |
Merge pull request #2352 from bunnei/mem-manager-fixes
memory_manager: Improved implementation of read/write/copy block.
| -rw-r--r-- | src/video_core/gpu.cpp | 2 | ||||
| -rw-r--r-- | src/video_core/memory_manager.cpp | 87 | ||||
| -rw-r--r-- | src/video_core/memory_manager.h | 7 | 
3 files changed, 84 insertions, 12 deletions
| diff --git a/src/video_core/gpu.cpp b/src/video_core/gpu.cpp index 30b29e14d..4461083ff 100644 --- a/src/video_core/gpu.cpp +++ b/src/video_core/gpu.cpp @@ -31,7 +31,7 @@ u32 FramebufferConfig::BytesPerPixel(PixelFormat format) {  GPU::GPU(Core::System& system, VideoCore::RendererBase& renderer) : renderer{renderer} {      auto& rasterizer{renderer.Rasterizer()}; -    memory_manager = std::make_unique<Tegra::MemoryManager>(); +    memory_manager = std::make_unique<Tegra::MemoryManager>(rasterizer);      dma_pusher = std::make_unique<Tegra::DmaPusher>(*this);      maxwell_3d = std::make_unique<Engines::Maxwell3D>(system, rasterizer, *memory_manager);      fermi_2d = std::make_unique<Engines::Fermi2D>(rasterizer, *memory_manager); diff --git a/src/video_core/memory_manager.cpp b/src/video_core/memory_manager.cpp index 8417324ff..0f4e820aa 100644 --- a/src/video_core/memory_manager.cpp +++ b/src/video_core/memory_manager.cpp @@ -5,16 +5,13 @@  #include "common/alignment.h"  #include "common/assert.h"  #include "common/logging/log.h" -#include "core/core.h"  #include "core/memory.h" -#include "video_core/gpu.h"  #include "video_core/memory_manager.h"  #include "video_core/rasterizer_interface.h" -#include "video_core/renderer_base.h"  namespace Tegra { -MemoryManager::MemoryManager() { +MemoryManager::MemoryManager(VideoCore::RasterizerInterface& rasterizer) : rasterizer{rasterizer} {      std::fill(page_table.pointers.begin(), page_table.pointers.end(), nullptr);      std::fill(page_table.attributes.begin(), page_table.attributes.end(),                Common::PageType::Unmapped); @@ -70,8 +67,7 @@ GPUVAddr MemoryManager::UnmapBuffer(GPUVAddr gpu_addr, u64 size) {      const u64 aligned_size{Common::AlignUp(size, page_size)};      const CacheAddr cache_addr{ToCacheAddr(GetPointer(gpu_addr))}; -    Core::System::GetInstance().Renderer().Rasterizer().FlushAndInvalidateRegion(cache_addr, -                                                                                 aligned_size); +    rasterizer.FlushAndInvalidateRegion(cache_addr, aligned_size);      UnmapRange(gpu_addr, aligned_size);      return gpu_addr; @@ -204,14 +200,85 @@ const u8* MemoryManager::GetPointer(GPUVAddr addr) const {  }  void MemoryManager::ReadBlock(GPUVAddr src_addr, void* dest_buffer, std::size_t size) const { -    std::memcpy(dest_buffer, GetPointer(src_addr), size); +    std::size_t remaining_size{size}; +    std::size_t page_index{src_addr >> page_bits}; +    std::size_t page_offset{src_addr & page_mask}; + +    while (remaining_size > 0) { +        const std::size_t copy_amount{ +            std::min(static_cast<std::size_t>(page_size) - page_offset, remaining_size)}; + +        switch (page_table.attributes[page_index]) { +        case Common::PageType::Memory: { +            const u8* src_ptr{page_table.pointers[page_index] + page_offset}; +            rasterizer.FlushRegion(ToCacheAddr(src_ptr), copy_amount); +            std::memcpy(dest_buffer, src_ptr, copy_amount); +            break; +        } +        default: +            UNREACHABLE(); +        } + +        page_index++; +        page_offset = 0; +        dest_buffer = static_cast<u8*>(dest_buffer) + copy_amount; +        remaining_size -= copy_amount; +    }  } +  void MemoryManager::WriteBlock(GPUVAddr dest_addr, const void* src_buffer, std::size_t size) { -    std::memcpy(GetPointer(dest_addr), src_buffer, size); +    std::size_t remaining_size{size}; +    std::size_t page_index{dest_addr >> page_bits}; +    std::size_t page_offset{dest_addr & page_mask}; + +    while (remaining_size > 0) { +        const std::size_t copy_amount{ +            std::min(static_cast<std::size_t>(page_size) - page_offset, remaining_size)}; + +        switch (page_table.attributes[page_index]) { +        case Common::PageType::Memory: { +            u8* dest_ptr{page_table.pointers[page_index] + page_offset}; +            rasterizer.InvalidateRegion(ToCacheAddr(dest_ptr), copy_amount); +            std::memcpy(dest_ptr, src_buffer, copy_amount); +            break; +        } +        default: +            UNREACHABLE(); +        } + +        page_index++; +        page_offset = 0; +        src_buffer = static_cast<const u8*>(src_buffer) + copy_amount; +        remaining_size -= copy_amount; +    }  }  void MemoryManager::CopyBlock(GPUVAddr dest_addr, GPUVAddr src_addr, std::size_t size) { -    std::memcpy(GetPointer(dest_addr), GetPointer(src_addr), size); +    std::size_t remaining_size{size}; +    std::size_t page_index{src_addr >> page_bits}; +    std::size_t page_offset{src_addr & page_mask}; + +    while (remaining_size > 0) { +        const std::size_t copy_amount{ +            std::min(static_cast<std::size_t>(page_size) - page_offset, remaining_size)}; + +        switch (page_table.attributes[page_index]) { +        case Common::PageType::Memory: { +            const u8* src_ptr{page_table.pointers[page_index] + page_offset}; +            rasterizer.FlushRegion(ToCacheAddr(src_ptr), copy_amount); +            WriteBlock(dest_addr, src_ptr, copy_amount); +            break; +        } +        default: +            UNREACHABLE(); +        } + +        page_index++; +        page_offset = 0; +        dest_addr += static_cast<VAddr>(copy_amount); +        src_addr += static_cast<VAddr>(copy_amount); +        remaining_size -= copy_amount; +    }  }  void MemoryManager::MapPages(GPUVAddr base, u64 size, u8* memory, Common::PageType type, @@ -351,7 +418,7 @@ MemoryManager::VMAIter MemoryManager::CarveVMA(GPUVAddr base, u64 size) {      const VirtualMemoryArea& vma{vma_handle->second};      if (vma.type == VirtualMemoryArea::Type::Mapped) {          // Region is already allocated -        return {}; +        return vma_handle;      }      const VAddr start_in_vma{base - vma.base}; diff --git a/src/video_core/memory_manager.h b/src/video_core/memory_manager.h index 178e2f655..647cbf93a 100644 --- a/src/video_core/memory_manager.h +++ b/src/video_core/memory_manager.h @@ -10,6 +10,10 @@  #include "common/common_types.h"  #include "common/page_table.h" +namespace VideoCore { +class RasterizerInterface; +} +  namespace Tegra {  /** @@ -43,7 +47,7 @@ struct VirtualMemoryArea {  class MemoryManager final {  public: -    MemoryManager(); +    MemoryManager(VideoCore::RasterizerInterface& rasterizer);      GPUVAddr AllocateSpace(u64 size, u64 align);      GPUVAddr AllocateSpace(GPUVAddr addr, u64 size, u64 align); @@ -144,6 +148,7 @@ private:      Common::PageTable page_table{page_bits};      VMAMap vma_map; +    VideoCore::RasterizerInterface& rasterizer;  };  } // namespace Tegra | 
