diff options
39 files changed, 248 insertions, 181 deletions
| diff --git a/externals/cubeb b/externals/cubeb -Subproject 12b78c0edfa40007e41dbdcd9dfe367fbb98d01 +Subproject 6f2420de8f155b10330cf973900ac7bdbfee589 diff --git a/src/audio_core/audio_renderer.h b/src/audio_core/audio_renderer.h index 201ec7a3c..b2e5d336c 100644 --- a/src/audio_core/audio_renderer.h +++ b/src/audio_core/audio_renderer.h @@ -46,16 +46,18 @@ struct AudioRendererParameter {      u32_le sample_rate;      u32_le sample_count;      u32_le mix_buffer_count; -    u32_le unknown_c; +    u32_le submix_count;      u32_le voice_count;      u32_le sink_count;      u32_le effect_count; -    u32_le unknown_1c; -    u8 unknown_20; -    INSERT_PADDING_BYTES(3); +    u32_le performance_frame_count; +    u8 is_voice_drop_enabled; +    u8 unknown_21; +    u8 unknown_22; +    u8 execution_mode;      u32_le splitter_count; -    u32_le unknown_2c; -    INSERT_PADDING_WORDS(1); +    u32_le num_splitter_send_channels; +    u32_le unknown_30;      u32_le revision;  };  static_assert(sizeof(AudioRendererParameter) == 52, "AudioRendererParameter is an invalid size"); diff --git a/src/audio_core/cubeb_sink.cpp b/src/audio_core/cubeb_sink.cpp index dc45dedd3..1da0b9f2a 100644 --- a/src/audio_core/cubeb_sink.cpp +++ b/src/audio_core/cubeb_sink.cpp @@ -12,6 +12,10 @@  #include "common/ring_buffer.h"  #include "core/settings.h" +#ifdef _MSC_VER +#include <objbase.h> +#endif +  namespace AudioCore {  class CubebSinkStream final : public SinkStream { @@ -108,6 +112,11 @@ private:  };  CubebSink::CubebSink(std::string_view target_device_name) { +    // Cubeb requires COM to be initialized on the thread calling cubeb_init on Windows +#ifdef _MSC_VER +    com_init_result = CoInitializeEx(nullptr, COINIT_MULTITHREADED); +#endif +      if (cubeb_init(&ctx, "yuzu", nullptr) != CUBEB_OK) {          LOG_CRITICAL(Audio_Sink, "cubeb_init failed");          return; @@ -142,6 +151,12 @@ CubebSink::~CubebSink() {      }      cubeb_destroy(ctx); + +#ifdef _MSC_VER +    if (SUCCEEDED(com_init_result)) { +        CoUninitialize(); +    } +#endif  }  SinkStream& CubebSink::AcquireSinkStream(u32 sample_rate, u32 num_channels, diff --git a/src/audio_core/cubeb_sink.h b/src/audio_core/cubeb_sink.h index efb9d1634..511df7bb1 100644 --- a/src/audio_core/cubeb_sink.h +++ b/src/audio_core/cubeb_sink.h @@ -25,6 +25,10 @@ private:      cubeb* ctx{};      cubeb_devid output_device{};      std::vector<SinkStreamPtr> sink_streams; + +#ifdef _MSC_VER +    u32 com_init_result = 0; +#endif  };  std::vector<std::string> ListCubebSinkDevices(); diff --git a/src/common/color.h b/src/common/color.h index 0379040be..3a2222077 100644 --- a/src/common/color.h +++ b/src/common/color.h @@ -55,36 +55,36 @@ constexpr u8 Convert8To6(u8 value) {  /**   * Decode a color stored in RGBA8 format   * @param bytes Pointer to encoded source color - * @return Result color decoded as Math::Vec4<u8> + * @return Result color decoded as Common::Vec4<u8>   */ -inline Math::Vec4<u8> DecodeRGBA8(const u8* bytes) { +inline Common::Vec4<u8> DecodeRGBA8(const u8* bytes) {      return {bytes[3], bytes[2], bytes[1], bytes[0]};  }  /**   * Decode a color stored in RGB8 format   * @param bytes Pointer to encoded source color - * @return Result color decoded as Math::Vec4<u8> + * @return Result color decoded as Common::Vec4<u8>   */ -inline Math::Vec4<u8> DecodeRGB8(const u8* bytes) { +inline Common::Vec4<u8> DecodeRGB8(const u8* bytes) {      return {bytes[2], bytes[1], bytes[0], 255};  }  /**   * Decode a color stored in RG8 (aka HILO8) format   * @param bytes Pointer to encoded source color - * @return Result color decoded as Math::Vec4<u8> + * @return Result color decoded as Common::Vec4<u8>   */ -inline Math::Vec4<u8> DecodeRG8(const u8* bytes) { +inline Common::Vec4<u8> DecodeRG8(const u8* bytes) {      return {bytes[1], bytes[0], 0, 255};  }  /**   * Decode a color stored in RGB565 format   * @param bytes Pointer to encoded source color - * @return Result color decoded as Math::Vec4<u8> + * @return Result color decoded as Common::Vec4<u8>   */ -inline Math::Vec4<u8> DecodeRGB565(const u8* bytes) { +inline Common::Vec4<u8> DecodeRGB565(const u8* bytes) {      u16_le pixel;      std::memcpy(&pixel, bytes, sizeof(pixel));      return {Convert5To8((pixel >> 11) & 0x1F), Convert6To8((pixel >> 5) & 0x3F), @@ -94,9 +94,9 @@ inline Math::Vec4<u8> DecodeRGB565(const u8* bytes) {  /**   * Decode a color stored in RGB5A1 format   * @param bytes Pointer to encoded source color - * @return Result color decoded as Math::Vec4<u8> + * @return Result color decoded as Common::Vec4<u8>   */ -inline Math::Vec4<u8> DecodeRGB5A1(const u8* bytes) { +inline Common::Vec4<u8> DecodeRGB5A1(const u8* bytes) {      u16_le pixel;      std::memcpy(&pixel, bytes, sizeof(pixel));      return {Convert5To8((pixel >> 11) & 0x1F), Convert5To8((pixel >> 6) & 0x1F), @@ -106,9 +106,9 @@ inline Math::Vec4<u8> DecodeRGB5A1(const u8* bytes) {  /**   * Decode a color stored in RGBA4 format   * @param bytes Pointer to encoded source color - * @return Result color decoded as Math::Vec4<u8> + * @return Result color decoded as Common::Vec4<u8>   */ -inline Math::Vec4<u8> DecodeRGBA4(const u8* bytes) { +inline Common::Vec4<u8> DecodeRGBA4(const u8* bytes) {      u16_le pixel;      std::memcpy(&pixel, bytes, sizeof(pixel));      return {Convert4To8((pixel >> 12) & 0xF), Convert4To8((pixel >> 8) & 0xF), @@ -138,9 +138,9 @@ inline u32 DecodeD24(const u8* bytes) {  /**   * Decode a depth value and a stencil value stored in D24S8 format   * @param bytes Pointer to encoded source values - * @return Resulting values stored as a Math::Vec2 + * @return Resulting values stored as a Common::Vec2   */ -inline Math::Vec2<u32> DecodeD24S8(const u8* bytes) { +inline Common::Vec2<u32> DecodeD24S8(const u8* bytes) {      return {static_cast<u32>((bytes[2] << 16) | (bytes[1] << 8) | bytes[0]), bytes[3]};  } @@ -149,7 +149,7 @@ inline Math::Vec2<u32> DecodeD24S8(const u8* bytes) {   * @param color Source color to encode   * @param bytes Destination pointer to store encoded color   */ -inline void EncodeRGBA8(const Math::Vec4<u8>& color, u8* bytes) { +inline void EncodeRGBA8(const Common::Vec4<u8>& color, u8* bytes) {      bytes[3] = color.r();      bytes[2] = color.g();      bytes[1] = color.b(); @@ -161,7 +161,7 @@ inline void EncodeRGBA8(const Math::Vec4<u8>& color, u8* bytes) {   * @param color Source color to encode   * @param bytes Destination pointer to store encoded color   */ -inline void EncodeRGB8(const Math::Vec4<u8>& color, u8* bytes) { +inline void EncodeRGB8(const Common::Vec4<u8>& color, u8* bytes) {      bytes[2] = color.r();      bytes[1] = color.g();      bytes[0] = color.b(); @@ -172,7 +172,7 @@ inline void EncodeRGB8(const Math::Vec4<u8>& color, u8* bytes) {   * @param color Source color to encode   * @param bytes Destination pointer to store encoded color   */ -inline void EncodeRG8(const Math::Vec4<u8>& color, u8* bytes) { +inline void EncodeRG8(const Common::Vec4<u8>& color, u8* bytes) {      bytes[1] = color.r();      bytes[0] = color.g();  } @@ -181,7 +181,7 @@ inline void EncodeRG8(const Math::Vec4<u8>& color, u8* bytes) {   * @param color Source color to encode   * @param bytes Destination pointer to store encoded color   */ -inline void EncodeRGB565(const Math::Vec4<u8>& color, u8* bytes) { +inline void EncodeRGB565(const Common::Vec4<u8>& color, u8* bytes) {      const u16_le data =          (Convert8To5(color.r()) << 11) | (Convert8To6(color.g()) << 5) | Convert8To5(color.b()); @@ -193,7 +193,7 @@ inline void EncodeRGB565(const Math::Vec4<u8>& color, u8* bytes) {   * @param color Source color to encode   * @param bytes Destination pointer to store encoded color   */ -inline void EncodeRGB5A1(const Math::Vec4<u8>& color, u8* bytes) { +inline void EncodeRGB5A1(const Common::Vec4<u8>& color, u8* bytes) {      const u16_le data = (Convert8To5(color.r()) << 11) | (Convert8To5(color.g()) << 6) |                          (Convert8To5(color.b()) << 1) | Convert8To1(color.a()); @@ -205,7 +205,7 @@ inline void EncodeRGB5A1(const Math::Vec4<u8>& color, u8* bytes) {   * @param color Source color to encode   * @param bytes Destination pointer to store encoded color   */ -inline void EncodeRGBA4(const Math::Vec4<u8>& color, u8* bytes) { +inline void EncodeRGBA4(const Common::Vec4<u8>& color, u8* bytes) {      const u16 data = (Convert8To4(color.r()) << 12) | (Convert8To4(color.g()) << 8) |                       (Convert8To4(color.b()) << 4) | Convert8To4(color.a()); diff --git a/src/common/math_util.h b/src/common/math_util.h index 94b4394c5..cff3d48c5 100644 --- a/src/common/math_util.h +++ b/src/common/math_util.h @@ -7,7 +7,7 @@  #include <cstdlib>  #include <type_traits> -namespace MathUtil { +namespace Common {  constexpr float PI = 3.14159265f; @@ -41,4 +41,4 @@ struct Rectangle {      }  }; -} // namespace MathUtil +} // namespace Common diff --git a/src/common/quaternion.h b/src/common/quaternion.h index c528c0b68..370198ae0 100644 --- a/src/common/quaternion.h +++ b/src/common/quaternion.h @@ -6,12 +6,12 @@  #include "common/vector_math.h" -namespace Math { +namespace Common {  template <typename T>  class Quaternion {  public: -    Math::Vec3<T> xyz; +    Vec3<T> xyz;      T w{};      Quaternion<decltype(-T{})> Inverse() const { @@ -38,12 +38,12 @@ public:  };  template <typename T> -auto QuaternionRotate(const Quaternion<T>& q, const Math::Vec3<T>& v) { +auto QuaternionRotate(const Quaternion<T>& q, const Vec3<T>& v) {      return v + 2 * Cross(q.xyz, Cross(q.xyz, v) + v * q.w);  } -inline Quaternion<float> MakeQuaternion(const Math::Vec3<float>& axis, float angle) { +inline Quaternion<float> MakeQuaternion(const Vec3<float>& axis, float angle) {      return {axis * std::sin(angle / 2), std::cos(angle / 2)};  } -} // namespace Math +} // namespace Common diff --git a/src/common/vector_math.h b/src/common/vector_math.h index 8feb49941..429485329 100644 --- a/src/common/vector_math.h +++ b/src/common/vector_math.h @@ -33,7 +33,7 @@  #include <cmath>  #include <type_traits> -namespace Math { +namespace Common {  template <typename T>  class Vec2; @@ -690,4 +690,4 @@ constexpr Vec4<T> MakeVec(const T& x, const Vec3<T>& yzw) {      return MakeVec(x, yzw[0], yzw[1], yzw[2]);  } -} // namespace Math +} // namespace Common diff --git a/src/core/frontend/emu_window.cpp b/src/core/frontend/emu_window.cpp index 9dd493efb..e29afd630 100644 --- a/src/core/frontend/emu_window.cpp +++ b/src/core/frontend/emu_window.cpp @@ -67,7 +67,7 @@ static bool IsWithinTouchscreen(const Layout::FramebufferLayout& layout, unsigne              framebuffer_x >= layout.screen.left && framebuffer_x < layout.screen.right);  } -std::tuple<unsigned, unsigned> EmuWindow::ClipToTouchScreen(unsigned new_x, unsigned new_y) { +std::tuple<unsigned, unsigned> EmuWindow::ClipToTouchScreen(unsigned new_x, unsigned new_y) const {      new_x = std::max(new_x, framebuffer_layout.screen.left);      new_x = std::min(new_x, framebuffer_layout.screen.right - 1); diff --git a/src/core/frontend/emu_window.h b/src/core/frontend/emu_window.h index 7006a37b3..d0bcb4660 100644 --- a/src/core/frontend/emu_window.h +++ b/src/core/frontend/emu_window.h @@ -166,7 +166,7 @@ private:      /**       * Clip the provided coordinates to be inside the touchscreen area.       */ -    std::tuple<unsigned, unsigned> ClipToTouchScreen(unsigned new_x, unsigned new_y); +    std::tuple<unsigned, unsigned> ClipToTouchScreen(unsigned new_x, unsigned new_y) const;  };  } // namespace Core::Frontend diff --git a/src/core/frontend/framebuffer_layout.cpp b/src/core/frontend/framebuffer_layout.cpp index f8662d193..a1357179f 100644 --- a/src/core/frontend/framebuffer_layout.cpp +++ b/src/core/frontend/framebuffer_layout.cpp @@ -12,12 +12,12 @@ namespace Layout {  // Finds the largest size subrectangle contained in window area that is confined to the aspect ratio  template <class T> -static MathUtil::Rectangle<T> maxRectangle(MathUtil::Rectangle<T> window_area, -                                           float screen_aspect_ratio) { +static Common::Rectangle<T> MaxRectangle(Common::Rectangle<T> window_area, +                                         float screen_aspect_ratio) {      float scale = std::min(static_cast<float>(window_area.GetWidth()),                             window_area.GetHeight() / screen_aspect_ratio); -    return MathUtil::Rectangle<T>{0, 0, static_cast<T>(std::round(scale)), -                                  static_cast<T>(std::round(scale * screen_aspect_ratio))}; +    return Common::Rectangle<T>{0, 0, static_cast<T>(std::round(scale)), +                                static_cast<T>(std::round(scale * screen_aspect_ratio))};  }  FramebufferLayout DefaultFrameLayout(unsigned width, unsigned height) { @@ -29,8 +29,8 @@ FramebufferLayout DefaultFrameLayout(unsigned width, unsigned height) {      const float emulation_aspect_ratio{static_cast<float>(ScreenUndocked::Height) /                                         ScreenUndocked::Width}; -    MathUtil::Rectangle<unsigned> screen_window_area{0, 0, width, height}; -    MathUtil::Rectangle<unsigned> screen = maxRectangle(screen_window_area, emulation_aspect_ratio); +    Common::Rectangle<unsigned> screen_window_area{0, 0, width, height}; +    Common::Rectangle<unsigned> screen = MaxRectangle(screen_window_area, emulation_aspect_ratio);      float window_aspect_ratio = static_cast<float>(height) / width; diff --git a/src/core/frontend/framebuffer_layout.h b/src/core/frontend/framebuffer_layout.h index e06647794..c2c63d08c 100644 --- a/src/core/frontend/framebuffer_layout.h +++ b/src/core/frontend/framebuffer_layout.h @@ -16,7 +16,7 @@ struct FramebufferLayout {      unsigned width{ScreenUndocked::Width};      unsigned height{ScreenUndocked::Height}; -    MathUtil::Rectangle<unsigned> screen; +    Common::Rectangle<unsigned> screen;      /**       * Returns the ration of pixel size of the screen, compared to the native size of the undocked diff --git a/src/core/frontend/input.h b/src/core/frontend/input.h index 16fdcd376..7c11d7546 100644 --- a/src/core/frontend/input.h +++ b/src/core/frontend/input.h @@ -124,7 +124,7 @@ using AnalogDevice = InputDevice<std::tuple<float, float>>;   *   Orientation is determined by right-hand rule.   *   Units: deg/sec   */ -using MotionDevice = InputDevice<std::tuple<Math::Vec3<float>, Math::Vec3<float>>>; +using MotionDevice = InputDevice<std::tuple<Common::Vec3<float>, Common::Vec3<float>>>;  /**   * A touch device is an input device that returns a tuple of two floats and a bool. The floats are diff --git a/src/core/hle/kernel/errors.h b/src/core/hle/kernel/errors.h index d17eb0cb6..8097b3863 100644 --- a/src/core/hle/kernel/errors.h +++ b/src/core/hle/kernel/errors.h @@ -14,6 +14,7 @@ constexpr ResultCode ERR_MAX_CONNECTIONS_REACHED{ErrorModule::Kernel, 7};  constexpr ResultCode ERR_INVALID_CAPABILITY_DESCRIPTOR{ErrorModule::Kernel, 14};  constexpr ResultCode ERR_INVALID_SIZE{ErrorModule::Kernel, 101};  constexpr ResultCode ERR_INVALID_ADDRESS{ErrorModule::Kernel, 102}; +constexpr ResultCode ERR_OUT_OF_MEMORY{ErrorModule::Kernel, 104};  constexpr ResultCode ERR_HANDLE_TABLE_FULL{ErrorModule::Kernel, 105};  constexpr ResultCode ERR_INVALID_ADDRESS_STATE{ErrorModule::Kernel, 106};  constexpr ResultCode ERR_INVALID_MEMORY_PERMISSIONS{ErrorModule::Kernel, 108}; diff --git a/src/core/hle/kernel/handle_table.cpp b/src/core/hle/kernel/handle_table.cpp index c8acde5b1..bdfaa977f 100644 --- a/src/core/hle/kernel/handle_table.cpp +++ b/src/core/hle/kernel/handle_table.cpp @@ -14,32 +14,47 @@  namespace Kernel {  namespace {  constexpr u16 GetSlot(Handle handle) { -    return handle >> 15; +    return static_cast<u16>(handle >> 15);  }  constexpr u16 GetGeneration(Handle handle) { -    return handle & 0x7FFF; +    return static_cast<u16>(handle & 0x7FFF);  }  } // Anonymous namespace  HandleTable::HandleTable() { -    next_generation = 1;      Clear();  }  HandleTable::~HandleTable() = default; +ResultCode HandleTable::SetSize(s32 handle_table_size) { +    if (static_cast<u32>(handle_table_size) > MAX_COUNT) { +        return ERR_OUT_OF_MEMORY; +    } + +    // Values less than or equal to zero indicate to use the maximum allowable +    // size for the handle table in the actual kernel, so we ignore the given +    // value in that case, since we assume this by default unless this function +    // is called. +    if (handle_table_size > 0) { +        table_size = static_cast<u16>(handle_table_size); +    } + +    return RESULT_SUCCESS; +} +  ResultVal<Handle> HandleTable::Create(SharedPtr<Object> obj) {      DEBUG_ASSERT(obj != nullptr); -    u16 slot = next_free_slot; -    if (slot >= generations.size()) { +    const u16 slot = next_free_slot; +    if (slot >= table_size) {          LOG_ERROR(Kernel, "Unable to allocate Handle, too many slots in use.");          return ERR_HANDLE_TABLE_FULL;      }      next_free_slot = generations[slot]; -    u16 generation = next_generation++; +    const u16 generation = next_generation++;      // Overflow count so it fits in the 15 bits dedicated to the generation in the handle.      // Horizon OS uses zero to represent an invalid handle, so skip to 1. @@ -64,10 +79,11 @@ ResultVal<Handle> HandleTable::Duplicate(Handle handle) {  }  ResultCode HandleTable::Close(Handle handle) { -    if (!IsValid(handle)) +    if (!IsValid(handle)) {          return ERR_INVALID_HANDLE; +    } -    u16 slot = GetSlot(handle); +    const u16 slot = GetSlot(handle);      objects[slot] = nullptr; @@ -77,10 +93,10 @@ ResultCode HandleTable::Close(Handle handle) {  }  bool HandleTable::IsValid(Handle handle) const { -    std::size_t slot = GetSlot(handle); -    u16 generation = GetGeneration(handle); +    const std::size_t slot = GetSlot(handle); +    const u16 generation = GetGeneration(handle); -    return slot < MAX_COUNT && objects[slot] != nullptr && generations[slot] == generation; +    return slot < table_size && objects[slot] != nullptr && generations[slot] == generation;  }  SharedPtr<Object> HandleTable::GetGeneric(Handle handle) const { @@ -97,7 +113,7 @@ SharedPtr<Object> HandleTable::GetGeneric(Handle handle) const {  }  void HandleTable::Clear() { -    for (u16 i = 0; i < MAX_COUNT; ++i) { +    for (u16 i = 0; i < table_size; ++i) {          generations[i] = i + 1;          objects[i] = nullptr;      } diff --git a/src/core/hle/kernel/handle_table.h b/src/core/hle/kernel/handle_table.h index 89a3bc740..44901391b 100644 --- a/src/core/hle/kernel/handle_table.h +++ b/src/core/hle/kernel/handle_table.h @@ -50,6 +50,20 @@ public:      ~HandleTable();      /** +     * Sets the number of handles that may be in use at one time +     * for this handle table. +     * +     * @param handle_table_size The desired size to limit the handle table to. +     * +     * @returns an error code indicating if initialization was successful. +     *          If initialization was not successful, then ERR_OUT_OF_MEMORY +     *          will be returned. +     * +     * @pre handle_table_size must be within the range [0, 1024] +     */ +    ResultCode SetSize(s32 handle_table_size); + +    /**       * Allocates a handle for the given object.       * @return The created Handle or one of the following errors:       *           - `ERR_HANDLE_TABLE_FULL`: the maximum number of handles has been exceeded. @@ -104,13 +118,20 @@ private:      std::array<u16, MAX_COUNT> generations;      /** +     * The limited size of the handle table. This can be specified by process +     * capabilities in order to restrict the overall number of handles that +     * can be created in a process instance +     */ +    u16 table_size = static_cast<u16>(MAX_COUNT); + +    /**       * Global counter of the number of created handles. Stored in `generations` when a handle is       * created, and wraps around to 1 when it hits 0x8000.       */ -    u16 next_generation; +    u16 next_generation = 1;      /// Head of the free slots linked list. -    u16 next_free_slot; +    u16 next_free_slot = 0;  };  } // namespace Kernel diff --git a/src/core/hle/kernel/process.cpp b/src/core/hle/kernel/process.cpp index c5aa19afa..8009150e0 100644 --- a/src/core/hle/kernel/process.cpp +++ b/src/core/hle/kernel/process.cpp @@ -99,7 +99,13 @@ ResultCode Process::LoadFromMetadata(const FileSys::ProgramMetadata& metadata) {      vm_manager.Reset(metadata.GetAddressSpaceType());      const auto& caps = metadata.GetKernelCapabilities(); -    return capabilities.InitializeForUserProcess(caps.data(), caps.size(), vm_manager); +    const auto capability_init_result = +        capabilities.InitializeForUserProcess(caps.data(), caps.size(), vm_manager); +    if (capability_init_result.IsError()) { +        return capability_init_result; +    } + +    return handle_table.SetSize(capabilities.GetHandleTableSize());  }  void Process::Run(VAddr entry_point, s32 main_thread_priority, u32 stack_size) { diff --git a/src/core/hle/kernel/process_capability.cpp b/src/core/hle/kernel/process_capability.cpp index 3a2164b25..583e35b79 100644 --- a/src/core/hle/kernel/process_capability.cpp +++ b/src/core/hle/kernel/process_capability.cpp @@ -96,7 +96,7 @@ void ProcessCapabilities::InitializeForMetadatalessProcess() {      interrupt_capabilities.set();      // Allow using the maximum possible amount of handles -    handle_table_size = static_cast<u32>(HandleTable::MAX_COUNT); +    handle_table_size = static_cast<s32>(HandleTable::MAX_COUNT);      // Allow all debugging capabilities.      is_debuggable = true; @@ -337,7 +337,7 @@ ResultCode ProcessCapabilities::HandleHandleTableFlags(u32 flags) {          return ERR_RESERVED_VALUE;      } -    handle_table_size = (flags >> 16) & 0x3FF; +    handle_table_size = static_cast<s32>((flags >> 16) & 0x3FF);      return RESULT_SUCCESS;  } diff --git a/src/core/hle/kernel/process_capability.h b/src/core/hle/kernel/process_capability.h index fbc8812a3..5cdd80747 100644 --- a/src/core/hle/kernel/process_capability.h +++ b/src/core/hle/kernel/process_capability.h @@ -156,7 +156,7 @@ public:      }      /// Gets the number of total allowable handles for the process' handle table. -    u32 GetHandleTableSize() const { +    s32 GetHandleTableSize() const {          return handle_table_size;      } @@ -252,7 +252,7 @@ private:      u64 core_mask = 0;      u64 priority_mask = 0; -    u32 handle_table_size = 0; +    s32 handle_table_size = 0;      u32 kernel_version = 0;      ProgramType program_type = ProgramType::SysModule; diff --git a/src/core/hle/service/audio/audren_u.cpp b/src/core/hle/service/audio/audren_u.cpp index 7e0cc64a8..49648394c 100644 --- a/src/core/hle/service/audio/audren_u.cpp +++ b/src/core/hle/service/audio/audren_u.cpp @@ -262,20 +262,20 @@ void AudRenU::GetAudioRendererWorkBufferSize(Kernel::HLERequestContext& ctx) {      LOG_DEBUG(Service_Audio, "called");      u64 buffer_sz = Common::AlignUp(4 * params.mix_buffer_count, 0x40); -    buffer_sz += params.unknown_c * 1024; -    buffer_sz += 0x940 * (params.unknown_c + 1); +    buffer_sz += params.submix_count * 1024; +    buffer_sz += 0x940 * (params.submix_count + 1);      buffer_sz += 0x3F0 * params.voice_count; -    buffer_sz += Common::AlignUp(8 * (params.unknown_c + 1), 0x10); +    buffer_sz += Common::AlignUp(8 * (params.submix_count + 1), 0x10);      buffer_sz += Common::AlignUp(8 * params.voice_count, 0x10); -    buffer_sz += -        Common::AlignUp((0x3C0 * (params.sink_count + params.unknown_c) + 4 * params.sample_count) * -                            (params.mix_buffer_count + 6), -                        0x40); +    buffer_sz += Common::AlignUp( +        (0x3C0 * (params.sink_count + params.submix_count) + 4 * params.sample_count) * +            (params.mix_buffer_count + 6), +        0x40);      if (IsFeatureSupported(AudioFeatures::Splitter, params.revision)) { -        u32 count = params.unknown_c + 1; +        const u32 count = params.submix_count + 1;          u64 node_count = Common::AlignUp(count, 0x40); -        u64 node_state_buffer_sz = +        const u64 node_state_buffer_sz =              4 * (node_count * node_count) + 0xC * node_count + 2 * (node_count / 8);          u64 edge_matrix_buffer_sz = 0;          node_count = Common::AlignUp(count * count, 0x40); @@ -289,19 +289,19 @@ void AudRenU::GetAudioRendererWorkBufferSize(Kernel::HLERequestContext& ctx) {      buffer_sz += 0x20 * (params.effect_count + 4 * params.voice_count) + 0x50;      if (IsFeatureSupported(AudioFeatures::Splitter, params.revision)) { -        buffer_sz += 0xE0 * params.unknown_2c; +        buffer_sz += 0xE0 * params.num_splitter_send_channels;          buffer_sz += 0x20 * params.splitter_count; -        buffer_sz += Common::AlignUp(4 * params.unknown_2c, 0x10); +        buffer_sz += Common::AlignUp(4 * params.num_splitter_send_channels, 0x10);      }      buffer_sz = Common::AlignUp(buffer_sz, 0x40) + 0x170 * params.sink_count;      u64 output_sz = buffer_sz + 0x280 * params.sink_count + 0x4B0 * params.effect_count +                      ((params.voice_count * 256) | 0x40); -    if (params.unknown_1c >= 1) { +    if (params.performance_frame_count >= 1) {          output_sz = Common::AlignUp(((16 * params.sink_count + 16 * params.effect_count +                                        16 * params.voice_count + 16) +                                       0x658) * -                                            (params.unknown_1c + 1) + +                                            (params.performance_frame_count + 1) +                                          0xc0,                                      0x40) +                      output_sz; diff --git a/src/core/hle/service/nvdrv/devices/nvdisp_disp0.cpp b/src/core/hle/service/nvdrv/devices/nvdisp_disp0.cpp index 21ccfe1f8..dbe7ee6e8 100644 --- a/src/core/hle/service/nvdrv/devices/nvdisp_disp0.cpp +++ b/src/core/hle/service/nvdrv/devices/nvdisp_disp0.cpp @@ -23,7 +23,7 @@ u32 nvdisp_disp0::ioctl(Ioctl command, const std::vector<u8>& input, std::vector  void nvdisp_disp0::flip(u32 buffer_handle, u32 offset, u32 format, u32 width, u32 height,                          u32 stride, NVFlinger::BufferQueue::BufferTransformFlags transform, -                        const MathUtil::Rectangle<int>& crop_rect) { +                        const Common::Rectangle<int>& crop_rect) {      VAddr addr = nvmap_dev->GetObjectAddress(buffer_handle);      LOG_TRACE(Service,                "Drawing from address {:X} offset {:08X} Width {} Height {} Stride {} Format {}", diff --git a/src/core/hle/service/nvdrv/devices/nvdisp_disp0.h b/src/core/hle/service/nvdrv/devices/nvdisp_disp0.h index a45086e45..ace71169f 100644 --- a/src/core/hle/service/nvdrv/devices/nvdisp_disp0.h +++ b/src/core/hle/service/nvdrv/devices/nvdisp_disp0.h @@ -25,7 +25,7 @@ public:      /// Performs a screen flip, drawing the buffer pointed to by the handle.      void flip(u32 buffer_handle, u32 offset, u32 format, u32 width, u32 height, u32 stride,                NVFlinger::BufferQueue::BufferTransformFlags transform, -              const MathUtil::Rectangle<int>& crop_rect); +              const Common::Rectangle<int>& crop_rect);  private:      std::shared_ptr<nvmap> nvmap_dev; diff --git a/src/core/hle/service/nvflinger/buffer_queue.cpp b/src/core/hle/service/nvflinger/buffer_queue.cpp index fc07d9bb8..4d150fc71 100644 --- a/src/core/hle/service/nvflinger/buffer_queue.cpp +++ b/src/core/hle/service/nvflinger/buffer_queue.cpp @@ -63,7 +63,7 @@ const IGBPBuffer& BufferQueue::RequestBuffer(u32 slot) const {  }  void BufferQueue::QueueBuffer(u32 slot, BufferTransformFlags transform, -                              const MathUtil::Rectangle<int>& crop_rect) { +                              const Common::Rectangle<int>& crop_rect) {      auto itr = std::find_if(queue.begin(), queue.end(),                              [&](const Buffer& buffer) { return buffer.slot == slot; });      ASSERT(itr != queue.end()); diff --git a/src/core/hle/service/nvflinger/buffer_queue.h b/src/core/hle/service/nvflinger/buffer_queue.h index ab90d591e..e1ccb6171 100644 --- a/src/core/hle/service/nvflinger/buffer_queue.h +++ b/src/core/hle/service/nvflinger/buffer_queue.h @@ -67,14 +67,14 @@ public:          Status status = Status::Free;          IGBPBuffer igbp_buffer;          BufferTransformFlags transform; -        MathUtil::Rectangle<int> crop_rect; +        Common::Rectangle<int> crop_rect;      };      void SetPreallocatedBuffer(u32 slot, const IGBPBuffer& igbp_buffer);      std::optional<u32> DequeueBuffer(u32 width, u32 height);      const IGBPBuffer& RequestBuffer(u32 slot) const;      void QueueBuffer(u32 slot, BufferTransformFlags transform, -                     const MathUtil::Rectangle<int>& crop_rect); +                     const Common::Rectangle<int>& crop_rect);      std::optional<std::reference_wrapper<const Buffer>> AcquireBuffer();      void ReleaseBuffer(u32 slot);      u32 Query(QueryType type); diff --git a/src/core/hle/service/vi/vi.cpp b/src/core/hle/service/vi/vi.cpp index 74384a24d..a975767bb 100644 --- a/src/core/hle/service/vi/vi.cpp +++ b/src/core/hle/service/vi/vi.cpp @@ -420,7 +420,7 @@ public:          u32_le fence_is_valid;          std::array<Fence, 2> fences; -        MathUtil::Rectangle<int> GetCropRect() const { +        Common::Rectangle<int> GetCropRect() const {              return {crop_left, crop_top, crop_right, crop_bottom};          }      }; diff --git a/src/core/memory.cpp b/src/core/memory.cpp index e9166dbd9..f809567b6 100644 --- a/src/core/memory.cpp +++ b/src/core/memory.cpp @@ -71,15 +71,20 @@ static void MapPages(PageTable& page_table, VAddr base, u64 size, u8* memory, Pa                                   FlushMode::FlushAndInvalidate);      VAddr end = base + size; -    while (base != end) { -        ASSERT_MSG(base < page_table.pointers.size(), "out of range mapping at {:016X}", base); +    ASSERT_MSG(end <= page_table.pointers.size(), "out of range mapping at {:016X}", +               base + page_table.pointers.size()); -        page_table.attributes[base] = type; -        page_table.pointers[base] = memory; +    std::fill(page_table.attributes.begin() + base, page_table.attributes.begin() + end, type); -        base += 1; -        if (memory != nullptr) +    if (memory == nullptr) { +        std::fill(page_table.pointers.begin() + base, page_table.pointers.begin() + end, memory); +    } else { +        while (base != end) { +            page_table.pointers[base] = memory; + +            base += 1;              memory += PAGE_SIZE; +        }      }  } diff --git a/src/input_common/motion_emu.cpp b/src/input_common/motion_emu.cpp index 9570c060e..6d96d4019 100644 --- a/src/input_common/motion_emu.cpp +++ b/src/input_common/motion_emu.cpp @@ -32,12 +32,12 @@ public:      }      void BeginTilt(int x, int y) { -        mouse_origin = Math::MakeVec(x, y); +        mouse_origin = Common::MakeVec(x, y);          is_tilting = true;      }      void Tilt(int x, int y) { -        auto mouse_move = Math::MakeVec(x, y) - mouse_origin; +        auto mouse_move = Common::MakeVec(x, y) - mouse_origin;          if (is_tilting) {              std::lock_guard<std::mutex> guard(tilt_mutex);              if (mouse_move.x == 0 && mouse_move.y == 0) { @@ -45,7 +45,7 @@ public:              } else {                  tilt_direction = mouse_move.Cast<float>();                  tilt_angle = -                    std::clamp(tilt_direction.Normalize() * sensitivity, 0.0f, MathUtil::PI * 0.5f); +                    std::clamp(tilt_direction.Normalize() * sensitivity, 0.0f, Common::PI * 0.5f);              }          }      } @@ -56,7 +56,7 @@ public:          is_tilting = false;      } -    std::tuple<Math::Vec3<float>, Math::Vec3<float>> GetStatus() { +    std::tuple<Common::Vec3<float>, Common::Vec3<float>> GetStatus() {          std::lock_guard<std::mutex> guard(status_mutex);          return status;      } @@ -66,17 +66,17 @@ private:      const std::chrono::steady_clock::duration update_duration;      const float sensitivity; -    Math::Vec2<int> mouse_origin; +    Common::Vec2<int> mouse_origin;      std::mutex tilt_mutex; -    Math::Vec2<float> tilt_direction; +    Common::Vec2<float> tilt_direction;      float tilt_angle = 0;      bool is_tilting = false;      Common::Event shutdown_event; -    std::tuple<Math::Vec3<float>, Math::Vec3<float>> status; +    std::tuple<Common::Vec3<float>, Common::Vec3<float>> status;      std::mutex status_mutex;      // Note: always keep the thread declaration at the end so that other objects are initialized @@ -85,8 +85,8 @@ private:      void MotionEmuThread() {          auto update_time = std::chrono::steady_clock::now(); -        Math::Quaternion<float> q = MakeQuaternion(Math::Vec3<float>(), 0); -        Math::Quaternion<float> old_q; +        Common::Quaternion<float> q = Common::MakeQuaternion(Common::Vec3<float>(), 0); +        Common::Quaternion<float> old_q;          while (!shutdown_event.WaitUntil(update_time)) {              update_time += update_duration; @@ -96,18 +96,18 @@ private:                  std::lock_guard<std::mutex> guard(tilt_mutex);                  // Find the quaternion describing current 3DS tilting -                q = MakeQuaternion(Math::MakeVec(-tilt_direction.y, 0.0f, tilt_direction.x), -                                   tilt_angle); +                q = Common::MakeQuaternion( +                    Common::MakeVec(-tilt_direction.y, 0.0f, tilt_direction.x), tilt_angle);              }              auto inv_q = q.Inverse();              // Set the gravity vector in world space -            auto gravity = Math::MakeVec(0.0f, -1.0f, 0.0f); +            auto gravity = Common::MakeVec(0.0f, -1.0f, 0.0f);              // Find the angular rate vector in world space              auto angular_rate = ((q - old_q) * inv_q).xyz * 2; -            angular_rate *= 1000 / update_millisecond / MathUtil::PI * 180; +            angular_rate *= 1000 / update_millisecond / Common::PI * 180;              // Transform the two vectors from world space to 3DS space              gravity = QuaternionRotate(inv_q, gravity); @@ -131,7 +131,7 @@ public:          device = std::make_shared<MotionEmuDevice>(update_millisecond, sensitivity);      } -    std::tuple<Math::Vec3<float>, Math::Vec3<float>> GetStatus() const override { +    std::tuple<Common::Vec3<float>, Common::Vec3<float>> GetStatus() const override {          return device->GetStatus();      } diff --git a/src/video_core/engines/fermi_2d.cpp b/src/video_core/engines/fermi_2d.cpp index ec1a57226..540dcc52c 100644 --- a/src/video_core/engines/fermi_2d.cpp +++ b/src/video_core/engines/fermi_2d.cpp @@ -44,10 +44,10 @@ void Fermi2D::HandleSurfaceCopy() {      const u32 src_blit_y2{          static_cast<u32>((regs.blit_src_y + (regs.blit_dst_height * regs.blit_dv_dy)) >> 32)}; -    const MathUtil::Rectangle<u32> src_rect{src_blit_x1, src_blit_y1, src_blit_x2, src_blit_y2}; -    const MathUtil::Rectangle<u32> dst_rect{regs.blit_dst_x, regs.blit_dst_y, -                                            regs.blit_dst_x + regs.blit_dst_width, -                                            regs.blit_dst_y + regs.blit_dst_height}; +    const Common::Rectangle<u32> src_rect{src_blit_x1, src_blit_y1, src_blit_x2, src_blit_y2}; +    const Common::Rectangle<u32> dst_rect{regs.blit_dst_x, regs.blit_dst_y, +                                          regs.blit_dst_x + regs.blit_dst_width, +                                          regs.blit_dst_y + regs.blit_dst_height};      if (!rasterizer.AccelerateSurfaceCopy(regs.src, regs.dst, src_rect, dst_rect)) {          UNIMPLEMENTED(); diff --git a/src/video_core/engines/maxwell_3d.cpp b/src/video_core/engines/maxwell_3d.cpp index 2d2136067..144e7fa82 100644 --- a/src/video_core/engines/maxwell_3d.cpp +++ b/src/video_core/engines/maxwell_3d.cpp @@ -107,21 +107,23 @@ void Maxwell3D::CallMacroMethod(u32 method, std::vector<u32> parameters) {  void Maxwell3D::CallMethod(const GPU::MethodCall& method_call) {      auto debug_context = system.GetGPUDebugContext(); +    const u32 method = method_call.method; +      // It is an error to write to a register other than the current macro's ARG register before it      // has finished execution.      if (executing_macro != 0) { -        ASSERT(method_call.method == executing_macro + 1); +        ASSERT(method == executing_macro + 1);      }      // Methods after 0xE00 are special, they're actually triggers for some microcode that was      // uploaded to the GPU during initialization. -    if (method_call.method >= MacroRegistersStart) { +    if (method >= MacroRegistersStart) {          // We're trying to execute a macro          if (executing_macro == 0) {              // A macro call must begin by writing the macro method's register, not its argument. -            ASSERT_MSG((method_call.method % 2) == 0, +            ASSERT_MSG((method % 2) == 0,                         "Can't start macro execution by writing to the ARGS register"); -            executing_macro = method_call.method; +            executing_macro = method;          }          macro_params.push_back(method_call.argument); @@ -133,66 +135,62 @@ void Maxwell3D::CallMethod(const GPU::MethodCall& method_call) {          return;      } -    ASSERT_MSG(method_call.method < Regs::NUM_REGS, +    ASSERT_MSG(method < Regs::NUM_REGS,                 "Invalid Maxwell3D register, increase the size of the Regs structure");      if (debug_context) {          debug_context->OnEvent(Tegra::DebugContext::Event::MaxwellCommandLoaded, nullptr);      } -    if (regs.reg_array[method_call.method] != method_call.argument) { -        regs.reg_array[method_call.method] = method_call.argument; +    if (regs.reg_array[method] != method_call.argument) { +        regs.reg_array[method] = method_call.argument;          // Color buffers          constexpr u32 first_rt_reg = MAXWELL3D_REG_INDEX(rt);          constexpr u32 registers_per_rt = sizeof(regs.rt[0]) / sizeof(u32); -        if (method_call.method >= first_rt_reg && -            method_call.method < first_rt_reg + registers_per_rt * Regs::NumRenderTargets) { -            const std::size_t rt_index = (method_call.method - first_rt_reg) / registers_per_rt; -            dirty_flags.color_buffer |= 1u << static_cast<u32>(rt_index); +        if (method >= first_rt_reg && +            method < first_rt_reg + registers_per_rt * Regs::NumRenderTargets) { +            const std::size_t rt_index = (method - first_rt_reg) / registers_per_rt; +            dirty_flags.color_buffer.set(rt_index);          }          // Zeta buffer          constexpr u32 registers_in_zeta = sizeof(regs.zeta) / sizeof(u32); -        if (method_call.method == MAXWELL3D_REG_INDEX(zeta_enable) || -            method_call.method == MAXWELL3D_REG_INDEX(zeta_width) || -            method_call.method == MAXWELL3D_REG_INDEX(zeta_height) || -            (method_call.method >= MAXWELL3D_REG_INDEX(zeta) && -             method_call.method < MAXWELL3D_REG_INDEX(zeta) + registers_in_zeta)) { +        if (method == MAXWELL3D_REG_INDEX(zeta_enable) || +            method == MAXWELL3D_REG_INDEX(zeta_width) || +            method == MAXWELL3D_REG_INDEX(zeta_height) || +            (method >= MAXWELL3D_REG_INDEX(zeta) && +             method < MAXWELL3D_REG_INDEX(zeta) + registers_in_zeta)) {              dirty_flags.zeta_buffer = true;          }          // Shader          constexpr u32 shader_registers_count =              sizeof(regs.shader_config[0]) * Regs::MaxShaderProgram / sizeof(u32); -        if (method_call.method >= MAXWELL3D_REG_INDEX(shader_config[0]) && -            method_call.method < MAXWELL3D_REG_INDEX(shader_config[0]) + shader_registers_count) { +        if (method >= MAXWELL3D_REG_INDEX(shader_config[0]) && +            method < MAXWELL3D_REG_INDEX(shader_config[0]) + shader_registers_count) {              dirty_flags.shaders = true;          }          // Vertex format -        if (method_call.method >= MAXWELL3D_REG_INDEX(vertex_attrib_format) && -            method_call.method < -                MAXWELL3D_REG_INDEX(vertex_attrib_format) + regs.vertex_attrib_format.size()) { +        if (method >= MAXWELL3D_REG_INDEX(vertex_attrib_format) && +            method < MAXWELL3D_REG_INDEX(vertex_attrib_format) + regs.vertex_attrib_format.size()) {              dirty_flags.vertex_attrib_format = true;          }          // Vertex buffer -        if (method_call.method >= MAXWELL3D_REG_INDEX(vertex_array) && -            method_call.method < MAXWELL3D_REG_INDEX(vertex_array) + 4 * 32) { -            dirty_flags.vertex_array |= -                1u << ((method_call.method - MAXWELL3D_REG_INDEX(vertex_array)) >> 2); -        } else if (method_call.method >= MAXWELL3D_REG_INDEX(vertex_array_limit) && -                   method_call.method < MAXWELL3D_REG_INDEX(vertex_array_limit) + 2 * 32) { -            dirty_flags.vertex_array |= -                1u << ((method_call.method - MAXWELL3D_REG_INDEX(vertex_array_limit)) >> 1); -        } else if (method_call.method >= MAXWELL3D_REG_INDEX(instanced_arrays) && -                   method_call.method < MAXWELL3D_REG_INDEX(instanced_arrays) + 32) { -            dirty_flags.vertex_array |= -                1u << (method_call.method - MAXWELL3D_REG_INDEX(instanced_arrays)); +        if (method >= MAXWELL3D_REG_INDEX(vertex_array) && +            method < MAXWELL3D_REG_INDEX(vertex_array) + 4 * 32) { +            dirty_flags.vertex_array.set((method - MAXWELL3D_REG_INDEX(vertex_array)) >> 2); +        } else if (method >= MAXWELL3D_REG_INDEX(vertex_array_limit) && +                   method < MAXWELL3D_REG_INDEX(vertex_array_limit) + 2 * 32) { +            dirty_flags.vertex_array.set((method - MAXWELL3D_REG_INDEX(vertex_array_limit)) >> 1); +        } else if (method >= MAXWELL3D_REG_INDEX(instanced_arrays) && +                   method < MAXWELL3D_REG_INDEX(instanced_arrays) + 32) { +            dirty_flags.vertex_array.set(method - MAXWELL3D_REG_INDEX(instanced_arrays));          }      } -    switch (method_call.method) { +    switch (method) {      case MAXWELL3D_REG_INDEX(macros.data): {          ProcessMacroUpload(method_call.argument);          break; diff --git a/src/video_core/engines/maxwell_3d.h b/src/video_core/engines/maxwell_3d.h index 0e3873ffd..7fbf1026e 100644 --- a/src/video_core/engines/maxwell_3d.h +++ b/src/video_core/engines/maxwell_3d.h @@ -5,8 +5,10 @@  #pragma once  #include <array> +#include <bitset>  #include <unordered_map>  #include <vector> +  #include "common/assert.h"  #include "common/bit_field.h"  #include "common/common_funcs.h" @@ -503,7 +505,7 @@ public:              f32 translate_z;              INSERT_PADDING_WORDS(2); -            MathUtil::Rectangle<s32> GetRect() const { +            Common::Rectangle<s32> GetRect() const {                  return {                      GetX(),               // left                      GetY() + GetHeight(), // top @@ -1094,19 +1096,18 @@ public:      MemoryManager& memory_manager;      struct DirtyFlags { -        u8 color_buffer = 0xFF; -        bool zeta_buffer = true; - -        bool shaders = true; +        std::bitset<8> color_buffer{0xFF}; +        std::bitset<32> vertex_array{0xFFFFFFFF};          bool vertex_attrib_format = true; -        u32 vertex_array = 0xFFFFFFFF; +        bool zeta_buffer = true; +        bool shaders = true;          void OnMemoryWrite() { -            color_buffer = 0xFF;              zeta_buffer = true;              shaders = true; -            vertex_array = 0xFFFFFFFF; +            color_buffer.set(); +            vertex_array.set();          }      }; diff --git a/src/video_core/gpu.h b/src/video_core/gpu.h index 0f5bfdcbf..6313702f2 100644 --- a/src/video_core/gpu.h +++ b/src/video_core/gpu.h @@ -100,7 +100,7 @@ struct FramebufferConfig {      using TransformFlags = Service::NVFlinger::BufferQueue::BufferTransformFlags;      TransformFlags transform_flags; -    MathUtil::Rectangle<int> crop_rect; +    Common::Rectangle<int> crop_rect;  };  namespace Engines { diff --git a/src/video_core/rasterizer_interface.h b/src/video_core/rasterizer_interface.h index b2a223705..6a1dc9cf6 100644 --- a/src/video_core/rasterizer_interface.h +++ b/src/video_core/rasterizer_interface.h @@ -47,8 +47,8 @@ public:      /// Attempt to use a faster method to perform a surface copy      virtual bool AccelerateSurfaceCopy(const Tegra::Engines::Fermi2D::Regs::Surface& src,                                         const Tegra::Engines::Fermi2D::Regs::Surface& dst, -                                       const MathUtil::Rectangle<u32>& src_rect, -                                       const MathUtil::Rectangle<u32>& dst_rect) { +                                       const Common::Rectangle<u32>& src_rect, +                                       const Common::Rectangle<u32>& dst_rect) {          return false;      } diff --git a/src/video_core/renderer_opengl/gl_rasterizer.cpp b/src/video_core/renderer_opengl/gl_rasterizer.cpp index c1c88673d..523ed10fa 100644 --- a/src/video_core/renderer_opengl/gl_rasterizer.cpp +++ b/src/video_core/renderer_opengl/gl_rasterizer.cpp @@ -200,7 +200,7 @@ GLuint RasterizerOpenGL::SetupVertexFormat() {      }      // Rebinding the VAO invalidates the vertex buffer bindings. -    gpu.dirty_flags.vertex_array = 0xFFFFFFFF; +    gpu.dirty_flags.vertex_array.set();      state.draw.vertex_array = vao_entry.handle;      return vao_entry.handle; @@ -210,14 +210,14 @@ void RasterizerOpenGL::SetupVertexBuffer(GLuint vao) {      auto& gpu = Core::System::GetInstance().GPU().Maxwell3D();      const auto& regs = gpu.regs; -    if (!gpu.dirty_flags.vertex_array) +    if (gpu.dirty_flags.vertex_array.none())          return;      MICROPROFILE_SCOPE(OpenGL_VB);      // Upload all guest vertex arrays sequentially to our buffer      for (u32 index = 0; index < Maxwell::NumVertexArrays; ++index) { -        if (~gpu.dirty_flags.vertex_array & (1u << index)) +        if (!gpu.dirty_flags.vertex_array[index])              continue;          const auto& vertex_array = regs.vertex_array[index]; @@ -244,7 +244,7 @@ void RasterizerOpenGL::SetupVertexBuffer(GLuint vao) {          }      } -    gpu.dirty_flags.vertex_array = 0; +    gpu.dirty_flags.vertex_array.reset();  }  DrawParameters RasterizerOpenGL::SetupDraw() { @@ -488,13 +488,13 @@ std::pair<bool, bool> RasterizerOpenGL::ConfigureFramebuffers(      OpenGLState& current_state, bool using_color_fb, bool using_depth_fb, bool preserve_contents,      std::optional<std::size_t> single_color_target) {      MICROPROFILE_SCOPE(OpenGL_Framebuffer); -    const auto& gpu = Core::System::GetInstance().GPU().Maxwell3D(); +    auto& gpu = Core::System::GetInstance().GPU().Maxwell3D();      const auto& regs = gpu.regs;      const FramebufferConfigState fb_config_state{using_color_fb, using_depth_fb, preserve_contents,                                                   single_color_target}; -    if (fb_config_state == current_framebuffer_config_state && gpu.dirty_flags.color_buffer == 0 && -        !gpu.dirty_flags.zeta_buffer) { +    if (fb_config_state == current_framebuffer_config_state && +        gpu.dirty_flags.color_buffer.none() && !gpu.dirty_flags.zeta_buffer) {          // Only skip if the previous ConfigureFramebuffers call was from the same kind (multiple or          // single color targets). This is done because the guest registers may not change but the          // host framebuffer may contain different attachments @@ -721,10 +721,10 @@ void RasterizerOpenGL::DrawArrays() {      // Add space for at least 18 constant buffers      buffer_size += Maxwell::MaxConstBuffers * (MaxConstbufferSize + uniform_buffer_alignment); -    bool invalidate = buffer_cache.Map(buffer_size); +    const bool invalidate = buffer_cache.Map(buffer_size);      if (invalidate) {          // As all cached buffers are invalidated, we need to recheck their state. -        gpu.dirty_flags.vertex_array = 0xFFFFFFFF; +        gpu.dirty_flags.vertex_array.set();      }      const GLuint vao = SetupVertexFormat(); @@ -779,8 +779,8 @@ void RasterizerOpenGL::FlushAndInvalidateRegion(VAddr addr, u64 size) {  bool RasterizerOpenGL::AccelerateSurfaceCopy(const Tegra::Engines::Fermi2D::Regs::Surface& src,                                               const Tegra::Engines::Fermi2D::Regs::Surface& dst, -                                             const MathUtil::Rectangle<u32>& src_rect, -                                             const MathUtil::Rectangle<u32>& dst_rect) { +                                             const Common::Rectangle<u32>& src_rect, +                                             const Common::Rectangle<u32>& dst_rect) {      MICROPROFILE_SCOPE(OpenGL_Blits);      res_cache.FermiCopySurface(src, dst, src_rect, dst_rect);      return true; @@ -1034,7 +1034,7 @@ void RasterizerOpenGL::SyncViewport(OpenGLState& current_state) {      for (std::size_t i = 0; i < viewport_count; i++) {          auto& viewport = current_state.viewports[i];          const auto& src = regs.viewports[i]; -        const MathUtil::Rectangle<s32> viewport_rect{regs.viewport_transform[i].GetRect()}; +        const Common::Rectangle<s32> viewport_rect{regs.viewport_transform[i].GetRect()};          viewport.x = viewport_rect.left;          viewport.y = viewport_rect.bottom;          viewport.width = viewport_rect.GetWidth(); diff --git a/src/video_core/renderer_opengl/gl_rasterizer.h b/src/video_core/renderer_opengl/gl_rasterizer.h index 258d62259..2f0524f85 100644 --- a/src/video_core/renderer_opengl/gl_rasterizer.h +++ b/src/video_core/renderer_opengl/gl_rasterizer.h @@ -62,8 +62,8 @@ public:      void FlushAndInvalidateRegion(VAddr addr, u64 size) override;      bool AccelerateSurfaceCopy(const Tegra::Engines::Fermi2D::Regs::Surface& src,                                 const Tegra::Engines::Fermi2D::Regs::Surface& dst, -                               const MathUtil::Rectangle<u32>& src_rect, -                               const MathUtil::Rectangle<u32>& dst_rect) override; +                               const Common::Rectangle<u32>& src_rect, +                               const Common::Rectangle<u32>& dst_rect) override;      bool AccelerateDisplay(const Tegra::FramebufferConfig& config, VAddr framebuffer_addr,                             u32 pixel_stride) override;      bool AccelerateDrawBatch(bool is_indexed) override; diff --git a/src/video_core/renderer_opengl/gl_rasterizer_cache.cpp b/src/video_core/renderer_opengl/gl_rasterizer_cache.cpp index e6d47ce41..81b6099f9 100644 --- a/src/video_core/renderer_opengl/gl_rasterizer_cache.cpp +++ b/src/video_core/renderer_opengl/gl_rasterizer_cache.cpp @@ -399,7 +399,7 @@ static const FormatTuple& GetFormatTuple(PixelFormat pixel_format, ComponentType      return format;  } -MathUtil::Rectangle<u32> SurfaceParams::GetRect(u32 mip_level) const { +Common::Rectangle<u32> SurfaceParams::GetRect(u32 mip_level) const {      u32 actual_height{std::max(1U, unaligned_height >> mip_level)};      if (IsPixelFormatASTC(pixel_format)) {          // ASTC formats must stop at the ATSC block size boundary @@ -962,10 +962,10 @@ Surface RasterizerCacheOpenGL::GetColorBufferSurface(std::size_t index, bool pre      auto& gpu{Core::System::GetInstance().GPU().Maxwell3D()};      const auto& regs{gpu.regs}; -    if ((gpu.dirty_flags.color_buffer & (1u << static_cast<u32>(index))) == 0) { +    if (!gpu.dirty_flags.color_buffer[index]) {          return last_color_buffers[index];      } -    gpu.dirty_flags.color_buffer &= ~(1u << static_cast<u32>(index)); +    gpu.dirty_flags.color_buffer.reset(index);      ASSERT(index < Tegra::Engines::Maxwell3D::Regs::NumRenderTargets); @@ -1062,8 +1062,8 @@ void RasterizerCacheOpenGL::FastLayeredCopySurface(const Surface& src_surface,  }  static bool BlitSurface(const Surface& src_surface, const Surface& dst_surface, -                        const MathUtil::Rectangle<u32>& src_rect, -                        const MathUtil::Rectangle<u32>& dst_rect, GLuint read_fb_handle, +                        const Common::Rectangle<u32>& src_rect, +                        const Common::Rectangle<u32>& dst_rect, GLuint read_fb_handle,                          GLuint draw_fb_handle, GLenum src_attachment = 0, GLenum dst_attachment = 0,                          std::size_t cubemap_face = 0) { @@ -1193,7 +1193,7 @@ static bool BlitSurface(const Surface& src_surface, const Surface& dst_surface,  void RasterizerCacheOpenGL::FermiCopySurface(      const Tegra::Engines::Fermi2D::Regs::Surface& src_config,      const Tegra::Engines::Fermi2D::Regs::Surface& dst_config, -    const MathUtil::Rectangle<u32>& src_rect, const MathUtil::Rectangle<u32>& dst_rect) { +    const Common::Rectangle<u32>& src_rect, const Common::Rectangle<u32>& dst_rect) {      const auto& src_params = SurfaceParams::CreateForFermiCopySurface(src_config);      const auto& dst_params = SurfaceParams::CreateForFermiCopySurface(dst_config); diff --git a/src/video_core/renderer_opengl/gl_rasterizer_cache.h b/src/video_core/renderer_opengl/gl_rasterizer_cache.h index 89d733c50..838554c35 100644 --- a/src/video_core/renderer_opengl/gl_rasterizer_cache.h +++ b/src/video_core/renderer_opengl/gl_rasterizer_cache.h @@ -28,7 +28,7 @@ namespace OpenGL {  class CachedSurface;  using Surface = std::shared_ptr<CachedSurface>; -using SurfaceSurfaceRect_Tuple = std::tuple<Surface, Surface, MathUtil::Rectangle<u32>>; +using SurfaceSurfaceRect_Tuple = std::tuple<Surface, Surface, Common::Rectangle<u32>>;  using SurfaceTarget = VideoCore::Surface::SurfaceTarget;  using SurfaceType = VideoCore::Surface::SurfaceType; @@ -71,7 +71,7 @@ struct SurfaceParams {      }      /// Returns the rectangle corresponding to this surface -    MathUtil::Rectangle<u32> GetRect(u32 mip_level = 0) const; +    Common::Rectangle<u32> GetRect(u32 mip_level = 0) const;      /// Returns the total size of this surface in bytes, adjusted for compression      std::size_t SizeInBytesRaw(bool ignore_tiled = false) const { @@ -430,8 +430,8 @@ public:      /// Copies the contents of one surface to another      void FermiCopySurface(const Tegra::Engines::Fermi2D::Regs::Surface& src_config,                            const Tegra::Engines::Fermi2D::Regs::Surface& dst_config, -                          const MathUtil::Rectangle<u32>& src_rect, -                          const MathUtil::Rectangle<u32>& dst_rect); +                          const Common::Rectangle<u32>& src_rect, +                          const Common::Rectangle<u32>& dst_rect);  private:      void LoadSurface(const Surface& surface); diff --git a/src/video_core/renderer_opengl/gl_shader_disk_cache.cpp b/src/video_core/renderer_opengl/gl_shader_disk_cache.cpp index 81882822b..82fc4d44b 100644 --- a/src/video_core/renderer_opengl/gl_shader_disk_cache.cpp +++ b/src/video_core/renderer_opengl/gl_shader_disk_cache.cpp @@ -2,8 +2,6 @@  // Licensed under GPLv2 or any later version  // Refer to the license.txt file included. -#pragma once -  #include <cstring>  #include <fmt/format.h>  #include <lz4.h> diff --git a/src/video_core/renderer_opengl/renderer_opengl.h b/src/video_core/renderer_opengl/renderer_opengl.h index 7e13e566b..c168fa89e 100644 --- a/src/video_core/renderer_opengl/renderer_opengl.h +++ b/src/video_core/renderer_opengl/renderer_opengl.h @@ -39,7 +39,7 @@ struct TextureInfo {  /// Structure used for storing information about the display target for the Switch screen  struct ScreenInfo {      GLuint display_texture; -    const MathUtil::Rectangle<float> display_texcoords{0.0f, 0.0f, 1.0f, 1.0f}; +    const Common::Rectangle<float> display_texcoords{0.0f, 0.0f, 1.0f, 1.0f};      TextureInfo texture;  }; @@ -102,7 +102,7 @@ private:      /// Used for transforming the framebuffer orientation      Tegra::FramebufferConfig::TransformFlags framebuffer_transform_flags; -    MathUtil::Rectangle<int> framebuffer_crop_rect; +    Common::Rectangle<int> framebuffer_crop_rect;  };  } // namespace OpenGL diff --git a/src/yuzu/debugger/graphics/graphics_surface.cpp b/src/yuzu/debugger/graphics/graphics_surface.cpp index 209798521..71683da8e 100644 --- a/src/yuzu/debugger/graphics/graphics_surface.cpp +++ b/src/yuzu/debugger/graphics/graphics_surface.cpp @@ -398,7 +398,7 @@ void GraphicsSurfaceWidget::OnUpdate() {      for (unsigned int y = 0; y < surface_height; ++y) {          for (unsigned int x = 0; x < surface_width; ++x) { -            Math::Vec4<u8> color; +            Common::Vec4<u8> color;              color[0] = texture_data[x + y * surface_width + 0];              color[1] = texture_data[x + y * surface_width + 1];              color[2] = texture_data[x + y * surface_width + 2]; | 
