// Copyright 2015 Citra Emulator Project // Licensed under GPLv2 or any later version // Refer to the license.txt file included. #pragma once #include #include #include #include #include #ifdef __GNUC__ #pragma GCC diagnostic push #pragma GCC diagnostic ignored "-Wunused-local-typedefs" #endif #include #include #ifdef __GNUC__ #pragma GCC diagnostic pop #endif #include #include #include #include "common/assert.h" #include "common/common_funcs.h" #include "common/common_types.h" #include "common/math_util.h" #include "core/hw/gpu.h" #include "video_core/regs_framebuffer.h" #include "video_core/regs_texturing.h" #include "video_core/renderer_opengl/gl_resource_manager.h" #include "video_core/texture/texture_decode.h" namespace OpenGL { struct TextureCubeConfig { PAddr px; PAddr nx; PAddr py; PAddr ny; PAddr pz; PAddr nz; u32 width; Pica::TexturingRegs::TextureFormat format; bool operator==(const TextureCubeConfig& rhs) const { return std::tie(px, nx, py, ny, pz, nz, width, format) == std::tie(rhs.px, rhs.nx, rhs.py, rhs.ny, rhs.pz, rhs.nz, rhs.width, rhs.format); } bool operator!=(const TextureCubeConfig& rhs) const { return !(*this == rhs); } }; } // namespace OpenGL namespace std { template <> struct hash { std::size_t operator()(const OpenGL::TextureCubeConfig& config) const { std::size_t hash = 0; boost::hash_combine(hash, config.px); boost::hash_combine(hash, config.nx); boost::hash_combine(hash, config.py); boost::hash_combine(hash, config.ny); boost::hash_combine(hash, config.pz); boost::hash_combine(hash, config.nz); boost::hash_combine(hash, config.width); boost::hash_combine(hash, static_cast(config.format)); return hash; } }; } // namespace std namespace OpenGL { struct CachedSurface; using Surface = std::shared_ptr; using SurfaceSet = std::set; using SurfaceRegions = boost::icl::interval_set; using SurfaceMap = boost::icl::interval_map; using SurfaceCache = boost::icl::interval_map; using SurfaceInterval = SurfaceCache::interval_type; static_assert(std::is_same() && std::is_same(), "incorrect interval types"); using SurfaceRect_Tuple = std::tuple>; using SurfaceSurfaceRect_Tuple = std::tuple>; using PageMap = boost::icl::interval_map; enum class ScaleMatch { Exact, // only accept same res scale Upscale, // only allow higher scale than params Ignore // accept every scaled res }; struct SurfaceParams { enum class PixelFormat { // First 5 formats are shared between textures and color buffers RGBA8 = 0, RGB8 = 1, RGB5A1 = 2, RGB565 = 3, RGBA4 = 4, // Texture-only formats IA8 = 5, RG8 = 6, I8 = 7, A8 = 8, IA4 = 9, I4 = 10, A4 = 11, ETC1 = 12, ETC1A4 = 13, // Depth buffer-only formats D16 = 14, // gap D24 = 16, D24S8 = 17, Invalid = 255, }; enum class SurfaceType { Color = 0, Texture = 1, Depth = 2, DepthStencil = 3, Fill = 4, Invalid = 5 }; static constexpr unsigned int GetFormatBpp(PixelFormat format) { constexpr std::array bpp_table = { 32, // RGBA8 24, // RGB8 16, // RGB5A1 16, // RGB565 16, // RGBA4 16, // IA8 16, // RG8 8, // I8 8, // A8 8, // IA4 4, // I4 4, // A4 4, // ETC1 8, // ETC1A4 16, // D16 0, 24, // D24 32, // D24S8 }; assert(static_cast(format) < bpp_table.size()); return bpp_table[static_cast(format)]; } unsigned int GetFormatBpp() const { return GetFormatBpp(pixel_format); } static PixelFormat PixelFormatFromTextureFormat(Pica::TexturingRegs::TextureFormat format) { return ((unsigned int)format < 14) ? (PixelFormat)format : PixelFormat::Invalid; } static PixelFormat PixelFormatFromColorFormat(Pica::FramebufferRegs::ColorFormat format) { return ((unsigned int)format < 5) ? (PixelFormat)format : PixelFormat::Invalid; } static PixelFormat PixelFormatFromDepthFormat(Pica::FramebufferRegs::DepthFormat format) { return ((unsigned int)format < 4) ? (PixelFormat)((unsigned int)format + 14) : PixelFormat::Invalid; } static PixelFormat PixelFormatFromGPUPixelFormat(GPU::Regs::PixelFormat format) { switch (format) { // RGB565 and RGB5A1 are switched in PixelFormat compared to ColorFormat case GPU::Regs::PixelFormat::RGB565: return PixelFormat::RGB565; case GPU::Regs::PixelFormat::RGB5A1: return PixelFormat::RGB5A1; default: return ((unsigned int)format < 5) ? (PixelFormat)format : PixelFormat::Invalid; } } static bool CheckFormatsBlittable(PixelFormat pixel_format_a, PixelFormat pixel_format_b) { SurfaceType a_type = GetFormatType(pixel_format_a); SurfaceType b_type = GetFormatType(pixel_format_b); if ((a_type == SurfaceType::Color || a_type == SurfaceType::Texture) && (b_type == SurfaceType::Color || b_type == SurfaceType::Texture)) { return true; } if (a_type == SurfaceType::Depth && b_type == SurfaceType::Depth) { return true; } if (a_type == SurfaceType::DepthStencil && b_type == SurfaceType::DepthStencil) { return true; } return false; } static constexpr SurfaceType GetFormatType(PixelFormat pixel_format) { if ((unsigned int)pixel_format < 5) { return SurfaceType::Color; } if ((unsigned int)pixel_format < 14) { return SurfaceType::Texture; } if (pixel_format == PixelFormat::D16 || pixel_format == PixelFormat::D24) { return SurfaceType::Depth; } if (pixel_format == PixelFormat::D24S8) { return SurfaceType::DepthStencil; } return SurfaceType::Invalid; } /// Update the params "size", "end" and "type" from the already set "addr", "width", "height" /// and "pixel_format" void UpdateParams() { if (stride == 0) { stride = width; } type = GetFormatType(pixel_format); size = !is_tiled ? BytesInPixels(stride * (height - 1) + width) : BytesInPixels(stride * 8 * (height / 8 - 1) + width * 8); end = addr + size; } SurfaceInterval GetInterval() const { return SurfaceInterval::right_open(addr, end); } // Returns the outer rectangle containing "interval" SurfaceParams FromInterval(SurfaceInterval interval) const; SurfaceInterval GetSubRectInterval(MathUtil::Rectangle unscaled_rect) const; // Returns the region of the biggest valid rectange within interval SurfaceInterval GetCopyableInterval(const Surface& src_surface) const; u32 GetScaledWidth() const { return width * res_scale; } u32 GetScaledHeight() const { return height * res_scale; } MathUtil::Rectangle GetRect() const { return {0, height, width, 0}; } MathUtil::Rectangle GetScaledRect() const { return {0, GetScaledHeight(), GetScaledWidth(), 0}; } u32 PixelsInBytes(u32 size) const { return size * CHAR_BIT / GetFormatBpp(pixel_format); } u32 BytesInPixels(u32 pixels) const { return pixels * GetFormatBpp(pixel_format) / CHAR_BIT; } bool ExactMatch(const SurfaceParams& other_surface) const; bool CanSubRect(const SurfaceParams& sub_surface) const; bool CanExpand(const SurfaceParams& expanded_surface) const; bool CanTexCopy(const SurfaceParams& texcopy_params) const; MathUtil::Rectangle GetSubRect(const SurfaceParams& sub_surface) const; MathUtil::Rectangle GetScaledSubRect(const SurfaceParams& sub_surface) const; PAddr addr = 0; PAddr end = 0; u32 size = 0; u32 width = 0; u32 height = 0; u32 stride = 0; u16 res_scale = 1; bool is_tiled = false; PixelFormat pixel_format = PixelFormat::Invalid; SurfaceType type = SurfaceType::Invalid; }; /** * A watcher that notifies whether a cached surface has been changed. This is useful for caching * surface collection objects, including texture cube and mipmap. */ struct SurfaceWatcher { public: explicit SurfaceWatcher(std::weak_ptr&& surface) : surface(std::move(surface)) {} /** * Checks whether the surface has been changed. * @return false if the surface content has been changed since last Validate() call or has been * destroyed; otherwise true */ bool IsValid() const { return !surface.expired() && valid; } /// Marks that the content of the referencing surface has been updated to the watcher user. void Validate() { ASSERT(!surface.expired()); valid = true; } /// Gets the referencing surface. Returns null if the surface has been destroyed Surface Get() const { return surface.lock(); } private: friend struct CachedSurface; std::weak_ptr surface; bool valid = false; }; struct CachedSurface : SurfaceParams, std::enable_shared_from_this { bool CanFill(const SurfaceParams& dest_surface, SurfaceInterval fill_interval) const; bool CanCopy(const SurfaceParams& dest_surface, SurfaceInterval copy_interval) const; bool IsRegionValid(SurfaceInterval interval) const { return (invalid_regions.find(interval) == invalid_regions.end()); } bool IsSurfaceFullyInvalid() const { return (invalid_regions & GetInterval()) == SurfaceRegions(GetInterval()); } bool registered = false; SurfaceRegions invalid_regions; u32 fill_size = 0; /// Number of bytes to read from fill_data std::array fill_data; OGLTexture texture; static constexpr unsigned int GetGLBytesPerPixel(PixelFormat format) { // OpenGL needs 4 bpp alignment for D24 since using GL_UNSIGNED_INT as type return format == PixelFormat::Invalid ? 0 : (format == PixelFormat::D24 || GetFormatType(format) == SurfaceType::Texture) ? 4 : SurfaceParams::GetFormatBpp(format) / 8; } std::unique_ptr gl_buffer; std::size_t gl_buffer_size = 0; // Read/Write data in 3DS memory to/from gl_buffer void LoadGLBuffer(PAddr load_start, PAddr load_end); void FlushGLBuffer(PAddr flush_start, PAddr flush_end); // Upload/Download data in gl_buffer in/to this surface's texture void UploadGLTexture(const MathUtil::Rectangle& rect, GLuint read_fb_handle, GLuint draw_fb_handle); void DownloadGLTexture(const MathUtil::Rectangle& rect, GLuint read_fb_handle, GLuint draw_fb_handle); std::shared_ptr CreateWatcher() { auto watcher = std::make_shared(weak_from_this()); watchers.push_front(watcher); return watcher; } void InvalidateAllWatcher() { for (const auto& watcher : watchers) { if (auto locked = watcher.lock()) { locked->valid = false; } } } private: std::list> watchers; }; struct CachedTextureCube { OGLTexture texture; u16 res_scale = 1; std::shared_ptr px; std::shared_ptr nx; std::shared_ptr py; std::shared_ptr ny; std::shared_ptr pz; std::shared_ptr nz; }; class RasterizerCacheOpenGL : NonCopyable { public: RasterizerCacheOpenGL(); ~RasterizerCacheOpenGL(); /// Blit one surface's texture to another bool BlitSurfaces(const Surface& src_surface, const MathUtil::Rectangle& src_rect, const Surface& dst_surface, const MathUtil::Rectangle& dst_rect); void ConvertD24S8toABGR(GLuint src_tex, const MathUtil::Rectangle& src_rect, GLuint dst_tex, const MathUtil::Rectangle& dst_rect); /// Copy one surface's region to another void CopySurface(const Surface& src_surface, const Surface& dst_surface, SurfaceInterval copy_interval); /// Load a texture from 3DS memory to OpenGL and cache it (if not already cached) Surface GetSurface(const SurfaceParams& params, ScaleMatch match_res_scale, bool load_if_create); /// Attempt to find a subrect (resolution scaled) of a surface, otherwise loads a texture from /// 3DS memory to OpenGL and caches it (if not already cached) SurfaceRect_Tuple GetSurfaceSubRect(const SurfaceParams& params, ScaleMatch match_res_scale, bool load_if_create); /// Get a surface based on the texture configuration Surface GetTextureSurface(const Pica::TexturingRegs::FullTextureConfig& config); Surface GetTextureSurface(const Pica::Texture::TextureInfo& info); /// Get a texture cube based on the texture configuration const CachedTextureCube& GetTextureCube(const TextureCubeConfig& config); /// Get the color and depth surfaces based on the framebuffer configuration SurfaceSurfaceRect_Tuple GetFramebufferSurfaces(bool using_color_fb, bool using_depth_fb, const MathUtil::Rectangle& viewport_rect); /// Get a surface that matches the fill config Surface GetFillSurface(const GPU::Regs::MemoryFillConfig& config); /// Get a surface that matches a "texture copy" display transfer config SurfaceRect_Tuple GetTexCopySurface(const SurfaceParams& params); /// Write any cached resources overlapping the region back to memory (if dirty) void FlushRegion(PAddr addr, u32 size, Surface flush_surface = nullptr); /// Mark region as being invalidated by region_owner (nullptr if 3DS memory) void InvalidateRegion(PAddr addr, u32 size, const Surface& region_owner); /// Flush all cached resources tracked by this cache manager void FlushAll(); private: void DuplicateSurface(const Surface& src_surface, const Surface& dest_surface); /// Update surface's texture for given region when necessary void ValidateSurface(const Surface& surface, PAddr addr, u32 size); /// Create a new surface Surface CreateSurface(const SurfaceParams& params); /// Register surface into the cache void RegisterSurface(const Surface& surface); /// Remove surface from the cache void UnregisterSurface(const Surface& surface); /// Increase/decrease the number of surface in pages touching the specified region void UpdatePagesCachedCount(PAddr addr, u32 size, int delta); SurfaceCache surface_cache; PageMap cached_pages; SurfaceMap dirty_regions; SurfaceSet remove_surfaces; OGLFramebuffer read_framebuffer; OGLFramebuffer draw_framebuffer; OGLVertexArray attributeless_vao; OGLBuffer d24s8_abgr_buffer; GLsizeiptr d24s8_abgr_buffer_size; OGLProgram d24s8_abgr_shader; GLint d24s8_abgr_tbo_size_u_id; GLint d24s8_abgr_viewport_u_id; std::unordered_map texture_cube_cache; }; } // namespace OpenGL