video_core: Add BCn decoding support
This commit is contained in:
parent
b8c96cee5f
commit
eac46ad7ce
16 changed files with 1789 additions and 120 deletions
3
externals/CMakeLists.txt
vendored
3
externals/CMakeLists.txt
vendored
|
@ -157,6 +157,9 @@ endif()
|
||||||
add_library(stb stb/stb_dxt.cpp)
|
add_library(stb stb/stb_dxt.cpp)
|
||||||
target_include_directories(stb PUBLIC ./stb)
|
target_include_directories(stb PUBLIC ./stb)
|
||||||
|
|
||||||
|
add_library(bc_decoder bc_decoder/bc_decoder.cpp)
|
||||||
|
target_include_directories(bc_decoder PUBLIC ./bc_decoder)
|
||||||
|
|
||||||
if (ANDROID)
|
if (ANDROID)
|
||||||
if (ARCHITECTURE_arm64)
|
if (ARCHITECTURE_arm64)
|
||||||
add_subdirectory(libadrenotools)
|
add_subdirectory(libadrenotools)
|
||||||
|
|
1522
externals/bc_decoder/bc_decoder.cpp
vendored
Normal file
1522
externals/bc_decoder/bc_decoder.cpp
vendored
Normal file
File diff suppressed because it is too large
Load diff
43
externals/bc_decoder/bc_decoder.h
vendored
Normal file
43
externals/bc_decoder/bc_decoder.h
vendored
Normal file
|
@ -0,0 +1,43 @@
|
||||||
|
// SPDX-License-Identifier: MPL-2.0
|
||||||
|
// Copyright © 2022 Skyline Team and Contributors (https://github.com/skyline-emu/)
|
||||||
|
|
||||||
|
#pragma once
|
||||||
|
|
||||||
|
#include <cstdint>
|
||||||
|
|
||||||
|
namespace bcn {
|
||||||
|
/**
|
||||||
|
* @brief Decodes a BC1 encoded image to R8G8B8A8
|
||||||
|
*/
|
||||||
|
void DecodeBc1(const uint8_t *src, uint8_t *dst, size_t x, size_t y, size_t width, size_t height);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief Decodes a BC2 encoded image to R8G8B8A8
|
||||||
|
*/
|
||||||
|
void DecodeBc2(const uint8_t *src, uint8_t *dst, size_t x, size_t y, size_t width, size_t height);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief Decodes a BC3 encoded image to R8G8B8A8
|
||||||
|
*/
|
||||||
|
void DecodeBc3(const uint8_t *src, uint8_t *dst, size_t x, size_t y, size_t width, size_t height);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief Decodes a BC4 encoded image to R8
|
||||||
|
*/
|
||||||
|
void DecodeBc4(const uint8_t *src, uint8_t *dst, size_t x, size_t y, size_t width, size_t height, bool isSigned);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief Decodes a BC5 encoded image to R8G8
|
||||||
|
*/
|
||||||
|
void DecodeBc5(const uint8_t *src, uint8_t *dst, size_t x, size_t y, size_t width, size_t height, bool isSigned);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief Decodes a BC6 encoded image to R16G16B16A16
|
||||||
|
*/
|
||||||
|
void DecodeBc6(const uint8_t *src, uint8_t *dst, size_t x, size_t y, size_t width, size_t height, bool isSigned);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief Decodes a BC7 encoded image to R8G8B8A8
|
||||||
|
*/
|
||||||
|
void DecodeBc7(const uint8_t *src, uint8_t *dst, size_t x, size_t y, size_t width, size_t height);
|
||||||
|
}
|
|
@ -220,8 +220,8 @@ add_library(video_core STATIC
|
||||||
surface.h
|
surface.h
|
||||||
texture_cache/accelerated_swizzle.cpp
|
texture_cache/accelerated_swizzle.cpp
|
||||||
texture_cache/accelerated_swizzle.h
|
texture_cache/accelerated_swizzle.h
|
||||||
texture_cache/decode_bc4.cpp
|
texture_cache/decode_bc.cpp
|
||||||
texture_cache/decode_bc4.h
|
texture_cache/decode_bc.h
|
||||||
texture_cache/descriptor_table.h
|
texture_cache/descriptor_table.h
|
||||||
texture_cache/formatter.cpp
|
texture_cache/formatter.cpp
|
||||||
texture_cache/formatter.h
|
texture_cache/formatter.h
|
||||||
|
@ -279,7 +279,7 @@ add_library(video_core STATIC
|
||||||
create_target_directory_groups(video_core)
|
create_target_directory_groups(video_core)
|
||||||
|
|
||||||
target_link_libraries(video_core PUBLIC common core)
|
target_link_libraries(video_core PUBLIC common core)
|
||||||
target_link_libraries(video_core PUBLIC glad shader_recompiler stb)
|
target_link_libraries(video_core PUBLIC glad shader_recompiler stb bc_decoder)
|
||||||
|
|
||||||
if (YUZU_USE_BUNDLED_FFMPEG AND NOT (WIN32 OR ANDROID))
|
if (YUZU_USE_BUNDLED_FFMPEG AND NOT (WIN32 OR ANDROID))
|
||||||
add_dependencies(video_core ffmpeg-build)
|
add_dependencies(video_core ffmpeg-build)
|
||||||
|
|
|
@ -259,6 +259,26 @@ FormatInfo SurfaceFormat(const Device& device, FormatType format_type, bool with
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
// Transcode on hardware that doesn't support BCn natively
|
||||||
|
if (!device.IsOptimalBcnSupported() && VideoCore::Surface::IsPixelFormatBCn(pixel_format)) {
|
||||||
|
const bool is_srgb = with_srgb && VideoCore::Surface::IsPixelFormatSRGB(pixel_format);
|
||||||
|
if (pixel_format == PixelFormat::BC4_SNORM) {
|
||||||
|
tuple.format = VK_FORMAT_R8_SNORM;
|
||||||
|
} else if (pixel_format == PixelFormat::BC4_UNORM) {
|
||||||
|
tuple.format = VK_FORMAT_R8_UNORM;
|
||||||
|
} else if (pixel_format == PixelFormat::BC5_SNORM) {
|
||||||
|
tuple.format = VK_FORMAT_R8G8_SNORM;
|
||||||
|
} else if (pixel_format == PixelFormat::BC5_UNORM) {
|
||||||
|
tuple.format = VK_FORMAT_R8G8_UNORM;
|
||||||
|
} else if (pixel_format == PixelFormat::BC6H_SFLOAT ||
|
||||||
|
pixel_format == PixelFormat::BC6H_UFLOAT) {
|
||||||
|
tuple.format = VK_FORMAT_R16G16B16A16_SFLOAT;
|
||||||
|
} else if (is_srgb) {
|
||||||
|
tuple.format = VK_FORMAT_A8B8G8R8_SRGB_PACK32;
|
||||||
|
} else {
|
||||||
|
tuple.format = VK_FORMAT_A8B8G8R8_UNORM_PACK32;
|
||||||
|
}
|
||||||
|
}
|
||||||
const bool attachable = (tuple.usage & Attachable) != 0;
|
const bool attachable = (tuple.usage & Attachable) != 0;
|
||||||
const bool storage = (tuple.usage & Storage) != 0;
|
const bool storage = (tuple.usage & Storage) != 0;
|
||||||
|
|
||||||
|
|
|
@ -315,7 +315,14 @@ void RasterizerVulkan::Clear(u32 layer_count) {
|
||||||
FlushWork();
|
FlushWork();
|
||||||
gpu_memory->FlushCaching();
|
gpu_memory->FlushCaching();
|
||||||
|
|
||||||
|
#if ANDROID
|
||||||
|
if (Settings::IsGPULevelHigh()) {
|
||||||
|
// This is problematic on Android, disable on GPU Normal.
|
||||||
query_cache.UpdateCounters();
|
query_cache.UpdateCounters();
|
||||||
|
}
|
||||||
|
#else
|
||||||
|
query_cache.UpdateCounters();
|
||||||
|
#endif
|
||||||
|
|
||||||
auto& regs = maxwell3d->regs;
|
auto& regs = maxwell3d->regs;
|
||||||
const bool use_color = regs.clear_surface.R || regs.clear_surface.G || regs.clear_surface.B ||
|
const bool use_color = regs.clear_surface.R || regs.clear_surface.G || regs.clear_surface.B ||
|
||||||
|
|
|
@ -1279,6 +1279,10 @@ Image::Image(TextureCacheRuntime& runtime_, const ImageInfo& info_, GPUVAddr gpu
|
||||||
flags |= VideoCommon::ImageFlagBits::Converted;
|
flags |= VideoCommon::ImageFlagBits::Converted;
|
||||||
flags |= VideoCommon::ImageFlagBits::CostlyLoad;
|
flags |= VideoCommon::ImageFlagBits::CostlyLoad;
|
||||||
}
|
}
|
||||||
|
if (IsPixelFormatBCn(info.format) && !runtime->device.IsOptimalBcnSupported()) {
|
||||||
|
flags |= VideoCommon::ImageFlagBits::Converted;
|
||||||
|
flags |= VideoCommon::ImageFlagBits::CostlyLoad;
|
||||||
|
}
|
||||||
if (runtime->device.HasDebuggingToolAttached()) {
|
if (runtime->device.HasDebuggingToolAttached()) {
|
||||||
original_image.SetObjectNameEXT(VideoCommon::Name(*this).c_str());
|
original_image.SetObjectNameEXT(VideoCommon::Name(*this).c_str());
|
||||||
}
|
}
|
||||||
|
|
|
@ -269,6 +269,28 @@ bool IsPixelFormatASTC(PixelFormat format) {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool IsPixelFormatBCn(PixelFormat format) {
|
||||||
|
switch (format) {
|
||||||
|
case PixelFormat::BC1_RGBA_UNORM:
|
||||||
|
case PixelFormat::BC2_UNORM:
|
||||||
|
case PixelFormat::BC3_UNORM:
|
||||||
|
case PixelFormat::BC4_UNORM:
|
||||||
|
case PixelFormat::BC4_SNORM:
|
||||||
|
case PixelFormat::BC5_UNORM:
|
||||||
|
case PixelFormat::BC5_SNORM:
|
||||||
|
case PixelFormat::BC1_RGBA_SRGB:
|
||||||
|
case PixelFormat::BC2_SRGB:
|
||||||
|
case PixelFormat::BC3_SRGB:
|
||||||
|
case PixelFormat::BC7_UNORM:
|
||||||
|
case PixelFormat::BC6H_UFLOAT:
|
||||||
|
case PixelFormat::BC6H_SFLOAT:
|
||||||
|
case PixelFormat::BC7_SRGB:
|
||||||
|
return true;
|
||||||
|
default:
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
bool IsPixelFormatSRGB(PixelFormat format) {
|
bool IsPixelFormatSRGB(PixelFormat format) {
|
||||||
switch (format) {
|
switch (format) {
|
||||||
case PixelFormat::A8B8G8R8_SRGB:
|
case PixelFormat::A8B8G8R8_SRGB:
|
||||||
|
|
|
@ -501,6 +501,8 @@ SurfaceType GetFormatType(PixelFormat pixel_format);
|
||||||
|
|
||||||
bool IsPixelFormatASTC(PixelFormat format);
|
bool IsPixelFormatASTC(PixelFormat format);
|
||||||
|
|
||||||
|
bool IsPixelFormatBCn(PixelFormat format);
|
||||||
|
|
||||||
bool IsPixelFormatSRGB(PixelFormat format);
|
bool IsPixelFormatSRGB(PixelFormat format);
|
||||||
|
|
||||||
bool IsPixelFormatInteger(PixelFormat format);
|
bool IsPixelFormatInteger(PixelFormat format);
|
||||||
|
|
129
src/video_core/texture_cache/decode_bc.cpp
Normal file
129
src/video_core/texture_cache/decode_bc.cpp
Normal file
|
@ -0,0 +1,129 @@
|
||||||
|
// SPDX-FileCopyrightText: Copyright 2020 yuzu Emulator Project
|
||||||
|
// SPDX-License-Identifier: GPL-2.0-or-later
|
||||||
|
|
||||||
|
#include <algorithm>
|
||||||
|
#include <array>
|
||||||
|
#include <span>
|
||||||
|
#include <bc_decoder.h>
|
||||||
|
|
||||||
|
#include "common/common_types.h"
|
||||||
|
#include "video_core/texture_cache/decode_bc.h"
|
||||||
|
|
||||||
|
namespace VideoCommon {
|
||||||
|
|
||||||
|
namespace {
|
||||||
|
constexpr u32 BLOCK_SIZE = 4;
|
||||||
|
|
||||||
|
using VideoCore::Surface::PixelFormat;
|
||||||
|
|
||||||
|
constexpr bool IsSigned(PixelFormat pixel_format) {
|
||||||
|
switch (pixel_format) {
|
||||||
|
case PixelFormat::BC4_SNORM:
|
||||||
|
case PixelFormat::BC4_UNORM:
|
||||||
|
case PixelFormat::BC5_SNORM:
|
||||||
|
case PixelFormat::BC5_UNORM:
|
||||||
|
case PixelFormat::BC6H_SFLOAT:
|
||||||
|
case PixelFormat::BC6H_UFLOAT:
|
||||||
|
return true;
|
||||||
|
default:
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
constexpr u32 BlockSize(PixelFormat pixel_format) {
|
||||||
|
switch (pixel_format) {
|
||||||
|
case PixelFormat::BC1_RGBA_SRGB:
|
||||||
|
case PixelFormat::BC1_RGBA_UNORM:
|
||||||
|
case PixelFormat::BC4_SNORM:
|
||||||
|
case PixelFormat::BC4_UNORM:
|
||||||
|
return 8;
|
||||||
|
default:
|
||||||
|
return 16;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
} // Anonymous namespace
|
||||||
|
|
||||||
|
u32 ConvertedBytesPerBlock(VideoCore::Surface::PixelFormat pixel_format) {
|
||||||
|
switch (pixel_format) {
|
||||||
|
case PixelFormat::BC4_SNORM:
|
||||||
|
case PixelFormat::BC4_UNORM:
|
||||||
|
return 1;
|
||||||
|
case PixelFormat::BC5_SNORM:
|
||||||
|
case PixelFormat::BC5_UNORM:
|
||||||
|
return 2;
|
||||||
|
case PixelFormat::BC6H_SFLOAT:
|
||||||
|
case PixelFormat::BC6H_UFLOAT:
|
||||||
|
return 8;
|
||||||
|
default:
|
||||||
|
return 4;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
template <auto decompress, PixelFormat pixel_format>
|
||||||
|
void DecompressBlocks(std::span<const u8> input, std::span<u8> output, Extent3D extent,
|
||||||
|
bool is_signed = false) {
|
||||||
|
const u32 out_bpp = ConvertedBytesPerBlock(pixel_format);
|
||||||
|
const u32 block_width = std::min(extent.width, BLOCK_SIZE);
|
||||||
|
const u32 block_height = std::min(extent.height, BLOCK_SIZE);
|
||||||
|
const u32 pitch = extent.width * out_bpp;
|
||||||
|
size_t input_offset = 0;
|
||||||
|
size_t output_offset = 0;
|
||||||
|
for (u32 slice = 0; slice < extent.depth; ++slice) {
|
||||||
|
for (u32 y = 0; y < extent.height; y += block_height) {
|
||||||
|
size_t row_offset = 0;
|
||||||
|
for (u32 x = 0; x < extent.width;
|
||||||
|
x += block_width, row_offset += block_width * out_bpp) {
|
||||||
|
const u8* src = input.data() + input_offset;
|
||||||
|
u8* const dst = output.data() + output_offset + row_offset;
|
||||||
|
if constexpr (IsSigned(pixel_format)) {
|
||||||
|
decompress(src, dst, x, y, extent.width, extent.height, is_signed);
|
||||||
|
} else {
|
||||||
|
decompress(src, dst, x, y, extent.width, extent.height);
|
||||||
|
}
|
||||||
|
input_offset += BlockSize(pixel_format);
|
||||||
|
}
|
||||||
|
output_offset += block_height * pitch;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void DecompressBCn(std::span<const u8> input, std::span<u8> output, Extent3D extent,
|
||||||
|
VideoCore::Surface::PixelFormat pixel_format) {
|
||||||
|
switch (pixel_format) {
|
||||||
|
case PixelFormat::BC1_RGBA_UNORM:
|
||||||
|
case PixelFormat::BC1_RGBA_SRGB:
|
||||||
|
DecompressBlocks<bcn::DecodeBc1, PixelFormat::BC1_RGBA_UNORM>(input, output, extent);
|
||||||
|
break;
|
||||||
|
case PixelFormat::BC2_UNORM:
|
||||||
|
case PixelFormat::BC2_SRGB:
|
||||||
|
DecompressBlocks<bcn::DecodeBc2, PixelFormat::BC2_UNORM>(input, output, extent);
|
||||||
|
break;
|
||||||
|
case PixelFormat::BC3_UNORM:
|
||||||
|
case PixelFormat::BC3_SRGB:
|
||||||
|
DecompressBlocks<bcn::DecodeBc3, PixelFormat::BC3_UNORM>(input, output, extent);
|
||||||
|
break;
|
||||||
|
case PixelFormat::BC4_SNORM:
|
||||||
|
case PixelFormat::BC4_UNORM:
|
||||||
|
DecompressBlocks<bcn::DecodeBc4, PixelFormat::BC4_UNORM>(
|
||||||
|
input, output, extent, pixel_format == PixelFormat::BC4_SNORM);
|
||||||
|
break;
|
||||||
|
case PixelFormat::BC5_SNORM:
|
||||||
|
case PixelFormat::BC5_UNORM:
|
||||||
|
DecompressBlocks<bcn::DecodeBc5, PixelFormat::BC5_UNORM>(
|
||||||
|
input, output, extent, pixel_format == PixelFormat::BC5_SNORM);
|
||||||
|
break;
|
||||||
|
case PixelFormat::BC6H_SFLOAT:
|
||||||
|
case PixelFormat::BC6H_UFLOAT:
|
||||||
|
DecompressBlocks<bcn::DecodeBc6, PixelFormat::BC6H_UFLOAT>(
|
||||||
|
input, output, extent, pixel_format == PixelFormat::BC6H_SFLOAT);
|
||||||
|
break;
|
||||||
|
case PixelFormat::BC7_SRGB:
|
||||||
|
case PixelFormat::BC7_UNORM:
|
||||||
|
DecompressBlocks<bcn::DecodeBc7, PixelFormat::BC7_UNORM>(input, output, extent);
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
LOG_WARNING(HW_GPU, "Unimplemented BCn decompression {}", pixel_format);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace VideoCommon
|
|
@ -6,10 +6,14 @@
|
||||||
#include <span>
|
#include <span>
|
||||||
|
|
||||||
#include "common/common_types.h"
|
#include "common/common_types.h"
|
||||||
|
#include "video_core/surface.h"
|
||||||
#include "video_core/texture_cache/types.h"
|
#include "video_core/texture_cache/types.h"
|
||||||
|
|
||||||
namespace VideoCommon {
|
namespace VideoCommon {
|
||||||
|
|
||||||
void DecompressBC4(std::span<const u8> data, Extent3D extent, std::span<u8> output);
|
[[nodiscard]] u32 ConvertedBytesPerBlock(VideoCore::Surface::PixelFormat pixel_format);
|
||||||
|
|
||||||
|
void DecompressBCn(std::span<const u8> input, std::span<u8> output, Extent3D extent,
|
||||||
|
VideoCore::Surface::PixelFormat pixel_format);
|
||||||
|
|
||||||
} // namespace VideoCommon
|
} // namespace VideoCommon
|
|
@ -1,96 +0,0 @@
|
||||||
// SPDX-FileCopyrightText: Copyright 2020 yuzu Emulator Project
|
|
||||||
// SPDX-License-Identifier: GPL-2.0-or-later
|
|
||||||
|
|
||||||
#include <algorithm>
|
|
||||||
#include <array>
|
|
||||||
#include <span>
|
|
||||||
|
|
||||||
#include "common/assert.h"
|
|
||||||
#include "common/common_types.h"
|
|
||||||
#include "video_core/texture_cache/decode_bc4.h"
|
|
||||||
#include "video_core/texture_cache/types.h"
|
|
||||||
|
|
||||||
namespace VideoCommon {
|
|
||||||
|
|
||||||
// https://www.khronos.org/registry/OpenGL/extensions/ARB/ARB_texture_compression_rgtc.txt
|
|
||||||
[[nodiscard]] constexpr u32 DecompressBlock(u64 bits, u32 x, u32 y) {
|
|
||||||
const u32 code_offset = 16 + 3 * (4 * y + x);
|
|
||||||
const u32 code = (bits >> code_offset) & 7;
|
|
||||||
const u32 red0 = (bits >> 0) & 0xff;
|
|
||||||
const u32 red1 = (bits >> 8) & 0xff;
|
|
||||||
if (red0 > red1) {
|
|
||||||
switch (code) {
|
|
||||||
case 0:
|
|
||||||
return red0;
|
|
||||||
case 1:
|
|
||||||
return red1;
|
|
||||||
case 2:
|
|
||||||
return (6 * red0 + 1 * red1) / 7;
|
|
||||||
case 3:
|
|
||||||
return (5 * red0 + 2 * red1) / 7;
|
|
||||||
case 4:
|
|
||||||
return (4 * red0 + 3 * red1) / 7;
|
|
||||||
case 5:
|
|
||||||
return (3 * red0 + 4 * red1) / 7;
|
|
||||||
case 6:
|
|
||||||
return (2 * red0 + 5 * red1) / 7;
|
|
||||||
case 7:
|
|
||||||
return (1 * red0 + 6 * red1) / 7;
|
|
||||||
}
|
|
||||||
} else {
|
|
||||||
switch (code) {
|
|
||||||
case 0:
|
|
||||||
return red0;
|
|
||||||
case 1:
|
|
||||||
return red1;
|
|
||||||
case 2:
|
|
||||||
return (4 * red0 + 1 * red1) / 5;
|
|
||||||
case 3:
|
|
||||||
return (3 * red0 + 2 * red1) / 5;
|
|
||||||
case 4:
|
|
||||||
return (2 * red0 + 3 * red1) / 5;
|
|
||||||
case 5:
|
|
||||||
return (1 * red0 + 4 * red1) / 5;
|
|
||||||
case 6:
|
|
||||||
return 0;
|
|
||||||
case 7:
|
|
||||||
return 0xff;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
return 0;
|
|
||||||
}
|
|
||||||
|
|
||||||
void DecompressBC4(std::span<const u8> input, Extent3D extent, std::span<u8> output) {
|
|
||||||
UNIMPLEMENTED_IF_MSG(extent.width % 4 != 0, "Unaligned width={}", extent.width);
|
|
||||||
UNIMPLEMENTED_IF_MSG(extent.height % 4 != 0, "Unaligned height={}", extent.height);
|
|
||||||
static constexpr u32 BLOCK_SIZE = 4;
|
|
||||||
size_t input_offset = 0;
|
|
||||||
for (u32 slice = 0; slice < extent.depth; ++slice) {
|
|
||||||
for (u32 block_y = 0; block_y < extent.height / 4; ++block_y) {
|
|
||||||
for (u32 block_x = 0; block_x < extent.width / 4; ++block_x) {
|
|
||||||
u64 bits;
|
|
||||||
std::memcpy(&bits, &input[input_offset], sizeof(bits));
|
|
||||||
input_offset += sizeof(bits);
|
|
||||||
|
|
||||||
for (u32 y = 0; y < BLOCK_SIZE; ++y) {
|
|
||||||
for (u32 x = 0; x < BLOCK_SIZE; ++x) {
|
|
||||||
const u32 linear_z = slice;
|
|
||||||
const u32 linear_y = block_y * BLOCK_SIZE + y;
|
|
||||||
const u32 linear_x = block_x * BLOCK_SIZE + x;
|
|
||||||
const u32 offset_z = linear_z * extent.width * extent.height;
|
|
||||||
const u32 offset_y = linear_y * extent.width;
|
|
||||||
const u32 offset_x = linear_x;
|
|
||||||
const u32 output_offset = (offset_z + offset_y + offset_x) * 4ULL;
|
|
||||||
const u32 color = DecompressBlock(bits, x, y);
|
|
||||||
output[output_offset + 0] = static_cast<u8>(color);
|
|
||||||
output[output_offset + 1] = 0;
|
|
||||||
output[output_offset + 2] = 0;
|
|
||||||
output[output_offset + 3] = 0xff;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
} // namespace VideoCommon
|
|
|
@ -24,7 +24,7 @@
|
||||||
#include "video_core/engines/maxwell_3d.h"
|
#include "video_core/engines/maxwell_3d.h"
|
||||||
#include "video_core/memory_manager.h"
|
#include "video_core/memory_manager.h"
|
||||||
#include "video_core/surface.h"
|
#include "video_core/surface.h"
|
||||||
#include "video_core/texture_cache/decode_bc4.h"
|
#include "video_core/texture_cache/decode_bc.h"
|
||||||
#include "video_core/texture_cache/format_lookup_table.h"
|
#include "video_core/texture_cache/format_lookup_table.h"
|
||||||
#include "video_core/texture_cache/formatter.h"
|
#include "video_core/texture_cache/formatter.h"
|
||||||
#include "video_core/texture_cache/samples_helper.h"
|
#include "video_core/texture_cache/samples_helper.h"
|
||||||
|
@ -61,8 +61,6 @@ using VideoCore::Surface::PixelFormatFromDepthFormat;
|
||||||
using VideoCore::Surface::PixelFormatFromRenderTargetFormat;
|
using VideoCore::Surface::PixelFormatFromRenderTargetFormat;
|
||||||
using VideoCore::Surface::SurfaceType;
|
using VideoCore::Surface::SurfaceType;
|
||||||
|
|
||||||
constexpr u32 CONVERTED_BYTES_PER_BLOCK = BytesPerBlock(PixelFormat::A8B8G8R8_UNORM);
|
|
||||||
|
|
||||||
struct LevelInfo {
|
struct LevelInfo {
|
||||||
Extent3D size;
|
Extent3D size;
|
||||||
Extent3D block;
|
Extent3D block;
|
||||||
|
@ -612,7 +610,8 @@ u32 CalculateConvertedSizeBytes(const ImageInfo& info) noexcept {
|
||||||
}
|
}
|
||||||
return output_size;
|
return output_size;
|
||||||
}
|
}
|
||||||
return NumBlocksPerLayer(info, TILE_SIZE) * info.resources.layers * CONVERTED_BYTES_PER_BLOCK;
|
return NumBlocksPerLayer(info, TILE_SIZE) * info.resources.layers *
|
||||||
|
ConvertedBytesPerBlock(info.format);
|
||||||
}
|
}
|
||||||
|
|
||||||
u32 CalculateLayerStride(const ImageInfo& info) noexcept {
|
u32 CalculateLayerStride(const ImageInfo& info) noexcept {
|
||||||
|
@ -945,7 +944,8 @@ void ConvertImage(std::span<const u8> input, const ImageInfo& info, std::span<u8
|
||||||
tile_size.height, output.subspan(output_offset));
|
tile_size.height, output.subspan(output_offset));
|
||||||
|
|
||||||
output_offset += copy.image_extent.width * copy.image_extent.height *
|
output_offset += copy.image_extent.width * copy.image_extent.height *
|
||||||
copy.image_subresource.num_layers * CONVERTED_BYTES_PER_BLOCK;
|
copy.image_subresource.num_layers *
|
||||||
|
BytesPerBlock(PixelFormat::A8B8G8R8_UNORM);
|
||||||
} else if (astc) {
|
} else if (astc) {
|
||||||
// BC1 uses 0.5 bytes per texel
|
// BC1 uses 0.5 bytes per texel
|
||||||
// BC3 uses 1 byte per texel
|
// BC3 uses 1 byte per texel
|
||||||
|
@ -956,7 +956,8 @@ void ConvertImage(std::span<const u8> input, const ImageInfo& info, std::span<u8
|
||||||
|
|
||||||
const u32 plane_dim = copy.image_extent.width * copy.image_extent.height;
|
const u32 plane_dim = copy.image_extent.width * copy.image_extent.height;
|
||||||
const u32 level_size = plane_dim * copy.image_extent.depth *
|
const u32 level_size = plane_dim * copy.image_extent.depth *
|
||||||
copy.image_subresource.num_layers * CONVERTED_BYTES_PER_BLOCK;
|
copy.image_subresource.num_layers *
|
||||||
|
BytesPerBlock(PixelFormat::A8B8G8R8_UNORM);
|
||||||
decode_scratch.resize_destructive(level_size);
|
decode_scratch.resize_destructive(level_size);
|
||||||
|
|
||||||
Tegra::Texture::ASTC::Decompress(
|
Tegra::Texture::ASTC::Decompress(
|
||||||
|
@ -976,10 +977,15 @@ void ConvertImage(std::span<const u8> input, const ImageInfo& info, std::span<u8
|
||||||
bpp_div;
|
bpp_div;
|
||||||
output_offset += static_cast<u32>(copy.buffer_size);
|
output_offset += static_cast<u32>(copy.buffer_size);
|
||||||
} else {
|
} else {
|
||||||
DecompressBC4(input_offset, copy.image_extent, output.subspan(output_offset));
|
const Extent3D image_extent{
|
||||||
|
.width = copy.image_extent.width,
|
||||||
|
.height = copy.image_extent.height * copy.image_subresource.num_layers,
|
||||||
|
.depth = copy.image_extent.depth,
|
||||||
|
};
|
||||||
|
DecompressBCn(input_offset, output.subspan(output_offset), image_extent, info.format);
|
||||||
output_offset += copy.image_extent.width * copy.image_extent.height *
|
output_offset += copy.image_extent.width * copy.image_extent.height *
|
||||||
copy.image_subresource.num_layers * CONVERTED_BYTES_PER_BLOCK;
|
copy.image_subresource.num_layers *
|
||||||
|
ConvertedBytesPerBlock(info.format);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -3,7 +3,6 @@
|
||||||
|
|
||||||
#include <stb_dxt.h>
|
#include <stb_dxt.h>
|
||||||
#include <string.h>
|
#include <string.h>
|
||||||
|
|
||||||
#include "common/alignment.h"
|
#include "common/alignment.h"
|
||||||
#include "video_core/textures/bcn.h"
|
#include "video_core/textures/bcn.h"
|
||||||
#include "video_core/textures/workers.h"
|
#include "video_core/textures/workers.h"
|
||||||
|
|
|
@ -4,14 +4,13 @@
|
||||||
#pragma once
|
#pragma once
|
||||||
|
|
||||||
#include <span>
|
#include <span>
|
||||||
#include <stdint.h>
|
|
||||||
|
#include "common/common_types.h"
|
||||||
|
|
||||||
namespace Tegra::Texture::BCN {
|
namespace Tegra::Texture::BCN {
|
||||||
|
|
||||||
void CompressBC1(std::span<const uint8_t> data, uint32_t width, uint32_t height, uint32_t depth,
|
void CompressBC1(std::span<const u8> data, u32 width, u32 height, u32 depth, std::span<u8> output);
|
||||||
std::span<uint8_t> output);
|
|
||||||
|
|
||||||
void CompressBC3(std::span<const uint8_t> data, uint32_t width, uint32_t height, uint32_t depth,
|
void CompressBC3(std::span<const u8> data, u32 width, u32 height, u32 depth, std::span<u8> output);
|
||||||
std::span<uint8_t> output);
|
|
||||||
|
|
||||||
} // namespace Tegra::Texture::BCN
|
} // namespace Tegra::Texture::BCN
|
||||||
|
|
|
@ -293,6 +293,11 @@ public:
|
||||||
return features.features.textureCompressionASTC_LDR;
|
return features.features.textureCompressionASTC_LDR;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Returns true if BCn is natively supported.
|
||||||
|
bool IsOptimalBcnSupported() const {
|
||||||
|
return features.features.textureCompressionBC;
|
||||||
|
}
|
||||||
|
|
||||||
/// Returns true if descriptor aliasing is natively supported.
|
/// Returns true if descriptor aliasing is natively supported.
|
||||||
bool IsDescriptorAliasingSupported() const {
|
bool IsDescriptorAliasingSupported() const {
|
||||||
return GetDriverID() != VK_DRIVER_ID_QUALCOMM_PROPRIETARY;
|
return GetDriverID() != VK_DRIVER_ID_QUALCOMM_PROPRIETARY;
|
||||||
|
@ -423,6 +428,11 @@ public:
|
||||||
return extensions.sampler_filter_minmax;
|
return extensions.sampler_filter_minmax;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Returns true if the device supports VK_EXT_shader_stencil_export.
|
||||||
|
bool IsExtShaderStencilExportSupported() const {
|
||||||
|
return extensions.shader_stencil_export;
|
||||||
|
}
|
||||||
|
|
||||||
/// Returns true if the device supports VK_EXT_depth_range_unrestricted.
|
/// Returns true if the device supports VK_EXT_depth_range_unrestricted.
|
||||||
bool IsExtDepthRangeUnrestrictedSupported() const {
|
bool IsExtDepthRangeUnrestrictedSupported() const {
|
||||||
return extensions.depth_range_unrestricted;
|
return extensions.depth_range_unrestricted;
|
||||||
|
@ -492,11 +502,6 @@ public:
|
||||||
return extensions.vertex_input_dynamic_state;
|
return extensions.vertex_input_dynamic_state;
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Returns true if the device supports VK_EXT_shader_stencil_export.
|
|
||||||
bool IsExtShaderStencilExportSupported() const {
|
|
||||||
return extensions.shader_stencil_export;
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Returns true if the device supports VK_EXT_shader_demote_to_helper_invocation
|
/// Returns true if the device supports VK_EXT_shader_demote_to_helper_invocation
|
||||||
bool IsExtShaderDemoteToHelperInvocationSupported() const {
|
bool IsExtShaderDemoteToHelperInvocationSupported() const {
|
||||||
return extensions.shader_demote_to_helper_invocation;
|
return extensions.shader_demote_to_helper_invocation;
|
||||||
|
|
Loading…
Reference in a new issue