using Ryujinx.Common;
using System;
using System.Runtime.Intrinsics;
using static Ryujinx.Graphics.Texture.BlockLinearConstants;

namespace Ryujinx.Graphics.Texture
{
    /// <summary>
    /// Converts texture data between the block linear layout, a linear layout with a caller supplied stride,
    /// and the host linear layout (rows padded to <see cref="HostStrideAlignment"/> bytes).
    /// </summary>
    public static class LayoutConverter
    {
        /// <summary>
        /// Byte alignment applied to every row of the host linear layout.
        /// </summary>
        private const int HostStrideAlignment = 4;

        /// <summary>
        /// 12-byte element used to move 12 bytes per pixel data as a single unit.
        /// NOTE(review): if the project already declares an equivalent 12-byte pixel type, it can be used instead.
        /// </summary>
        private struct Pixel96
        {
#pragma warning disable CS0169, CS0649 // The fields only exist to give the struct its 12-byte size.
            public uint Part0;
            public uint Part1;
            public uint Part2;
#pragma warning restore CS0169, CS0649
        }

        /// <summary>
        /// Converts block linear texture data into host linear data.
        /// </summary>
        /// <param name="width">Width of the base level, in pixels</param>
        /// <param name="height">Height of the base level, in pixels</param>
        /// <param name="depth">Depth of the base level</param>
        /// <param name="levels">Number of mipmap levels to convert</param>
        /// <param name="layers">Number of layers to convert</param>
        /// <param name="blockWidth">Width of a block, in pixels (the level width is divided by it, rounding up)</param>
        /// <param name="blockHeight">Height of a block, in pixels (the level height is divided by it, rounding up)</param>
        /// <param name="bytesPerPixel">Size of one element in bytes; must be 1, 2, 4, 8, 12 or 16</param>
        /// <param name="gobBlocksInY">GOB blocks in Y used for the base level; halved for levels that are small enough</param>
        /// <param name="gobBlocksInZ">GOB blocks in Z used for the base level; halved for levels that are small enough</param>
        /// <param name="gobBlocksInTileX">Multiplier applied to the GOB width when computing the width alignment</param>
        /// <param name="sizeInfo">Provides the layer size and per level offsets of the block linear data</param>
        /// <param name="data">Block linear input data</param>
        /// <returns>Newly allocated buffer holding the host linear data for all layers and levels</returns>
        /// <exception cref="NotSupportedException">Thrown when <paramref name="bytesPerPixel"/> is not a supported size</exception>
        public static Span<byte> ConvertBlockLinearToLinear(
            int width,
            int height,
            int depth,
            int levels,
            int layers,
            int blockWidth,
            int blockHeight,
            int bytesPerPixel,
            int gobBlocksInY,
            int gobBlocksInZ,
            int gobBlocksInTileX,
            SizeInfo sizeInfo,
            ReadOnlySpan<byte> data)
        {
            int outSize = GetTextureSize(
                width,
                height,
                depth,
                levels,
                layers,
                blockWidth,
                blockHeight,
                bytesPerPixel);

            Span<byte> output = new byte[outSize];

            // Running write position on the output; rows are written back to back in iteration order.
            int outOffs = 0;

            int mipGobBlocksInY = gobBlocksInY;
            int mipGobBlocksInZ = gobBlocksInZ;

            int gobWidth = (GobStride / bytesPerPixel) * gobBlocksInTileX;
            int gobHeight = gobBlocksInY * GobHeight;

            for (int level = 0; level < levels; level++)
            {
                int w = Math.Max(1, width >> level);
                int h = Math.Max(1, height >> level);
                int d = Math.Max(1, depth >> level);

                w = BitUtils.DivRoundUp(w, blockWidth);
                h = BitUtils.DivRoundUp(h, blockHeight);

                // Shrink the block dimensions while the level still fits in half of them.
                // The reduced values carry over to the following (smaller) levels.
                while (h <= (mipGobBlocksInY >> 1) * GobHeight && mipGobBlocksInY != 1)
                {
                    mipGobBlocksInY >>= 1;
                }

                while (d <= (mipGobBlocksInZ >> 1) && mipGobBlocksInZ != 1)
                {
                    mipGobBlocksInZ >>= 1;
                }

                // Part of each row that can be copied in whole 16-byte chunks, and the first
                // element index that has to be copied element by element afterwards.
                int strideTrunc = BitUtils.AlignDown(w * bytesPerPixel, 16);
                int xStart = strideTrunc / bytesPerPixel;

                int stride = BitUtils.AlignUp(w * bytesPerPixel, HostStrideAlignment);

                int alignment = gobWidth;

                if (d < gobBlocksInZ || w <= gobWidth || h <= gobHeight)
                {
                    alignment = GobStride / bytesPerPixel;
                }

                int wAligned = BitUtils.AlignUp(w, alignment);

                BlockLinearLayout layoutConverter = new BlockLinearLayout(
                    wAligned,
                    h,
                    d,
                    mipGobBlocksInY,
                    mipGobBlocksInZ,
                    bytesPerPixel);

                // The spans are passed as parameters because ref structs cannot be captured by a local function.
                unsafe void Convert<T>(Span<byte> output, ReadOnlySpan<byte> data) where T : unmanaged
                {
                    fixed (byte* outputBPtr = output, dataBPtr = data)
                    {
                        for (int layer = 0; layer < layers; layer++)
                        {
                            int inBaseOffset = layer * sizeInfo.LayerSize + sizeInfo.GetMipOffset(level);

                            for (int z = 0; z < d; z++)
                            {
                                layoutConverter.SetZ(z);

                                for (int y = 0; y < h; y++)
                                {
                                    layoutConverter.SetY(y);

                                    // Here x is a byte offset inside the row.
                                    for (int x = 0; x < strideTrunc; x += 16)
                                    {
                                        int offset = inBaseOffset + layoutConverter.GetOffsetWithLineOffset(x);

                                        *(Vector128<byte>*)(outputBPtr + outOffs + x) = *(Vector128<byte>*)(dataBPtr + offset);
                                    }

                                    // Here x is an element index; copies what the 16-byte loop left over.
                                    for (int x = xStart; x < w; x++)
                                    {
                                        int offset = inBaseOffset + layoutConverter.GetOffset(x);

                                        ((T*)(outputBPtr + outOffs))[x] = *(T*)(dataBPtr + offset);
                                    }

                                    outOffs += stride;
                                }
                            }
                        }
                    }
                }

                switch (bytesPerPixel)
                {
                    case 1:
                        Convert<byte>(output, data);
                        break;
                    case 2:
                        Convert<ushort>(output, data);
                        break;
                    case 4:
                        Convert<uint>(output, data);
                        break;
                    case 8:
                        Convert<ulong>(output, data);
                        break;
                    case 12:
                        Convert<Pixel96>(output, data);
                        break;
                    case 16:
                        Convert<Vector128<byte>>(output, data);
                        break;
                    default:
                        throw CreateUnsupportedFormatException(bytesPerPixel);
                }
            }

            return output;
        }

        /// <summary>
        /// Converts linear data with a caller supplied stride into host linear data.
        /// </summary>
        /// <param name="width">Width of the texture, in pixels</param>
        /// <param name="height">Height of the texture, in pixels</param>
        /// <param name="blockWidth">Width of a block, in pixels (the width is divided by it, rounding up)</param>
        /// <param name="blockHeight">Height of a block, in pixels (the height is divided by it, rounding up)</param>
        /// <param name="stride">Distance in bytes between the start of two consecutive input rows</param>
        /// <param name="bytesPerPixel">Size of one element in bytes; must be 1, 2, 4, 8, 12 or 16</param>
        /// <param name="data">Strided linear input data</param>
        /// <returns>Newly allocated buffer holding the host linear data</returns>
        /// <exception cref="NotSupportedException">Thrown when <paramref name="bytesPerPixel"/> is not a supported size</exception>
        public static Span<byte> ConvertLinearStridedToLinear(
            int width,
            int height,
            int blockWidth,
            int blockHeight,
            int stride,
            int bytesPerPixel,
            ReadOnlySpan<byte> data)
        {
            int w = BitUtils.DivRoundUp(width, blockWidth);
            int h = BitUtils.DivRoundUp(height, blockHeight);

            int outStride = BitUtils.AlignUp(w * bytesPerPixel, HostStrideAlignment);

            Span<byte> output = new byte[h * outStride];

            // Start of the current output row, in bytes.
            int outOffs = 0;

            // The spans are passed as parameters because ref structs cannot be captured by a local function.
            unsafe void Convert<T>(Span<byte> output, ReadOnlySpan<byte> data) where T : unmanaged
            {
                fixed (byte* outputBPtr = output, dataBPtr = data)
                {
                    for (int y = 0; y < h; y++)
                    {
                        for (int x = 0; x < w; x++)
                        {
                            int offset = y * stride + x * bytesPerPixel;

                            ((T*)(outputBPtr + outOffs))[x] = *(T*)(dataBPtr + offset);
                        }

                        outOffs += outStride;
                    }
                }
            }

            switch (bytesPerPixel)
            {
                case 1:
                    Convert<byte>(output, data);
                    break;
                case 2:
                    Convert<ushort>(output, data);
                    break;
                case 4:
                    Convert<uint>(output, data);
                    break;
                case 8:
                    Convert<ulong>(output, data);
                    break;
                case 12:
                    Convert<Pixel96>(output, data);
                    break;
                case 16:
                    Convert<Vector128<byte>>(output, data);
                    break;
                default:
                    throw CreateUnsupportedFormatException(bytesPerPixel);
            }

            return output;
        }

        /// <summary>
        /// Converts host linear data into block linear texture data.
        /// </summary>
        /// <param name="width">Width of the base level, in pixels</param>
        /// <param name="height">Height of the base level, in pixels</param>
        /// <param name="depth">Depth of the base level</param>
        /// <param name="levels">Number of mipmap levels to convert</param>
        /// <param name="layers">Number of layers to convert</param>
        /// <param name="blockWidth">Width of a block, in pixels (the level width is divided by it, rounding up)</param>
        /// <param name="blockHeight">Height of a block, in pixels (the level height is divided by it, rounding up)</param>
        /// <param name="bytesPerPixel">Size of one element in bytes; must be 1, 2, 4, 8, 12 or 16</param>
        /// <param name="gobBlocksInY">GOB blocks in Y used for the base level; halved for levels that are small enough</param>
        /// <param name="gobBlocksInZ">GOB blocks in Z used for the base level; halved for levels that are small enough</param>
        /// <param name="gobBlocksInTileX">Multiplier applied to the GOB width when computing the width alignment</param>
        /// <param name="sizeInfo">Provides the total size, layer size and per level offsets of the block linear data</param>
        /// <param name="data">Host linear input data</param>
        /// <returns>Newly allocated buffer of <c>sizeInfo.TotalSize</c> bytes holding the block linear data</returns>
        /// <exception cref="NotSupportedException">Thrown when <paramref name="bytesPerPixel"/> is not a supported size</exception>
        public static Span<byte> ConvertLinearToBlockLinear(
            int width,
            int height,
            int depth,
            int levels,
            int layers,
            int blockWidth,
            int blockHeight,
            int bytesPerPixel,
            int gobBlocksInY,
            int gobBlocksInZ,
            int gobBlocksInTileX,
            SizeInfo sizeInfo,
            ReadOnlySpan<byte> data)
        {
            Span<byte> output = new byte[sizeInfo.TotalSize];

            // Running read position on the input; rows are read back to back in iteration order.
            int inOffs = 0;

            int mipGobBlocksInY = gobBlocksInY;
            int mipGobBlocksInZ = gobBlocksInZ;

            int gobWidth = (GobStride / bytesPerPixel) * gobBlocksInTileX;
            int gobHeight = gobBlocksInY * GobHeight;

            for (int level = 0; level < levels; level++)
            {
                int w = Math.Max(1, width >> level);
                int h = Math.Max(1, height >> level);
                int d = Math.Max(1, depth >> level);

                w = BitUtils.DivRoundUp(w, blockWidth);
                h = BitUtils.DivRoundUp(h, blockHeight);

                // Shrink the block dimensions while the level still fits in half of them.
                // The reduced values carry over to the following (smaller) levels.
                while (h <= (mipGobBlocksInY >> 1) * GobHeight && mipGobBlocksInY != 1)
                {
                    mipGobBlocksInY >>= 1;
                }

                while (d <= (mipGobBlocksInZ >> 1) && mipGobBlocksInZ != 1)
                {
                    mipGobBlocksInZ >>= 1;
                }

                int stride = BitUtils.AlignUp(w * bytesPerPixel, HostStrideAlignment);

                int alignment = gobWidth;

                if (d < gobBlocksInZ || w <= gobWidth || h <= gobHeight)
                {
                    alignment = GobStride / bytesPerPixel;
                }

                int wAligned = BitUtils.AlignUp(w, alignment);

                BlockLinearLayout layoutConverter = new BlockLinearLayout(
                    wAligned,
                    h,
                    d,
                    mipGobBlocksInY,
                    mipGobBlocksInZ,
                    bytesPerPixel);

                // The spans are passed as parameters because ref structs cannot be captured by a local function.
                unsafe void Convert<T>(Span<byte> output, ReadOnlySpan<byte> data) where T : unmanaged
                {
                    fixed (byte* outputBPtr = output, dataBPtr = data)
                    {
                        for (int layer = 0; layer < layers; layer++)
                        {
                            int outBaseOffset = layer * sizeInfo.LayerSize + sizeInfo.GetMipOffset(level);

                            for (int z = 0; z < d; z++)
                            {
                                layoutConverter.SetZ(z);

                                for (int y = 0; y < h; y++)
                                {
                                    layoutConverter.SetY(y);

                                    for (int x = 0; x < w; x++)
                                    {
                                        int offset = outBaseOffset + layoutConverter.GetOffset(x);

                                        *(T*)(outputBPtr + offset) = ((T*)(dataBPtr + inOffs))[x];
                                    }

                                    inOffs += stride;
                                }
                            }
                        }
                    }
                }

                switch (bytesPerPixel)
                {
                    case 1:
                        Convert<byte>(output, data);
                        break;
                    case 2:
                        Convert<ushort>(output, data);
                        break;
                    case 4:
                        Convert<uint>(output, data);
                        break;
                    case 8:
                        Convert<ulong>(output, data);
                        break;
                    case 12:
                        Convert<Pixel96>(output, data);
                        break;
                    case 16:
                        Convert<Vector128<byte>>(output, data);
                        break;
                    default:
                        throw CreateUnsupportedFormatException(bytesPerPixel);
                }
            }

            return output;
        }

        /// <summary>
        /// Converts host linear data into linear data with a caller supplied stride.
        /// </summary>
        /// <param name="width">Width of the texture, in pixels</param>
        /// <param name="height">Height of the texture, in pixels</param>
        /// <param name="blockWidth">Width of a block, in pixels (the width is divided by it, rounding up)</param>
        /// <param name="blockHeight">Height of a block, in pixels (the height is divided by it, rounding up)</param>
        /// <param name="stride">Distance in bytes between the start of two consecutive output rows</param>
        /// <param name="bytesPerPixel">Size of one element in bytes; must be 1, 2, 4, 8, 12 or 16</param>
        /// <param name="data">Host linear input data</param>
        /// <returns>Newly allocated buffer of <c>height in blocks * stride</c> bytes holding the strided data</returns>
        /// <exception cref="NotSupportedException">Thrown when <paramref name="bytesPerPixel"/> is not a supported size</exception>
        public static Span<byte> ConvertLinearToLinearStrided(
            int width,
            int height,
            int blockWidth,
            int blockHeight,
            int stride,
            int bytesPerPixel,
            ReadOnlySpan<byte> data)
        {
            int w = BitUtils.DivRoundUp(width, blockWidth);
            int h = BitUtils.DivRoundUp(height, blockHeight);

            int inStride = BitUtils.AlignUp(w * bytesPerPixel, HostStrideAlignment);

            Span<byte> output = new byte[h * stride];

            // Start of the current input row, in bytes.
            int inOffs = 0;

            // The spans are passed as parameters because ref structs cannot be captured by a local function.
            unsafe void Convert<T>(Span<byte> output, ReadOnlySpan<byte> data) where T : unmanaged
            {
                fixed (byte* outputBPtr = output, dataBPtr = data)
                {
                    for (int y = 0; y < h; y++)
                    {
                        for (int x = 0; x < w; x++)
                        {
                            int offset = y * stride + x * bytesPerPixel;

                            *(T*)(outputBPtr + offset) = ((T*)(dataBPtr + inOffs))[x];
                        }

                        inOffs += inStride;
                    }
                }
            }

            switch (bytesPerPixel)
            {
                case 1:
                    Convert<byte>(output, data);
                    break;
                case 2:
                    Convert<ushort>(output, data);
                    break;
                case 4:
                    Convert<uint>(output, data);
                    break;
                case 8:
                    Convert<ulong>(output, data);
                    break;
                case 12:
                    Convert<Pixel96>(output, data);
                    break;
                case 16:
                    Convert<Vector128<byte>>(output, data);
                    break;
                default:
                    throw CreateUnsupportedFormatException(bytesPerPixel);
            }

            return output;
        }

        /// <summary>
        /// Computes the size in bytes of the host linear data for all layers and levels of a texture.
        /// </summary>
        /// <param name="width">Width of the base level, in pixels</param>
        /// <param name="height">Height of the base level, in pixels</param>
        /// <param name="depth">Depth of the base level</param>
        /// <param name="levels">Number of mipmap levels</param>
        /// <param name="layers">Number of layers</param>
        /// <param name="blockWidth">Width of a block, in pixels</param>
        /// <param name="blockHeight">Height of a block, in pixels</param>
        /// <param name="bytesPerPixel">Size of one element in bytes</param>
        /// <returns>Sum of <c>stride * height * depth</c> over all levels, multiplied by the layer count</returns>
        private static int GetTextureSize(
            int width,
            int height,
            int depth,
            int levels,
            int layers,
            int blockWidth,
            int blockHeight,
            int bytesPerPixel)
        {
            int layerSize = 0;

            for (int level = 0; level < levels; level++)
            {
                int w = Math.Max(1, width >> level);
                int h = Math.Max(1, height >> level);
                int d = Math.Max(1, depth >> level);

                w = BitUtils.DivRoundUp(w, blockWidth);
                h = BitUtils.DivRoundUp(h, blockHeight);

                int stride = BitUtils.AlignUp(w * bytesPerPixel, HostStrideAlignment);

                layerSize += stride * h * d;
            }

            return layerSize * layers;
        }

        /// <summary>
        /// Creates the exception thrown by the converters for an element size they cannot handle.
        /// </summary>
        /// <param name="bytesPerPixel">The unsupported element size, in bytes</param>
        /// <returns>The exception to throw</returns>
        private static NotSupportedException CreateUnsupportedFormatException(int bytesPerPixel)
        {
            // Note: no '$' before the brace; inside an interpolated string it would be emitted literally.
            return new NotSupportedException($"Unable to convert {bytesPerPixel} bpp pixel format.");
        }
    }
}