forked from Mirror/Ryujinx
Support texture rectangle targets (non-normalized coords)
This commit is contained in:
parent
2eccc7023a
commit
9d7a142a48
23 changed files with 473 additions and 356 deletions
|
@ -21,7 +21,7 @@ namespace Ryujinx.Graphics.Gpu.Engine
|
||||||
ulong shaderGpuVa = shaderBaseAddress.Pack() + (uint)dispatchParams.ShaderOffset;
|
ulong shaderGpuVa = shaderBaseAddress.Pack() + (uint)dispatchParams.ShaderOffset;
|
||||||
|
|
||||||
// Note: A size of 0 is also invalid, the size must be at least 1.
|
// Note: A size of 0 is also invalid, the size must be at least 1.
|
||||||
int sharedMemorySize = Math.Clamp(dispatchParams.SharedMemorySize & 0xffff, 4, _context.Capabilities.MaximumComputeSharedMemorySize);
|
int sharedMemorySize = Math.Clamp(dispatchParams.SharedMemorySize & 0xffff, 1, _context.Capabilities.MaximumComputeSharedMemorySize);
|
||||||
|
|
||||||
ComputeShader cs = _shaderCache.GetComputeShader(
|
ComputeShader cs = _shaderCache.GetComputeShader(
|
||||||
shaderGpuVa,
|
shaderGpuVa,
|
||||||
|
|
|
@ -671,9 +671,7 @@ namespace Ryujinx.Graphics.Gpu.Engine
|
||||||
addressesArray[index] = baseAddress + shader.Offset;
|
addressesArray[index] = baseAddress + shader.Offset;
|
||||||
}
|
}
|
||||||
|
|
||||||
bool viewportTransformEnable = GetViewportTransformEnable(state);
|
GraphicsShader gs = _shaderCache.GetGraphicsShader(state, addresses);
|
||||||
|
|
||||||
GraphicsShader gs = _shaderCache.GetGraphicsShader(addresses, !viewportTransformEnable);
|
|
||||||
|
|
||||||
_vsUsesInstanceId = gs.Shader[0].Program.Info.UsesInstanceId;
|
_vsUsesInstanceId = gs.Shader[0].Program.Info.UsesInstanceId;
|
||||||
|
|
||||||
|
@ -734,7 +732,7 @@ namespace Ryujinx.Graphics.Gpu.Engine
|
||||||
_context.Renderer.Pipeline.BindProgram(gs.HostProgram);
|
_context.Renderer.Pipeline.BindProgram(gs.HostProgram);
|
||||||
}
|
}
|
||||||
|
|
||||||
private bool GetViewportTransformEnable(GpuState state)
|
public bool GetViewportTransformEnable(GpuState state)
|
||||||
{
|
{
|
||||||
// FIXME: We should read ViewportTransformEnable, but it seems that some games writes 0 there?
|
// FIXME: We should read ViewportTransformEnable, but it seems that some games writes 0 there?
|
||||||
// return state.Get<Boolean32>(MethodOffset.ViewportTransformEnable) != 0;
|
// return state.Get<Boolean32>(MethodOffset.ViewportTransformEnable) != 0;
|
||||||
|
|
|
@ -199,6 +199,21 @@ namespace Ryujinx.Graphics.Gpu.Image
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public TextureDescriptor GetTextureDescriptor(GpuState state, int stageIndex, int handle)
|
||||||
|
{
|
||||||
|
int packedId = ReadPackedId(stageIndex, handle);
|
||||||
|
|
||||||
|
int textureId = UnpackTextureId(packedId);
|
||||||
|
|
||||||
|
var poolState = state.Get<PoolState>(MethodOffset.TexturePoolState);
|
||||||
|
|
||||||
|
ulong poolAddress = _context.MemoryManager.Translate(poolState.Address.Pack());
|
||||||
|
|
||||||
|
TexturePool texturePool = _texturePoolCache.FindOrCreate(poolAddress, poolState.MaximumId);
|
||||||
|
|
||||||
|
return texturePool.GetDescriptor(textureId);
|
||||||
|
}
|
||||||
|
|
||||||
private int ReadPackedId(int stage, int wordOffset)
|
private int ReadPackedId(int stage, int wordOffset)
|
||||||
{
|
{
|
||||||
ulong address;
|
ulong address;
|
||||||
|
|
|
@ -101,6 +101,11 @@ namespace Ryujinx.Graphics.Gpu.Image
|
||||||
return (int)((Word5 >> 16) & 0x3fff) + 1;
|
return (int)((Word5 >> 16) & 0x3fff) + 1;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public bool UnpackTextureCoordNormalized()
|
||||||
|
{
|
||||||
|
return (Word5 & (1 << 31)) != 0;
|
||||||
|
}
|
||||||
|
|
||||||
public int UnpackBaseLevel()
|
public int UnpackBaseLevel()
|
||||||
{
|
{
|
||||||
return (int)(Word7 & 0xf);
|
return (int)(Word7 & 0xf);
|
||||||
|
|
|
@ -129,6 +129,11 @@ namespace Ryujinx.Graphics.Gpu.Image
|
||||||
UpdateRenderTargets();
|
UpdateRenderTargets();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public TextureDescriptor GetGraphicsTextureDescriptor(GpuState state, int stageIndex, int handle)
|
||||||
|
{
|
||||||
|
return _gpBindingsManager.GetTextureDescriptor(state, stageIndex, handle);
|
||||||
|
}
|
||||||
|
|
||||||
private void UpdateRenderTargets()
|
private void UpdateRenderTargets()
|
||||||
{
|
{
|
||||||
bool anyChanged = false;
|
bool anyChanged = false;
|
||||||
|
|
|
@ -36,11 +36,7 @@ namespace Ryujinx.Graphics.Gpu.Image
|
||||||
|
|
||||||
if (texture == null)
|
if (texture == null)
|
||||||
{
|
{
|
||||||
ulong address = Address + (ulong)(uint)id * DescriptorSize;
|
TextureDescriptor descriptor = GetDescriptor(id);
|
||||||
|
|
||||||
Span<byte> data = Context.PhysicalMemory.Read(address, DescriptorSize);
|
|
||||||
|
|
||||||
TextureDescriptor descriptor = MemoryMarshal.Cast<byte, TextureDescriptor>(data)[0];
|
|
||||||
|
|
||||||
TextureInfo info = GetInfo(descriptor);
|
TextureInfo info = GetInfo(descriptor);
|
||||||
|
|
||||||
|
@ -66,6 +62,15 @@ namespace Ryujinx.Graphics.Gpu.Image
|
||||||
return texture;
|
return texture;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public TextureDescriptor GetDescriptor(int id)
|
||||||
|
{
|
||||||
|
ulong address = Address + (ulong)(uint)id * DescriptorSize;
|
||||||
|
|
||||||
|
Span<byte> data = Context.PhysicalMemory.Read(address, DescriptorSize);
|
||||||
|
|
||||||
|
return MemoryMarshal.Cast<byte, TextureDescriptor>(data)[0];
|
||||||
|
}
|
||||||
|
|
||||||
protected override void InvalidateRangeImpl(ulong address, ulong size)
|
protected override void InvalidateRangeImpl(ulong address, ulong size)
|
||||||
{
|
{
|
||||||
ulong endAddress = address + size;
|
ulong endAddress = address + size;
|
||||||
|
|
|
@ -11,7 +11,7 @@ namespace Ryujinx.Graphics.Gpu.Image
|
||||||
Texture1DArray,
|
Texture1DArray,
|
||||||
Texture2DArray,
|
Texture2DArray,
|
||||||
TextureBuffer,
|
TextureBuffer,
|
||||||
Texture2DLinear,
|
Texture2DRect,
|
||||||
CubemapArray
|
CubemapArray
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -33,7 +33,7 @@ namespace Ryujinx.Graphics.Gpu.Image
|
||||||
{
|
{
|
||||||
case TextureTarget.Texture1D: return Target.Texture1D;
|
case TextureTarget.Texture1D: return Target.Texture1D;
|
||||||
case TextureTarget.Texture2D: return Target.Texture2D;
|
case TextureTarget.Texture2D: return Target.Texture2D;
|
||||||
case TextureTarget.Texture2DLinear: return Target.Texture2D;
|
case TextureTarget.Texture2DRect: return Target.Texture2D;
|
||||||
case TextureTarget.Texture3D: return Target.Texture3D;
|
case TextureTarget.Texture3D: return Target.Texture3D;
|
||||||
case TextureTarget.Texture1DArray: return Target.Texture1DArray;
|
case TextureTarget.Texture1DArray: return Target.Texture1DArray;
|
||||||
case TextureTarget.Texture2DArray: return Target.Texture2DArray;
|
case TextureTarget.Texture2DArray: return Target.Texture2DArray;
|
||||||
|
|
|
@ -1,10 +1,10 @@
|
||||||
using Ryujinx.Graphics.GAL;
|
using Ryujinx.Graphics.GAL;
|
||||||
|
using Ryujinx.Graphics.Gpu.Image;
|
||||||
using Ryujinx.Graphics.Gpu.State;
|
using Ryujinx.Graphics.Gpu.State;
|
||||||
using Ryujinx.Graphics.Shader;
|
using Ryujinx.Graphics.Shader;
|
||||||
using Ryujinx.Graphics.Shader.Translation;
|
using Ryujinx.Graphics.Shader.Translation;
|
||||||
using System;
|
using System;
|
||||||
using System.Collections.Generic;
|
using System.Collections.Generic;
|
||||||
using System.Globalization;
|
|
||||||
using System.Runtime.InteropServices;
|
using System.Runtime.InteropServices;
|
||||||
|
|
||||||
namespace Ryujinx.Graphics.Gpu.Shader
|
namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
|
@ -13,6 +13,8 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
{
|
{
|
||||||
private const int MaxProgramSize = 0x100000;
|
private const int MaxProgramSize = 0x100000;
|
||||||
|
|
||||||
|
private const TranslationFlags DefaultFlags = TranslationFlags.DebugMode;
|
||||||
|
|
||||||
private GpuContext _context;
|
private GpuContext _context;
|
||||||
|
|
||||||
private ShaderDumper _dumper;
|
private ShaderDumper _dumper;
|
||||||
|
@ -69,7 +71,7 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
return cpShader;
|
return cpShader;
|
||||||
}
|
}
|
||||||
|
|
||||||
public GraphicsShader GetGraphicsShader(ShaderAddresses addresses, bool dividePosXY)
|
public GraphicsShader GetGraphicsShader(GpuState state, ShaderAddresses addresses)
|
||||||
{
|
{
|
||||||
bool isCached = _gpPrograms.TryGetValue(addresses, out List<GraphicsShader> list);
|
bool isCached = _gpPrograms.TryGetValue(addresses, out List<GraphicsShader> list);
|
||||||
|
|
||||||
|
@ -86,28 +88,19 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
|
|
||||||
GraphicsShader gpShaders = new GraphicsShader();
|
GraphicsShader gpShaders = new GraphicsShader();
|
||||||
|
|
||||||
TranslationFlags flags =
|
|
||||||
TranslationFlags.DebugMode |
|
|
||||||
TranslationFlags.Unspecialized;
|
|
||||||
|
|
||||||
if (dividePosXY)
|
|
||||||
{
|
|
||||||
flags |= TranslationFlags.DividePosXY;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (addresses.VertexA != 0)
|
if (addresses.VertexA != 0)
|
||||||
{
|
{
|
||||||
gpShaders.Shader[0] = TranslateGraphicsShader(flags, addresses.Vertex, addresses.VertexA);
|
gpShaders.Shader[0] = TranslateGraphicsShader(state, ShaderStage.Vertex, addresses.Vertex, addresses.VertexA);
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
gpShaders.Shader[0] = TranslateGraphicsShader(flags, addresses.Vertex);
|
gpShaders.Shader[0] = TranslateGraphicsShader(state, ShaderStage.Vertex, addresses.Vertex);
|
||||||
}
|
}
|
||||||
|
|
||||||
gpShaders.Shader[1] = TranslateGraphicsShader(flags, addresses.TessControl);
|
gpShaders.Shader[1] = TranslateGraphicsShader(state, ShaderStage.TessellationControl, addresses.TessControl);
|
||||||
gpShaders.Shader[2] = TranslateGraphicsShader(flags, addresses.TessEvaluation);
|
gpShaders.Shader[2] = TranslateGraphicsShader(state, ShaderStage.TessellationEvaluation, addresses.TessEvaluation);
|
||||||
gpShaders.Shader[3] = TranslateGraphicsShader(flags, addresses.Geometry);
|
gpShaders.Shader[3] = TranslateGraphicsShader(state, ShaderStage.Geometry, addresses.Geometry);
|
||||||
gpShaders.Shader[4] = TranslateGraphicsShader(flags, addresses.Fragment);
|
gpShaders.Shader[4] = TranslateGraphicsShader(state, ShaderStage.Fragment, addresses.Fragment);
|
||||||
|
|
||||||
BackpropQualifiers(gpShaders);
|
BackpropQualifiers(gpShaders);
|
||||||
|
|
||||||
|
@ -199,25 +192,31 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
return null;
|
return null;
|
||||||
}
|
}
|
||||||
|
|
||||||
ShaderProgram program;
|
QueryInfoCallback queryInfo = (QueryInfoName info, int index) =>
|
||||||
|
{
|
||||||
|
switch (info)
|
||||||
|
{
|
||||||
|
case QueryInfoName.ComputeLocalSizeX:
|
||||||
|
return localSizeX;
|
||||||
|
case QueryInfoName.ComputeLocalSizeY:
|
||||||
|
return localSizeY;
|
||||||
|
case QueryInfoName.ComputeLocalSizeZ:
|
||||||
|
return localSizeZ;
|
||||||
|
case QueryInfoName.ComputeSharedMemorySize:
|
||||||
|
return sharedMemorySize;
|
||||||
|
}
|
||||||
|
|
||||||
const TranslationFlags flags =
|
return QueryInfoCommon(info);
|
||||||
TranslationFlags.Compute |
|
};
|
||||||
TranslationFlags.DebugMode |
|
|
||||||
TranslationFlags.Unspecialized;
|
ShaderProgram program;
|
||||||
|
|
||||||
Span<byte> code = _context.MemoryAccessor.Read(gpuVa, MaxProgramSize);
|
Span<byte> code = _context.MemoryAccessor.Read(gpuVa, MaxProgramSize);
|
||||||
|
|
||||||
program = Translator.Translate(code, GetShaderCapabilities(), flags);
|
program = Translator.Translate(code, queryInfo, DefaultFlags | TranslationFlags.Compute);
|
||||||
|
|
||||||
int[] codeCached = MemoryMarshal.Cast<byte, int>(code.Slice(0, program.Size)).ToArray();
|
int[] codeCached = MemoryMarshal.Cast<byte, int>(code.Slice(0, program.Size)).ToArray();
|
||||||
|
|
||||||
program.Replace(DefineNames.SharedMemorySize, (sharedMemorySize / 4).ToString(CultureInfo.InvariantCulture));
|
|
||||||
|
|
||||||
program.Replace(DefineNames.LocalSizeX, localSizeX.ToString(CultureInfo.InvariantCulture));
|
|
||||||
program.Replace(DefineNames.LocalSizeY, localSizeY.ToString(CultureInfo.InvariantCulture));
|
|
||||||
program.Replace(DefineNames.LocalSizeZ, localSizeZ.ToString(CultureInfo.InvariantCulture));
|
|
||||||
|
|
||||||
_dumper.Dump(code, compute: true, out string fullPath, out string codePath);
|
_dumper.Dump(code, compute: true, out string fullPath, out string codePath);
|
||||||
|
|
||||||
if (fullPath != null && codePath != null)
|
if (fullPath != null && codePath != null)
|
||||||
|
@ -229,13 +228,30 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
return new CachedShader(program, codeCached);
|
return new CachedShader(program, codeCached);
|
||||||
}
|
}
|
||||||
|
|
||||||
private CachedShader TranslateGraphicsShader(TranslationFlags flags, ulong gpuVa, ulong gpuVaA = 0)
|
private CachedShader TranslateGraphicsShader(GpuState state, ShaderStage stage, ulong gpuVa, ulong gpuVaA = 0)
|
||||||
{
|
{
|
||||||
if (gpuVa == 0)
|
if (gpuVa == 0)
|
||||||
{
|
{
|
||||||
return new CachedShader(null, null);
|
return new CachedShader(null, null);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
QueryInfoCallback queryInfo = (QueryInfoName info, int index) =>
|
||||||
|
{
|
||||||
|
switch (info)
|
||||||
|
{
|
||||||
|
case QueryInfoName.IsTextureBuffer:
|
||||||
|
return Convert.ToInt32(QueryIsTextureBuffer(state, (int)stage - 1, index));
|
||||||
|
case QueryInfoName.IsTextureRectangle:
|
||||||
|
return Convert.ToInt32(QueryIsTextureRectangle(state, (int)stage - 1, index));
|
||||||
|
case QueryInfoName.PrimitiveTopology:
|
||||||
|
return (int)GetPrimitiveTopology();
|
||||||
|
case QueryInfoName.ViewportTransformEnable:
|
||||||
|
return Convert.ToInt32(_context.Methods.GetViewportTransformEnable(state));
|
||||||
|
}
|
||||||
|
|
||||||
|
return QueryInfoCommon(info);
|
||||||
|
};
|
||||||
|
|
||||||
ShaderProgram program;
|
ShaderProgram program;
|
||||||
|
|
||||||
int[] codeCached = null;
|
int[] codeCached = null;
|
||||||
|
@ -245,9 +261,9 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
Span<byte> codeA = _context.MemoryAccessor.Read(gpuVaA, MaxProgramSize);
|
Span<byte> codeA = _context.MemoryAccessor.Read(gpuVaA, MaxProgramSize);
|
||||||
Span<byte> codeB = _context.MemoryAccessor.Read(gpuVa, MaxProgramSize);
|
Span<byte> codeB = _context.MemoryAccessor.Read(gpuVa, MaxProgramSize);
|
||||||
|
|
||||||
program = Translator.Translate(codeA, codeB, GetShaderCapabilities(), flags);
|
program = Translator.Translate(codeA, codeB, queryInfo, DefaultFlags);
|
||||||
|
|
||||||
// TODO: We should also check "codeA" into account.
|
// TODO: We should also take "codeA" into account.
|
||||||
codeCached = MemoryMarshal.Cast<byte, int>(codeB.Slice(0, program.Size)).ToArray();
|
codeCached = MemoryMarshal.Cast<byte, int>(codeB.Slice(0, program.Size)).ToArray();
|
||||||
|
|
||||||
_dumper.Dump(codeA, compute: false, out string fullPathA, out string codePathA);
|
_dumper.Dump(codeA, compute: false, out string fullPathA, out string codePathA);
|
||||||
|
@ -265,7 +281,7 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
{
|
{
|
||||||
Span<byte> code = _context.MemoryAccessor.Read(gpuVa, MaxProgramSize);
|
Span<byte> code = _context.MemoryAccessor.Read(gpuVa, MaxProgramSize);
|
||||||
|
|
||||||
program = Translator.Translate(code, GetShaderCapabilities(), flags);
|
program = Translator.Translate(code, queryInfo, DefaultFlags);
|
||||||
|
|
||||||
codeCached = MemoryMarshal.Cast<byte, int>(code.Slice(0, program.Size)).ToArray();
|
codeCached = MemoryMarshal.Cast<byte, int>(code.Slice(0, program.Size)).ToArray();
|
||||||
|
|
||||||
|
@ -278,40 +294,6 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if (program.Stage == ShaderStage.Geometry)
|
|
||||||
{
|
|
||||||
PrimitiveType primitiveType = _context.Methods.PrimitiveType;
|
|
||||||
|
|
||||||
string inPrimitive = "points";
|
|
||||||
|
|
||||||
switch (primitiveType)
|
|
||||||
{
|
|
||||||
case PrimitiveType.Points:
|
|
||||||
inPrimitive = "points";
|
|
||||||
break;
|
|
||||||
case PrimitiveType.Lines:
|
|
||||||
case PrimitiveType.LineLoop:
|
|
||||||
case PrimitiveType.LineStrip:
|
|
||||||
inPrimitive = "lines";
|
|
||||||
break;
|
|
||||||
case PrimitiveType.LinesAdjacency:
|
|
||||||
case PrimitiveType.LineStripAdjacency:
|
|
||||||
inPrimitive = "lines_adjacency";
|
|
||||||
break;
|
|
||||||
case PrimitiveType.Triangles:
|
|
||||||
case PrimitiveType.TriangleStrip:
|
|
||||||
case PrimitiveType.TriangleFan:
|
|
||||||
inPrimitive = "triangles";
|
|
||||||
break;
|
|
||||||
case PrimitiveType.TrianglesAdjacency:
|
|
||||||
case PrimitiveType.TriangleStripAdjacency:
|
|
||||||
inPrimitive = "triangles_adjacency";
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
|
|
||||||
program.Replace(DefineNames.InputTopologyName, inPrimitive);
|
|
||||||
}
|
|
||||||
|
|
||||||
ulong address = _context.MemoryManager.Translate(gpuVa);
|
ulong address = _context.MemoryManager.Translate(gpuVa);
|
||||||
|
|
||||||
return new CachedShader(program, codeCached);
|
return new CachedShader(program, codeCached);
|
||||||
|
@ -350,13 +332,66 @@ namespace Ryujinx.Graphics.Gpu.Shader
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
private ShaderCapabilities GetShaderCapabilities()
|
private InputTopology GetPrimitiveTopology()
|
||||||
{
|
{
|
||||||
return new ShaderCapabilities(
|
switch (_context.Methods.PrimitiveType)
|
||||||
_context.Capabilities.MaximumViewportDimensions,
|
{
|
||||||
_context.Capabilities.MaximumComputeSharedMemorySize,
|
case PrimitiveType.Points:
|
||||||
_context.Capabilities.StorageBufferOffsetAlignment,
|
return InputTopology.Points;
|
||||||
_context.Capabilities.SupportsNonConstantTextureOffset);
|
case PrimitiveType.Lines:
|
||||||
|
case PrimitiveType.LineLoop:
|
||||||
|
case PrimitiveType.LineStrip:
|
||||||
|
return InputTopology.Lines;
|
||||||
|
case PrimitiveType.LinesAdjacency:
|
||||||
|
case PrimitiveType.LineStripAdjacency:
|
||||||
|
return InputTopology.LinesAdjacency;
|
||||||
|
case PrimitiveType.Triangles:
|
||||||
|
case PrimitiveType.TriangleStrip:
|
||||||
|
case PrimitiveType.TriangleFan:
|
||||||
|
return InputTopology.Triangles;
|
||||||
|
case PrimitiveType.TrianglesAdjacency:
|
||||||
|
case PrimitiveType.TriangleStripAdjacency:
|
||||||
|
return InputTopology.TrianglesAdjacency;
|
||||||
|
}
|
||||||
|
|
||||||
|
return InputTopology.Points;
|
||||||
|
}
|
||||||
|
|
||||||
|
private bool QueryIsTextureBuffer(GpuState state, int stageIndex, int index)
|
||||||
|
{
|
||||||
|
return GetTextureDescriptor(state, stageIndex, index).UnpackTextureTarget() == TextureTarget.TextureBuffer;
|
||||||
|
}
|
||||||
|
|
||||||
|
private bool QueryIsTextureRectangle(GpuState state, int stageIndex, int index)
|
||||||
|
{
|
||||||
|
var descriptor = GetTextureDescriptor(state, stageIndex, index);
|
||||||
|
|
||||||
|
TextureTarget target = descriptor.UnpackTextureTarget();
|
||||||
|
|
||||||
|
bool is2DTexture = target == TextureTarget.Texture2D ||
|
||||||
|
target == TextureTarget.Texture2DRect;
|
||||||
|
|
||||||
|
return !descriptor.UnpackTextureCoordNormalized() && is2DTexture;
|
||||||
|
}
|
||||||
|
|
||||||
|
private Image.TextureDescriptor GetTextureDescriptor(GpuState state, int stageIndex, int index)
|
||||||
|
{
|
||||||
|
return _context.Methods.TextureManager.GetGraphicsTextureDescriptor(state, stageIndex, index);
|
||||||
|
}
|
||||||
|
|
||||||
|
private int QueryInfoCommon(QueryInfoName info)
|
||||||
|
{
|
||||||
|
switch (info)
|
||||||
|
{
|
||||||
|
case QueryInfoName.MaximumViewportDimensions:
|
||||||
|
return _context.Capabilities.MaximumViewportDimensions;
|
||||||
|
case QueryInfoName.StorageBufferOffsetAlignment:
|
||||||
|
return _context.Capabilities.StorageBufferOffsetAlignment;
|
||||||
|
case QueryInfoName.SupportsNonConstantTextureOffset:
|
||||||
|
return Convert.ToInt32(_context.Capabilities.SupportsNonConstantTextureOffset);
|
||||||
|
}
|
||||||
|
|
||||||
|
return 0;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
|
@ -35,23 +35,11 @@ namespace Ryujinx.Graphics.Shader.CodeGen.Glsl
|
||||||
|
|
||||||
if (context.Config.Stage == ShaderStage.Geometry)
|
if (context.Config.Stage == ShaderStage.Geometry)
|
||||||
{
|
{
|
||||||
string inPrimitive = "points";
|
string inPrimitive = ((InputTopology)context.Config.QueryInfo(QueryInfoName.PrimitiveTopology)).ToGlslString();
|
||||||
|
|
||||||
if ((context.Config.Flags & TranslationFlags.Unspecialized) != 0)
|
|
||||||
{
|
|
||||||
inPrimitive = DefineNames.InputTopologyName;
|
|
||||||
}
|
|
||||||
|
|
||||||
context.AppendLine($"layout ({inPrimitive}) in;");
|
context.AppendLine($"layout ({inPrimitive}) in;");
|
||||||
|
|
||||||
string outPrimitive = "triangle_strip";
|
string outPrimitive = context.Config.OutputTopology.ToGlslString();
|
||||||
|
|
||||||
switch (context.Config.OutputTopology)
|
|
||||||
{
|
|
||||||
case OutputTopology.LineStrip: outPrimitive = "line_strip"; break;
|
|
||||||
case OutputTopology.PointList: outPrimitive = "points"; break;
|
|
||||||
case OutputTopology.TriangleStrip: outPrimitive = "triangle_strip"; break;
|
|
||||||
}
|
|
||||||
|
|
||||||
int maxOutputVertices = context.Config.MaxOutputVertices;
|
int maxOutputVertices = context.Config.MaxOutputVertices;
|
||||||
|
|
||||||
|
@ -75,16 +63,7 @@ namespace Ryujinx.Graphics.Shader.CodeGen.Glsl
|
||||||
|
|
||||||
if (context.Config.Stage == ShaderStage.Compute)
|
if (context.Config.Stage == ShaderStage.Compute)
|
||||||
{
|
{
|
||||||
string size;
|
string size = NumberFormatter.FormatInt(BitUtils.DivRoundUp(context.Config.QueryInfo(QueryInfoName.ComputeSharedMemorySize), 4));
|
||||||
|
|
||||||
if ((context.Config.Flags & TranslationFlags.Unspecialized) != 0)
|
|
||||||
{
|
|
||||||
size = DefineNames.SharedMemorySize;
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
size = NumberFormatter.FormatInt(context.Config.Capabilities.MaximumComputeSharedMemorySize / 4);
|
|
||||||
}
|
|
||||||
|
|
||||||
context.AppendLine($"shared uint {DefaultNames.SharedMemoryName}[{size}];");
|
context.AppendLine($"shared uint {DefaultNames.SharedMemoryName}[{size}];");
|
||||||
context.AppendLine();
|
context.AppendLine();
|
||||||
|
@ -136,19 +115,12 @@ namespace Ryujinx.Graphics.Shader.CodeGen.Glsl
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
string localSizeX = "1";
|
string localSizeX = NumberFormatter.FormatInt(context.Config.QueryInfo(QueryInfoName.ComputeLocalSizeX));
|
||||||
string localSizeY = "1";
|
string localSizeY = NumberFormatter.FormatInt(context.Config.QueryInfo(QueryInfoName.ComputeLocalSizeY));
|
||||||
string localSizeZ = "1";
|
string localSizeZ = NumberFormatter.FormatInt(context.Config.QueryInfo(QueryInfoName.ComputeLocalSizeZ));
|
||||||
|
|
||||||
if ((context.Config.Flags & TranslationFlags.Unspecialized) != 0)
|
|
||||||
{
|
|
||||||
localSizeX = DefineNames.LocalSizeX;
|
|
||||||
localSizeY = DefineNames.LocalSizeY;
|
|
||||||
localSizeZ = DefineNames.LocalSizeZ;
|
|
||||||
}
|
|
||||||
|
|
||||||
context.AppendLine(
|
context.AppendLine(
|
||||||
$"layout (" +
|
"layout (" +
|
||||||
$"local_size_x = {localSizeX}, " +
|
$"local_size_x = {localSizeX}, " +
|
||||||
$"local_size_y = {localSizeY}, " +
|
$"local_size_y = {localSizeY}, " +
|
||||||
$"local_size_z = {localSizeZ}) in;");
|
$"local_size_z = {localSizeZ}) in;");
|
||||||
|
|
|
@ -2,14 +2,6 @@ namespace Ryujinx.Graphics.Shader
|
||||||
{
|
{
|
||||||
public static class DefineNames
|
public static class DefineNames
|
||||||
{
|
{
|
||||||
public const string InputTopologyName = "S_INPUT_TOPOLOGY";
|
|
||||||
|
|
||||||
public const string OutQualifierPrefixName = "S_OUT_QUALIFIER";
|
public const string OutQualifierPrefixName = "S_OUT_QUALIFIER";
|
||||||
|
|
||||||
public const string SharedMemorySize = "S_SHARED_MEMORY_SIZE";
|
|
||||||
|
|
||||||
public const string LocalSizeX = "S_LOCAL_SIZE_X";
|
|
||||||
public const string LocalSizeY = "S_LOCAL_SIZE_Y";
|
|
||||||
public const string LocalSizeZ = "S_LOCAL_SIZE_Z";
|
|
||||||
}
|
}
|
||||||
}
|
}
|
28
Ryujinx.Graphics.Shader/InputTopology.cs
Normal file
28
Ryujinx.Graphics.Shader/InputTopology.cs
Normal file
|
@ -0,0 +1,28 @@
|
||||||
|
namespace Ryujinx.Graphics.Shader
|
||||||
|
{
|
||||||
|
public enum InputTopology
|
||||||
|
{
|
||||||
|
Points,
|
||||||
|
Lines,
|
||||||
|
LinesAdjacency,
|
||||||
|
Triangles,
|
||||||
|
TrianglesAdjacency
|
||||||
|
}
|
||||||
|
|
||||||
|
static class InputTopologyExtensions
|
||||||
|
{
|
||||||
|
public static string ToGlslString(this InputTopology topology)
|
||||||
|
{
|
||||||
|
switch (topology)
|
||||||
|
{
|
||||||
|
case InputTopology.Points: return "points";
|
||||||
|
case InputTopology.Lines: return "lines";
|
||||||
|
case InputTopology.LinesAdjacency: return "lines_adjacency";
|
||||||
|
case InputTopology.Triangles: return "triangles";
|
||||||
|
case InputTopology.TrianglesAdjacency: return "triangles_adjacency";
|
||||||
|
}
|
||||||
|
|
||||||
|
return "points";
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
|
@ -6,4 +6,19 @@ namespace Ryujinx.Graphics.Shader
|
||||||
LineStrip = 6,
|
LineStrip = 6,
|
||||||
TriangleStrip = 7
|
TriangleStrip = 7
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static class OutputTopologyExtensions
|
||||||
|
{
|
||||||
|
public static string ToGlslString(this OutputTopology topology)
|
||||||
|
{
|
||||||
|
switch (topology)
|
||||||
|
{
|
||||||
|
case OutputTopology.LineStrip: return "line_strip";
|
||||||
|
case OutputTopology.PointList: return "points";
|
||||||
|
case OutputTopology.TriangleStrip: return "triangle_strip";
|
||||||
|
}
|
||||||
|
|
||||||
|
return "points";
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
4
Ryujinx.Graphics.Shader/QueryInfoCallback.cs
Normal file
4
Ryujinx.Graphics.Shader/QueryInfoCallback.cs
Normal file
|
@ -0,0 +1,4 @@
|
||||||
|
namespace Ryujinx.Graphics.Shader
|
||||||
|
{
|
||||||
|
public delegate int QueryInfoCallback(QueryInfoName info, int index);
|
||||||
|
}
|
17
Ryujinx.Graphics.Shader/QueryInfoName.cs
Normal file
17
Ryujinx.Graphics.Shader/QueryInfoName.cs
Normal file
|
@ -0,0 +1,17 @@
|
||||||
|
namespace Ryujinx.Graphics.Shader
|
||||||
|
{
|
||||||
|
public enum QueryInfoName
|
||||||
|
{
|
||||||
|
ComputeLocalSizeX,
|
||||||
|
ComputeLocalSizeY,
|
||||||
|
ComputeLocalSizeZ,
|
||||||
|
ComputeSharedMemorySize,
|
||||||
|
IsTextureBuffer,
|
||||||
|
IsTextureRectangle,
|
||||||
|
MaximumViewportDimensions,
|
||||||
|
PrimitiveTopology,
|
||||||
|
StorageBufferOffsetAlignment,
|
||||||
|
SupportsNonConstantTextureOffset,
|
||||||
|
ViewportTransformEnable
|
||||||
|
}
|
||||||
|
}
|
|
@ -1,27 +0,0 @@
|
||||||
namespace Ryujinx.Graphics.Shader
|
|
||||||
{
|
|
||||||
public struct ShaderCapabilities
|
|
||||||
{
|
|
||||||
// Initialize with default values for Maxwell.
|
|
||||||
private static readonly ShaderCapabilities _default = new ShaderCapabilities(0x8000, 0xc000, 16, true);
|
|
||||||
|
|
||||||
public static ShaderCapabilities Default => _default;
|
|
||||||
|
|
||||||
public int MaximumViewportDimensions { get; }
|
|
||||||
public int MaximumComputeSharedMemorySize { get; }
|
|
||||||
public int StorageBufferOffsetAlignment { get; }
|
|
||||||
public bool SupportsNonConstantTextureOffset { get; }
|
|
||||||
|
|
||||||
public ShaderCapabilities(
|
|
||||||
int maximumViewportDimensions,
|
|
||||||
int maximumComputeSharedMemorySize,
|
|
||||||
int storageBufferOffsetAlignment,
|
|
||||||
bool supportsNonConstantTextureOffset)
|
|
||||||
{
|
|
||||||
MaximumViewportDimensions = maximumViewportDimensions;
|
|
||||||
MaximumComputeSharedMemorySize = maximumComputeSharedMemorySize;
|
|
||||||
StorageBufferOffsetAlignment = storageBufferOffsetAlignment;
|
|
||||||
SupportsNonConstantTextureOffset = supportsNonConstantTextureOffset;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,4 +1,5 @@
|
||||||
using Ryujinx.Graphics.Shader.Translation;
|
using Ryujinx.Graphics.Shader.Translation;
|
||||||
|
using System;
|
||||||
|
|
||||||
namespace Ryujinx.Graphics.Shader
|
namespace Ryujinx.Graphics.Shader
|
||||||
{
|
{
|
||||||
|
@ -6,26 +7,100 @@ namespace Ryujinx.Graphics.Shader
|
||||||
{
|
{
|
||||||
public ShaderStage Stage { get; }
|
public ShaderStage Stage { get; }
|
||||||
|
|
||||||
public ShaderCapabilities Capabilities { get; }
|
public OutputTopology OutputTopology { get; }
|
||||||
|
|
||||||
public TranslationFlags Flags { get; }
|
|
||||||
|
|
||||||
public int MaxOutputVertices { get; }
|
public int MaxOutputVertices { get; }
|
||||||
|
|
||||||
public OutputTopology OutputTopology { get; }
|
public OutputMapTarget[] OmapTargets { get; }
|
||||||
|
public bool OmapSampleMask { get; }
|
||||||
|
public bool OmapDepth { get; }
|
||||||
|
|
||||||
public ShaderConfig(
|
public TranslationFlags Flags { get; }
|
||||||
ShaderStage stage,
|
|
||||||
ShaderCapabilities capabilities,
|
private QueryInfoCallback _queryInfoCallback;
|
||||||
TranslationFlags flags,
|
|
||||||
int maxOutputVertices,
|
public ShaderConfig(TranslationFlags flags, QueryInfoCallback queryInfoCallback)
|
||||||
OutputTopology outputTopology)
|
|
||||||
{
|
{
|
||||||
Stage = stage;
|
Stage = ShaderStage.Compute;
|
||||||
Capabilities = capabilities;
|
OutputTopology = OutputTopology.PointList;
|
||||||
Flags = flags;
|
MaxOutputVertices = 0;
|
||||||
MaxOutputVertices = maxOutputVertices;
|
OmapTargets = null;
|
||||||
OutputTopology = outputTopology;
|
OmapSampleMask = false;
|
||||||
|
OmapDepth = false;
|
||||||
|
Flags = flags;
|
||||||
|
_queryInfoCallback = queryInfoCallback;
|
||||||
|
}
|
||||||
|
|
||||||
|
public ShaderConfig(ShaderHeader header, TranslationFlags flags, QueryInfoCallback queryInfoCallback)
|
||||||
|
{
|
||||||
|
Stage = header.Stage;
|
||||||
|
OutputTopology = header.OutputTopology;
|
||||||
|
MaxOutputVertices = header.MaxOutputVertexCount;
|
||||||
|
OmapTargets = header.OmapTargets;
|
||||||
|
OmapSampleMask = header.OmapSampleMask;
|
||||||
|
OmapDepth = header.OmapDepth;
|
||||||
|
Flags = flags;
|
||||||
|
_queryInfoCallback = queryInfoCallback;
|
||||||
|
}
|
||||||
|
|
||||||
|
public int GetDepthRegister()
|
||||||
|
{
|
||||||
|
int count = 0;
|
||||||
|
|
||||||
|
for (int index = 0; index < OmapTargets.Length; index++)
|
||||||
|
{
|
||||||
|
for (int component = 0; component < 4; component++)
|
||||||
|
{
|
||||||
|
if (OmapTargets[index].ComponentEnabled(component))
|
||||||
|
{
|
||||||
|
count++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// The depth register is always two registers after the last color output.
|
||||||
|
return count + 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
public bool QueryInfoBool(QueryInfoName info, int index = 0)
|
||||||
|
{
|
||||||
|
return Convert.ToBoolean(QueryInfo(info, index));
|
||||||
|
}
|
||||||
|
|
||||||
|
public int QueryInfo(QueryInfoName info, int index = 0)
|
||||||
|
{
|
||||||
|
if (_queryInfoCallback != null)
|
||||||
|
{
|
||||||
|
return _queryInfoCallback(info, index);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
switch (info)
|
||||||
|
{
|
||||||
|
case QueryInfoName.ComputeLocalSizeX:
|
||||||
|
case QueryInfoName.ComputeLocalSizeY:
|
||||||
|
case QueryInfoName.ComputeLocalSizeZ:
|
||||||
|
return 1;
|
||||||
|
case QueryInfoName.ComputeSharedMemorySize:
|
||||||
|
return 0xc000;
|
||||||
|
case QueryInfoName.IsTextureBuffer:
|
||||||
|
return Convert.ToInt32(false);
|
||||||
|
case QueryInfoName.IsTextureRectangle:
|
||||||
|
return Convert.ToInt32(false);
|
||||||
|
case QueryInfoName.MaximumViewportDimensions:
|
||||||
|
return 0x8000;
|
||||||
|
case QueryInfoName.PrimitiveTopology:
|
||||||
|
return (int)InputTopology.Points;
|
||||||
|
case QueryInfoName.StorageBufferOffsetAlignment:
|
||||||
|
return 16;
|
||||||
|
case QueryInfoName.SupportsNonConstantTextureOffset:
|
||||||
|
return Convert.ToInt32(true);
|
||||||
|
case QueryInfoName.ViewportTransformEnable:
|
||||||
|
return Convert.ToInt32(true);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return 0;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
|
@ -76,28 +76,6 @@ namespace Ryujinx.Graphics.Shader
|
||||||
public bool OmapSampleMask { get; }
|
public bool OmapSampleMask { get; }
|
||||||
public bool OmapDepth { get; }
|
public bool OmapDepth { get; }
|
||||||
|
|
||||||
public int DepthRegister
|
|
||||||
{
|
|
||||||
get
|
|
||||||
{
|
|
||||||
int count = 0;
|
|
||||||
|
|
||||||
for (int index = 0; index < OmapTargets.Length; index++)
|
|
||||||
{
|
|
||||||
for (int component = 0; component < 4; component++)
|
|
||||||
{
|
|
||||||
if (OmapTargets[index].ComponentEnabled(component))
|
|
||||||
{
|
|
||||||
count++;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Depth register is always two registers after the last color output.
|
|
||||||
return count + 1;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
public ShaderHeader(Span<byte> code)
|
public ShaderHeader(Span<byte> code)
|
||||||
{
|
{
|
||||||
Span<int> header = MemoryMarshal.Cast<byte, int>(code);
|
Span<int> header = MemoryMarshal.Cast<byte, int>(code);
|
||||||
|
|
|
@ -11,25 +11,15 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
public Block CurrBlock { get; set; }
|
public Block CurrBlock { get; set; }
|
||||||
public OpCode CurrOp { get; set; }
|
public OpCode CurrOp { get; set; }
|
||||||
|
|
||||||
private ShaderStage _stage;
|
private ShaderConfig _config;
|
||||||
private ShaderHeader _header;
|
|
||||||
private ShaderCapabilities _capabilities;
|
|
||||||
private TranslationFlags _flags;
|
|
||||||
|
|
||||||
private List<Operation> _operations;
|
private List<Operation> _operations;
|
||||||
|
|
||||||
private Dictionary<ulong, Operand> _labels;
|
private Dictionary<ulong, Operand> _labels;
|
||||||
|
|
||||||
public EmitterContext(
|
public EmitterContext(ShaderConfig config)
|
||||||
ShaderStage stage,
|
|
||||||
ShaderHeader header,
|
|
||||||
ShaderCapabilities capabilities,
|
|
||||||
TranslationFlags flags)
|
|
||||||
{
|
{
|
||||||
_stage = stage;
|
_config = config;
|
||||||
_header = header;
|
|
||||||
_capabilities = capabilities;
|
|
||||||
_flags = flags;
|
|
||||||
|
|
||||||
_operations = new List<Operation>();
|
_operations = new List<Operation>();
|
||||||
|
|
||||||
|
@ -69,24 +59,24 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
|
|
||||||
public void PrepareForReturn()
|
public void PrepareForReturn()
|
||||||
{
|
{
|
||||||
if (_stage == ShaderStage.Vertex)
|
if (_config.Stage == ShaderStage.Vertex)
|
||||||
{
|
{
|
||||||
if ((_flags & TranslationFlags.DividePosXY) != 0)
|
if (!_config.QueryInfoBool(QueryInfoName.ViewportTransformEnable))
|
||||||
{
|
{
|
||||||
Operand posX = Attribute(AttributeConsts.PositionX);
|
Operand posX = Attribute(AttributeConsts.PositionX);
|
||||||
Operand posY = Attribute(AttributeConsts.PositionY);
|
Operand posY = Attribute(AttributeConsts.PositionY);
|
||||||
|
|
||||||
this.Copy(posX, this.FPDivide(posX, ConstF(_capabilities.MaximumViewportDimensions / 2)));
|
this.Copy(posX, this.FPDivide(posX, ConstF(_config.QueryInfo(QueryInfoName.MaximumViewportDimensions) / 2)));
|
||||||
this.Copy(posY, this.FPDivide(posY, ConstF(_capabilities.MaximumViewportDimensions / 2)));
|
this.Copy(posY, this.FPDivide(posY, ConstF(_config.QueryInfo(QueryInfoName.MaximumViewportDimensions) / 2)));
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else if (_stage == ShaderStage.Fragment)
|
else if (_config.Stage == ShaderStage.Fragment)
|
||||||
{
|
{
|
||||||
if (_header.OmapDepth)
|
if (_config.OmapDepth)
|
||||||
{
|
{
|
||||||
Operand dest = Attribute(AttributeConsts.FragmentOutputDepth);
|
Operand dest = Attribute(AttributeConsts.FragmentOutputDepth);
|
||||||
|
|
||||||
Operand src = Register(_header.DepthRegister, RegisterType.Gpr);
|
Operand src = Register(_config.GetDepthRegister(), RegisterType.Gpr);
|
||||||
|
|
||||||
this.Copy(dest, src);
|
this.Copy(dest, src);
|
||||||
}
|
}
|
||||||
|
@ -95,7 +85,7 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
|
|
||||||
for (int attachment = 0; attachment < 8; attachment++)
|
for (int attachment = 0; attachment < 8; attachment++)
|
||||||
{
|
{
|
||||||
OutputMapTarget target = _header.OmapTargets[attachment];
|
OutputMapTarget target = _config.OmapTargets[attachment];
|
||||||
|
|
||||||
for (int component = 0; component < 4; component++)
|
for (int component = 0; component < 4; component++)
|
||||||
{
|
{
|
||||||
|
|
|
@ -27,9 +27,9 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
node = RewriteGlobalAccess(node, config);
|
node = RewriteGlobalAccess(node, config);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (!config.Capabilities.SupportsNonConstantTextureOffset && operation.Inst == Instruction.TextureSample)
|
if (operation.Inst == Instruction.TextureSample)
|
||||||
{
|
{
|
||||||
node = RewriteTextureSample(node);
|
node = RewriteTextureSample(node, config);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -79,7 +79,7 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
sbSlot = PrependOperation(Instruction.ConditionalSelect, inRange, Const(slot), sbSlot);
|
sbSlot = PrependOperation(Instruction.ConditionalSelect, inRange, Const(slot), sbSlot);
|
||||||
}
|
}
|
||||||
|
|
||||||
Operand alignMask = Const(-config.Capabilities.StorageBufferOffsetAlignment);
|
Operand alignMask = Const(-config.QueryInfo(QueryInfoName.StorageBufferOffsetAlignment));
|
||||||
|
|
||||||
Operand baseAddrTrunc = PrependOperation(Instruction.BitwiseAnd, sbBaseAddrLow, Const(-64));
|
Operand baseAddrTrunc = PrependOperation(Instruction.BitwiseAnd, sbBaseAddrLow, Const(-64));
|
||||||
Operand byteOffset = PrependOperation(Instruction.Subtract, addrLow, baseAddrTrunc);
|
Operand byteOffset = PrependOperation(Instruction.Subtract, addrLow, baseAddrTrunc);
|
||||||
|
@ -124,23 +124,18 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
return node;
|
return node;
|
||||||
}
|
}
|
||||||
|
|
||||||
private static LinkedListNode<INode> RewriteTextureSample(LinkedListNode<INode> node)
|
private static LinkedListNode<INode> RewriteTextureSample(LinkedListNode<INode> node, ShaderConfig config)
|
||||||
{
|
{
|
||||||
// Technically, non-constant texture offsets are not allowed (according to the spec),
|
|
||||||
// however some GPUs does support that.
|
|
||||||
// For GPUs where it is not supported, we can replace the instruction with the following:
|
|
||||||
// For texture*Offset, we replace it by texture*, and add the offset to the P coords.
|
|
||||||
// The offset can be calculated as offset / textureSize(lod), where lod = textureQueryLod(coords).
|
|
||||||
// For texelFetchOffset, we replace it by texelFetch and add the offset to the P coords directly.
|
|
||||||
// For textureGatherOffset, we take advantage of the fact that the operation is already broken down
|
|
||||||
// to read the 4 pixels separately, and just replace it with 4 textureGather with a different offset
|
|
||||||
// for each pixel.
|
|
||||||
TextureOperation texOp = (TextureOperation)node.Value;
|
TextureOperation texOp = (TextureOperation)node.Value;
|
||||||
|
|
||||||
bool hasOffset = (texOp.Flags & TextureFlags.Offset) != 0;
|
bool hasOffset = (texOp.Flags & TextureFlags.Offset) != 0;
|
||||||
bool hasOffsets = (texOp.Flags & TextureFlags.Offsets) != 0;
|
bool hasOffsets = (texOp.Flags & TextureFlags.Offsets) != 0;
|
||||||
|
|
||||||
if (!(hasOffset || hasOffsets))
|
bool hasInvalidOffset = (hasOffset || hasOffsets) && !config.QueryInfoBool(QueryInfoName.SupportsNonConstantTextureOffset);
|
||||||
|
|
||||||
|
bool isRect = config.QueryInfoBool(QueryInfoName.IsTextureRectangle, texOp.Handle);
|
||||||
|
|
||||||
|
if (!(hasInvalidOffset || isRect))
|
||||||
{
|
{
|
||||||
return node;
|
return node;
|
||||||
}
|
}
|
||||||
|
@ -159,14 +154,24 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
|
|
||||||
int coordsCount = texOp.Type.GetDimensions();
|
int coordsCount = texOp.Type.GetDimensions();
|
||||||
|
|
||||||
int offsetsCount = coordsCount * (hasOffsets ? 4 : 1);
|
int offsetsCount;
|
||||||
|
|
||||||
|
if (hasOffsets)
|
||||||
|
{
|
||||||
|
offsetsCount = coordsCount * 4;
|
||||||
|
}
|
||||||
|
else if (hasOffset)
|
||||||
|
{
|
||||||
|
offsetsCount = coordsCount;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
offsetsCount = 0;
|
||||||
|
}
|
||||||
|
|
||||||
Operand[] offsets = new Operand[offsetsCount];
|
Operand[] offsets = new Operand[offsetsCount];
|
||||||
Operand[] sources = new Operand[texOp.SourcesCount - offsetsCount];
|
Operand[] sources = new Operand[texOp.SourcesCount - offsetsCount];
|
||||||
|
|
||||||
int srcIndex = 0;
|
|
||||||
int dstIndex = 0;
|
|
||||||
|
|
||||||
int copyCount = 0;
|
int copyCount = 0;
|
||||||
|
|
||||||
if (isBindless || isIndexed)
|
if (isBindless || isIndexed)
|
||||||
|
@ -207,6 +212,9 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
copyCount++;
|
copyCount++;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
int srcIndex = 0;
|
||||||
|
int dstIndex = 0;
|
||||||
|
|
||||||
for (int index = 0; index < copyCount; index++)
|
for (int index = 0; index < copyCount; index++)
|
||||||
{
|
{
|
||||||
sources[dstIndex++] = texOp.GetSource(srcIndex++);
|
sources[dstIndex++] = texOp.GetSource(srcIndex++);
|
||||||
|
@ -223,7 +231,9 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
offsets[index] = offset;
|
offsets[index] = offset;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (areAllOffsetsConstant)
|
hasInvalidOffset &= !areAllOffsetsConstant;
|
||||||
|
|
||||||
|
if (!(hasInvalidOffset || isRect))
|
||||||
{
|
{
|
||||||
return node;
|
return node;
|
||||||
}
|
}
|
||||||
|
@ -240,50 +250,32 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
|
|
||||||
int coordsIndex = isBindless || isIndexed ? 1 : 0;
|
int coordsIndex = isBindless || isIndexed ? 1 : 0;
|
||||||
|
|
||||||
if (intCoords)
|
int componentIndex = texOp.Index;
|
||||||
|
|
||||||
|
Operand Int(Operand value)
|
||||||
{
|
{
|
||||||
for (int index = 0; index < coordsCount; index++)
|
Operand res = Local();
|
||||||
{
|
|
||||||
Operand source = sources[coordsIndex + index];
|
|
||||||
|
|
||||||
Operand coordPlusOffset = Local();
|
node.List.AddBefore(node, new Operation(Instruction.ConvertFPToS32, res, value));
|
||||||
|
|
||||||
node.List.AddBefore(node, new Operation(Instruction.Add, coordPlusOffset, source, offsets[index]));
|
return res;
|
||||||
|
|
||||||
sources[coordsIndex + index] = coordPlusOffset;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
else
|
|
||||||
|
Operand Float(Operand value)
|
||||||
{
|
{
|
||||||
Operand lod = Local();
|
Operand res = Local();
|
||||||
|
|
||||||
node.List.AddBefore(node, new TextureOperation(
|
node.List.AddBefore(node, new Operation(Instruction.ConvertS32ToFP, res, value));
|
||||||
Instruction.Lod,
|
|
||||||
texOp.Type,
|
|
||||||
texOp.Flags,
|
|
||||||
texOp.Handle,
|
|
||||||
1,
|
|
||||||
lod,
|
|
||||||
lodSources));
|
|
||||||
|
|
||||||
Operand Int(Operand value)
|
return res;
|
||||||
{
|
}
|
||||||
Operand res = Local();
|
|
||||||
|
|
||||||
node.List.AddBefore(node, new Operation(Instruction.ConvertFPToS32, res, value));
|
|
||||||
|
|
||||||
return res;
|
|
||||||
}
|
|
||||||
|
|
||||||
Operand Float(Operand value)
|
|
||||||
{
|
|
||||||
Operand res = Local();
|
|
||||||
|
|
||||||
node.List.AddBefore(node, new Operation(Instruction.ConvertS32ToFP, res, value));
|
|
||||||
|
|
||||||
return res;
|
|
||||||
}
|
|
||||||
|
|
||||||
|
// Emulate texture rectangle by normalizing the coordinates on the shader.
|
||||||
|
// When sampler*Rect is used, the coords are expected to the in the [0, W or H] range,
|
||||||
|
// and otherwise, it is expected to be in the [0, 1] range.
|
||||||
|
// We normalize by dividing the coords by the texture size.
|
||||||
|
if (isRect && !intCoords)
|
||||||
|
{
|
||||||
for (int index = 0; index < coordsCount; index++)
|
for (int index = 0; index < coordsCount; index++)
|
||||||
{
|
{
|
||||||
Operand coordSize = Local();
|
Operand coordSize = Local();
|
||||||
|
@ -292,11 +284,11 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
|
|
||||||
if (isBindless || isIndexed)
|
if (isBindless || isIndexed)
|
||||||
{
|
{
|
||||||
texSizeSources = new Operand[] { sources[0], Int(lod) };
|
texSizeSources = new Operand[] { sources[0], Const(0) };
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
texSizeSources = new Operand[] { Int(lod) };
|
texSizeSources = new Operand[] { Const(0) };
|
||||||
}
|
}
|
||||||
|
|
||||||
node.List.AddBefore(node, new TextureOperation(
|
node.List.AddBefore(node, new TextureOperation(
|
||||||
|
@ -308,35 +300,101 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
coordSize,
|
coordSize,
|
||||||
texSizeSources));
|
texSizeSources));
|
||||||
|
|
||||||
Operand offset = Local();
|
|
||||||
|
|
||||||
Operand intOffset = offsets[index + (hasOffsets ? texOp.Index * coordsCount : 0)];
|
|
||||||
|
|
||||||
node.List.AddBefore(node, new Operation(Instruction.FP | Instruction.Divide, offset, Float(intOffset), Float(coordSize)));
|
|
||||||
|
|
||||||
Operand source = sources[coordsIndex + index];
|
Operand source = sources[coordsIndex + index];
|
||||||
|
|
||||||
Operand coordPlusOffset = Local();
|
Operand coordNormalized = Local();
|
||||||
|
|
||||||
node.List.AddBefore(node, new Operation(Instruction.FP | Instruction.Add, coordPlusOffset, source, offset));
|
node.List.AddBefore(node, new Operation(Instruction.FP | Instruction.Divide, coordNormalized, source, Float(coordSize)));
|
||||||
|
|
||||||
sources[coordsIndex + index] = coordPlusOffset;
|
sources[coordsIndex + index] = coordNormalized;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
int componentIndex;
|
// Technically, non-constant texture offsets are not allowed (according to the spec),
|
||||||
|
// however some GPUs does support that.
|
||||||
if (isGather && !isShadow)
|
// For GPUs where it is not supported, we can replace the instruction with the following:
|
||||||
|
// For texture*Offset, we replace it by texture*, and add the offset to the P coords.
|
||||||
|
// The offset can be calculated as offset / textureSize(lod), where lod = textureQueryLod(coords).
|
||||||
|
// For texelFetchOffset, we replace it by texelFetch and add the offset to the P coords directly.
|
||||||
|
// For textureGatherOffset, we take advantage of the fact that the operation is already broken down
|
||||||
|
// to read the 4 pixels separately, and just replace it with 4 textureGather with a different offset
|
||||||
|
// for each pixel.
|
||||||
|
if (hasInvalidOffset)
|
||||||
{
|
{
|
||||||
Operand gatherComponent = sources[dstIndex - 1];
|
if (intCoords)
|
||||||
|
{
|
||||||
|
for (int index = 0; index < coordsCount; index++)
|
||||||
|
{
|
||||||
|
Operand source = sources[coordsIndex + index];
|
||||||
|
|
||||||
Debug.Assert(gatherComponent.Type == OperandType.Constant);
|
Operand coordPlusOffset = Local();
|
||||||
|
|
||||||
componentIndex = gatherComponent.Value;
|
node.List.AddBefore(node, new Operation(Instruction.Add, coordPlusOffset, source, offsets[index]));
|
||||||
}
|
|
||||||
else
|
sources[coordsIndex + index] = coordPlusOffset;
|
||||||
{
|
}
|
||||||
componentIndex = texOp.Index;
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
Operand lod = Local();
|
||||||
|
|
||||||
|
node.List.AddBefore(node, new TextureOperation(
|
||||||
|
Instruction.Lod,
|
||||||
|
texOp.Type,
|
||||||
|
texOp.Flags,
|
||||||
|
texOp.Handle,
|
||||||
|
1,
|
||||||
|
lod,
|
||||||
|
lodSources));
|
||||||
|
|
||||||
|
for (int index = 0; index < coordsCount; index++)
|
||||||
|
{
|
||||||
|
Operand coordSize = Local();
|
||||||
|
|
||||||
|
Operand[] texSizeSources;
|
||||||
|
|
||||||
|
if (isBindless || isIndexed)
|
||||||
|
{
|
||||||
|
texSizeSources = new Operand[] { sources[0], Int(lod) };
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
texSizeSources = new Operand[] { Int(lod) };
|
||||||
|
}
|
||||||
|
|
||||||
|
node.List.AddBefore(node, new TextureOperation(
|
||||||
|
Instruction.TextureSize,
|
||||||
|
texOp.Type,
|
||||||
|
texOp.Flags,
|
||||||
|
texOp.Handle,
|
||||||
|
index,
|
||||||
|
coordSize,
|
||||||
|
texSizeSources));
|
||||||
|
|
||||||
|
Operand offset = Local();
|
||||||
|
|
||||||
|
Operand intOffset = offsets[index + (hasOffsets ? texOp.Index * coordsCount : 0)];
|
||||||
|
|
||||||
|
node.List.AddBefore(node, new Operation(Instruction.FP | Instruction.Divide, offset, Float(intOffset), Float(coordSize)));
|
||||||
|
|
||||||
|
Operand source = sources[coordsIndex + index];
|
||||||
|
|
||||||
|
Operand coordPlusOffset = Local();
|
||||||
|
|
||||||
|
node.List.AddBefore(node, new Operation(Instruction.FP | Instruction.Add, coordPlusOffset, source, offset));
|
||||||
|
|
||||||
|
sources[coordsIndex + index] = coordPlusOffset;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (isGather && !isShadow)
|
||||||
|
{
|
||||||
|
Operand gatherComponent = sources[dstIndex - 1];
|
||||||
|
|
||||||
|
Debug.Assert(gatherComponent.Type == OperandType.Constant);
|
||||||
|
|
||||||
|
componentIndex = gatherComponent.Value;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
TextureOperation newTexOp = new TextureOperation(
|
TextureOperation newTexOp = new TextureOperation(
|
||||||
|
|
|
@ -52,7 +52,7 @@ namespace Ryujinx.Graphics.Shader.Translation.Optimizations
|
||||||
|
|
||||||
Operand baseAddrTrunc = Local();
|
Operand baseAddrTrunc = Local();
|
||||||
|
|
||||||
Operand alignMask = Const(-config.Capabilities.StorageBufferOffsetAlignment);
|
Operand alignMask = Const(-config.QueryInfo(QueryInfoName.StorageBufferOffsetAlignment));
|
||||||
|
|
||||||
Operation andOp = new Operation(Instruction.BitwiseAnd, baseAddrTrunc, baseAddrLow, alignMask);
|
Operation andOp = new Operation(Instruction.BitwiseAnd, baseAddrTrunc, baseAddrLow, alignMask);
|
||||||
|
|
||||||
|
|
|
@ -4,9 +4,7 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
{
|
{
|
||||||
None = 0,
|
None = 0,
|
||||||
|
|
||||||
Compute = 1 << 0,
|
Compute = 1 << 0,
|
||||||
DebugMode = 1 << 1,
|
DebugMode = 1 << 1
|
||||||
Unspecialized = 1 << 2,
|
|
||||||
DividePosXY = 1 << 3
|
|
||||||
}
|
}
|
||||||
}
|
}
|
|
@ -16,14 +16,7 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
|
|
||||||
public static Span<byte> ExtractCode(Span<byte> code, bool compute, out int headerSize)
|
public static Span<byte> ExtractCode(Span<byte> code, bool compute, out int headerSize)
|
||||||
{
|
{
|
||||||
if (compute)
|
headerSize = compute ? 0 : HeaderSize;
|
||||||
{
|
|
||||||
headerSize = 0;
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
headerSize = HeaderSize;
|
|
||||||
}
|
|
||||||
|
|
||||||
Block[] cfg = Decoder.Decode(code, (ulong)headerSize);
|
Block[] cfg = Decoder.Decode(code, (ulong)headerSize);
|
||||||
|
|
||||||
|
@ -47,56 +40,21 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
return code.Slice(0, headerSize + (int)endAddress);
|
return code.Slice(0, headerSize + (int)endAddress);
|
||||||
}
|
}
|
||||||
|
|
||||||
public static ShaderProgram Translate(Span<byte> code, ShaderCapabilities capabilities, TranslationFlags flags)
|
public static ShaderProgram Translate(Span<byte> code, QueryInfoCallback queryInfoCallback, TranslationFlags flags)
|
||||||
{
|
{
|
||||||
bool compute = (flags & TranslationFlags.Compute) != 0;
|
bool compute = (flags & TranslationFlags.Compute) != 0;
|
||||||
|
|
||||||
Operation[] ops = DecodeShader(code, capabilities, flags, out ShaderHeader header, out int size);
|
Operation[] ops = DecodeShader(code, queryInfoCallback, flags, out ShaderConfig config, out int size);
|
||||||
|
|
||||||
ShaderStage stage;
|
|
||||||
|
|
||||||
if (compute)
|
|
||||||
{
|
|
||||||
stage = ShaderStage.Compute;
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
stage = header.Stage;
|
|
||||||
}
|
|
||||||
|
|
||||||
int maxOutputVertexCount = 0;
|
|
||||||
|
|
||||||
OutputTopology outputTopology = OutputTopology.LineStrip;
|
|
||||||
|
|
||||||
if (!compute)
|
|
||||||
{
|
|
||||||
maxOutputVertexCount = header.MaxOutputVertexCount;
|
|
||||||
outputTopology = header.OutputTopology;
|
|
||||||
}
|
|
||||||
|
|
||||||
ShaderConfig config = new ShaderConfig(
|
|
||||||
stage,
|
|
||||||
capabilities,
|
|
||||||
flags,
|
|
||||||
maxOutputVertexCount,
|
|
||||||
outputTopology);
|
|
||||||
|
|
||||||
return Translate(ops, config, size);
|
return Translate(ops, config, size);
|
||||||
}
|
}
|
||||||
|
|
||||||
public static ShaderProgram Translate(Span<byte> vpACode, Span<byte> vpBCode, ShaderCapabilities capabilities, TranslationFlags flags)
|
public static ShaderProgram Translate(Span<byte> vpACode, Span<byte> vpBCode, QueryInfoCallback queryInfoCallback, TranslationFlags flags)
|
||||||
{
|
{
|
||||||
bool debugMode = (flags & TranslationFlags.DebugMode) != 0;
|
bool debugMode = (flags & TranslationFlags.DebugMode) != 0;
|
||||||
|
|
||||||
Operation[] vpAOps = DecodeShader(vpACode, capabilities, flags, out _, out _);
|
Operation[] vpAOps = DecodeShader(vpACode, queryInfoCallback, flags, out _, out _);
|
||||||
Operation[] vpBOps = DecodeShader(vpBCode, capabilities, flags, out ShaderHeader header, out int sizeB);
|
Operation[] vpBOps = DecodeShader(vpBCode, queryInfoCallback, flags, out ShaderConfig config, out int sizeB);
|
||||||
|
|
||||||
ShaderConfig config = new ShaderConfig(
|
|
||||||
header.Stage,
|
|
||||||
capabilities,
|
|
||||||
flags,
|
|
||||||
header.MaxOutputVertexCount,
|
|
||||||
header.OutputTopology);
|
|
||||||
|
|
||||||
return Translate(Combine(vpAOps, vpBOps), config, sizeB);
|
return Translate(Combine(vpAOps, vpBOps), config, sizeB);
|
||||||
}
|
}
|
||||||
|
@ -136,31 +94,25 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
}
|
}
|
||||||
|
|
||||||
private static Operation[] DecodeShader(
|
private static Operation[] DecodeShader(
|
||||||
Span<byte> code,
|
Span<byte> code,
|
||||||
ShaderCapabilities capabilities,
|
QueryInfoCallback queryInfoCallback,
|
||||||
TranslationFlags flags,
|
TranslationFlags flags,
|
||||||
out ShaderHeader header,
|
out ShaderConfig config,
|
||||||
out int size)
|
out int size)
|
||||||
{
|
{
|
||||||
Block[] cfg;
|
Block[] cfg;
|
||||||
|
|
||||||
EmitterContext context;
|
|
||||||
|
|
||||||
if ((flags & TranslationFlags.Compute) != 0)
|
if ((flags & TranslationFlags.Compute) != 0)
|
||||||
{
|
{
|
||||||
header = null;
|
config = new ShaderConfig(flags, queryInfoCallback);
|
||||||
|
|
||||||
cfg = Decoder.Decode(code, 0);
|
cfg = Decoder.Decode(code, 0);
|
||||||
|
|
||||||
context = new EmitterContext(ShaderStage.Compute, header, capabilities, flags);
|
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
header = new ShaderHeader(code);
|
config = new ShaderConfig(new ShaderHeader(code), flags, queryInfoCallback);
|
||||||
|
|
||||||
cfg = Decoder.Decode(code, HeaderSize);
|
cfg = Decoder.Decode(code, HeaderSize);
|
||||||
|
|
||||||
context = new EmitterContext(header.Stage, header, capabilities, flags);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cfg == null)
|
if (cfg == null)
|
||||||
|
@ -172,6 +124,8 @@ namespace Ryujinx.Graphics.Shader.Translation
|
||||||
return new Operation[0];
|
return new Operation[0];
|
||||||
}
|
}
|
||||||
|
|
||||||
|
EmitterContext context = new EmitterContext(config);
|
||||||
|
|
||||||
ulong maxEndAddress = 0;
|
ulong maxEndAddress = 0;
|
||||||
|
|
||||||
for (int blkIndex = 0; blkIndex < cfg.Length; blkIndex++)
|
for (int blkIndex = 0; blkIndex < cfg.Length; blkIndex++)
|
||||||
|
|
|
@ -20,7 +20,7 @@ namespace Ryujinx.ShaderTools
|
||||||
|
|
||||||
byte[] data = File.ReadAllBytes(args[args.Length - 1]);
|
byte[] data = File.ReadAllBytes(args[args.Length - 1]);
|
||||||
|
|
||||||
string code = Translator.Translate(data, ShaderCapabilities.Default, flags).Code;
|
string code = Translator.Translate(data, null, flags).Code;
|
||||||
|
|
||||||
Console.WriteLine(code);
|
Console.WriteLine(code);
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue