using Ryujinx.Graphics.Gpu.Engine.Types;
using System;
using System.Runtime.CompilerServices;

namespace Ryujinx.Graphics.Gpu.Engine.Compute
{
    // The enums below are produced by casting raw bit fields of ComputeQmd, so each
    // member's numeric value is the field encoding. The values are spelled out
    // explicitly; they are the same ones declaration order would assign.

    /// <summary>
    /// Type of the dependent Queue Meta Data.
    /// </summary>
    enum DependentQmdType
    {
        Queue = 0,
        Grid = 1,
    }

    /// <summary>
    /// Type of the release memory barrier.
    /// </summary>
    enum ReleaseMembarType
    {
        FeNone = 0,
        FeSysmembar = 1,
    }

    /// <summary>
    /// Type of the CWD memory barrier.
    /// </summary>
    enum CwdMembarType
    {
        L1None = 0,
        L1Sysmembar = 1,
        L1Membar = 2,
    }

    /// <summary>
    /// NaN behavior of 32-bits float operations on the shader.
    /// </summary>
    enum Fp32NanBehavior
    {
        Legacy = 0,
        Fp64Compatible = 1,
    }

    /// <summary>
    /// NaN behavior of 32-bits float to integer conversion on the shader.
    /// </summary>
    enum Fp32F2iNanBehavior
    {
        PassZero = 0,
        PassIndefinite = 1,
    }

    /// <summary>
    /// Limit of calls.
    /// </summary>
    enum ApiVisibleCallLimit
    {
        _32 = 0,
        NoCheck = 1,
    }

    /// <summary>
    /// Shared memory bank mapping mode.
    /// </summary>
    enum SharedMemoryBankMapping
    {
        FourBytesPerBank = 0,
        EightBytesPerBank = 1,
    }

    /// <summary>
    /// Denormal behavior of 32-bits float narrowing instructions.
    /// </summary>
    enum Fp32NarrowInstruction
    {
        KeepDenorms = 0,
        FlushDenorms = 1,
    }

    /// <summary>
    /// Configuration of the L1 cache.
    /// </summary>
    enum L1Configuration
    {
        DirectlyAddressableMemorySize16kb = 0,
        DirectlyAddressableMemorySize32kb = 1,
        DirectlyAddressableMemorySize48kb = 2,
    }

    /// <summary>
    /// Reduction operation.
    /// </summary>
    enum ReductionOp
    {
        RedAdd = 0,
        RedMin = 1,
        RedMax = 2,
        RedInc = 3,
        RedDec = 4,
        RedAnd = 5,
        RedOr = 6,
        RedXor = 7,
    }

    /// <summary>
    /// Reduction format.
    /// </summary>
    enum ReductionFormat
    {
        Unsigned32 = 0,
        Signed32 = 1,
    }

    /// <summary>
    /// Size of a structure in words.
    /// </summary>
    enum StructureSize
    {
        FourWords = 0,
        OneWord = 1,
    }

    /// <summary>
    /// Compute Queue Meta Data.
    /// </summary>
    /// <remarks>
    /// The structure is 64 32-bit words (2048 bits) of raw storage. Every member is a
    /// read-only decoder for a single bit or a bit range of that storage, addressed by
    /// absolute bit position (bit 0 is the least significant bit of word 0).
    /// </remarks>
    unsafe struct ComputeQmd
    {
        /// <summary>Number of 32-bit words in the structure.</summary>
        private const int WordCount = 64;

        /// <summary>Number of bits held by each storage word.</summary>
        private const int BitsPerWord = 32;

        /// <summary>Total number of addressable bits.</summary>
        private const int TotalBits = WordCount * BitsPerWord;

        /// <summary>Distance, in bits, between two consecutive constant buffer entries.</summary>
        private const int ConstantBufferStride = 64;

        private fixed int _words[WordCount];

        // Bits 0-127.
        public readonly int OuterPut => BitRange(30, 0);
        public readonly bool OuterOverflow => Bit(31);
        public readonly int OuterGet => BitRange(62, 32);
        public readonly bool OuterStickyOverflow => Bit(63);
        public readonly int InnerGet => BitRange(94, 64);
        public readonly bool InnerOverflow => Bit(95);
        public readonly int InnerPut => BitRange(126, 96);
        public readonly bool InnerStickyOverflow => Bit(127);

        // Bits 128-255.
        public readonly int QmdReservedAA => BitRange(159, 128);
        public readonly int DependentQmdPointer => BitRange(191, 160);
        public readonly int QmdGroupId => BitRange(197, 192);
        public readonly bool SmGlobalCachingEnable => Bit(198);
        public readonly bool RunCtaInOneSmPartition => Bit(199);
        public readonly bool IsQueue => Bit(200);
        public readonly bool AddToHeadOfQmdGroupLinkedList => Bit(201);
        public readonly bool SemaphoreReleaseEnable0 => Bit(202);
        public readonly bool SemaphoreReleaseEnable1 => Bit(203);
        public readonly bool RequireSchedulingPcas => Bit(204);
        public readonly bool DependentQmdScheduleEnable => Bit(205);
        public readonly DependentQmdType DependentQmdType => (DependentQmdType)BitRange(206, 206);
        public readonly bool DependentQmdFieldCopy => Bit(207);
        public readonly int QmdReservedB => BitRange(223, 208);
        public readonly int CircularQueueSize => BitRange(248, 224);
        public readonly bool QmdReservedC => Bit(249);
        public readonly bool InvalidateTextureHeaderCache => Bit(250);
        public readonly bool InvalidateTextureSamplerCache => Bit(251);
        public readonly bool InvalidateTextureDataCache => Bit(252);
        public readonly bool InvalidateShaderDataCache => Bit(253);
        public readonly bool InvalidateInstructionCache => Bit(254);
        public readonly bool InvalidateShaderConstantCache => Bit(255);

        // Bits 256-383.
        public readonly int ProgramOffset => BitRange(287, 256);
        public readonly int CircularQueueAddrLower => BitRange(319, 288);
        public readonly int CircularQueueAddrUpper => BitRange(327, 320);
        public readonly int QmdReservedD => BitRange(335, 328);
        public readonly int CircularQueueEntrySize => BitRange(351, 336);
        public readonly int CwdReferenceCountId => BitRange(357, 352);
        public readonly int CwdReferenceCountDeltaMinusOne => BitRange(365, 358);
        public readonly ReleaseMembarType ReleaseMembarType => (ReleaseMembarType)BitRange(366, 366);
        public readonly bool CwdReferenceCountIncrEnable => Bit(367);
        public readonly CwdMembarType CwdMembarType => (CwdMembarType)BitRange(369, 368);
        public readonly bool SequentiallyRunCtas => Bit(370);
        public readonly bool CwdReferenceCountDecrEnable => Bit(371);
        public readonly bool Throttled => Bit(372);
        public readonly Fp32NanBehavior Fp32NanBehavior => (Fp32NanBehavior)BitRange(376, 376);
        public readonly Fp32F2iNanBehavior Fp32F2iNanBehavior => (Fp32F2iNanBehavior)BitRange(377, 377);
        public readonly ApiVisibleCallLimit ApiVisibleCallLimit => (ApiVisibleCallLimit)BitRange(378, 378);
        public readonly SharedMemoryBankMapping SharedMemoryBankMapping => (SharedMemoryBankMapping)BitRange(379, 379);
        public readonly SamplerIndex SamplerIndex => (SamplerIndex)BitRange(382, 382);
        public readonly Fp32NarrowInstruction Fp32NarrowInstruction => (Fp32NarrowInstruction)BitRange(383, 383);

        // Bits 384-639.
        public readonly int CtaRasterWidth => BitRange(415, 384);
        public readonly int CtaRasterHeight => BitRange(431, 416);
        public readonly int CtaRasterDepth => BitRange(447, 432);
        public readonly int CtaRasterWidthResume => BitRange(479, 448);
        public readonly int CtaRasterHeightResume => BitRange(495, 480);
        public readonly int CtaRasterDepthResume => BitRange(511, 496);
        public readonly int QueueEntriesPerCtaMinusOne => BitRange(518, 512);
        public readonly int CoalesceWaitingPeriod => BitRange(529, 522);
        public readonly int SharedMemorySize => BitRange(561, 544);
        public readonly int QmdReservedG => BitRange(575, 562);
        public readonly int QmdVersion => BitRange(579, 576);
        public readonly int QmdMajorVersion => BitRange(583, 580);
        public readonly int QmdReservedH => BitRange(591, 584);
        public readonly int CtaThreadDimension0 => BitRange(607, 592);
        public readonly int CtaThreadDimension1 => BitRange(623, 608);
        public readonly int CtaThreadDimension2 => BitRange(639, 624);

        // Bits 640-735.
        // One flag per constant buffer, packed one bit apart starting at bit 640.
        // NOTE(review): the next declared field starts at bit 648, so i is presumably
        // 0-7; only the overall 2048-bit bound is enforced here - confirm against callers.
        public readonly bool ConstantBufferValid(int i) => Bit(640 + i);
        public readonly int QmdReservedI => BitRange(668, 648);
        public readonly L1Configuration L1Configuration => (L1Configuration)BitRange(671, 669);
        public readonly int SmDisableMaskLower => BitRange(703, 672);
        public readonly int SmDisableMaskUpper => BitRange(735, 704);

        // Bits 736-831: release 0.
        public readonly int Release0AddressLower => BitRange(767, 736);
        public readonly int Release0AddressUpper => BitRange(775, 768);
        public readonly int QmdReservedJ => BitRange(783, 776);
        public readonly ReductionOp Release0ReductionOp => (ReductionOp)BitRange(790, 788);
        public readonly bool QmdReservedK => Bit(791);
        public readonly ReductionFormat Release0ReductionFormat => (ReductionFormat)BitRange(793, 792);
        public readonly bool Release0ReductionEnable => Bit(794);
        public readonly StructureSize Release0StructureSize => (StructureSize)BitRange(799, 799);
        public readonly int Release0Payload => BitRange(831, 800);

        // Bits 832-927: release 1, laid out like release 0 but 96 bits further on.
        public readonly int Release1AddressLower => BitRange(863, 832);
        public readonly int Release1AddressUpper => BitRange(871, 864);
        public readonly int QmdReservedL => BitRange(879, 872);
        public readonly ReductionOp Release1ReductionOp => (ReductionOp)BitRange(886, 884);
        public readonly bool QmdReservedM => Bit(887);
        public readonly ReductionFormat Release1ReductionFormat => (ReductionFormat)BitRange(889, 888);
        public readonly bool Release1ReductionEnable => Bit(890);
        public readonly StructureSize Release1StructureSize => (StructureSize)BitRange(895, 895);
        public readonly int Release1Payload => BitRange(927, 896);

        // Bits 928 and up: per-constant-buffer entries, 64 bits each, selected by index i.
        // The index is not validated on its own; the only guard is the bounds check
        // performed by Bit/BitRange on the resulting bit position.
        public readonly int ConstantBufferAddrLower(int i) => BitRange(959 + i * ConstantBufferStride, 928 + i * ConstantBufferStride);
        public readonly int ConstantBufferAddrUpper(int i) => BitRange(967 + i * ConstantBufferStride, 960 + i * ConstantBufferStride);
        public readonly int ConstantBufferReservedAddr(int i) => BitRange(973 + i * ConstantBufferStride, 968 + i * ConstantBufferStride);
        public readonly bool ConstantBufferInvalidate(int i) => Bit(974 + i * ConstantBufferStride);
        public readonly int ConstantBufferSize(int i) => BitRange(991 + i * ConstantBufferStride, 975 + i * ConstantBufferStride);

        // Bits 1440-1535.
        public readonly int ShaderLocalMemoryLowSize => BitRange(1463, 1440);
        public readonly int QmdReservedN => BitRange(1466, 1464);
        public readonly int BarrierCount => BitRange(1471, 1467);
        public readonly int ShaderLocalMemoryHighSize => BitRange(1495, 1472);
        public readonly int RegisterCount => BitRange(1503, 1496);
        public readonly int ShaderLocalMemoryCrsSize => BitRange(1527, 1504);
        public readonly int SassVersion => BitRange(1535, 1528);

        // Bits 1536-1663.
        public readonly int HwOnlyInnerGet => BitRange(1566, 1536);
        public readonly bool HwOnlyRequireSchedulingPcas => Bit(1567);
        public readonly int HwOnlyInnerPut => BitRange(1598, 1568);
        public readonly bool HwOnlyScgType => Bit(1599);
        public readonly int HwOnlySpanListHeadIndex => BitRange(1629, 1600);
        public readonly bool QmdReservedQ => Bit(1630);
        public readonly bool HwOnlySpanListHeadIndexValid => Bit(1631);
        public readonly int HwOnlySkedNextQmdPointer => BitRange(1663, 1632);

        // Bits 1664-2047: one full word per field.
        public readonly int QmdSpareE => BitRange(1695, 1664);
        public readonly int QmdSpareF => BitRange(1727, 1696);
        public readonly int QmdSpareG => BitRange(1759, 1728);
        public readonly int QmdSpareH => BitRange(1791, 1760);
        public readonly int QmdSpareI => BitRange(1823, 1792);
        public readonly int QmdSpareJ => BitRange(1855, 1824);
        public readonly int QmdSpareK => BitRange(1887, 1856);
        public readonly int QmdSpareL => BitRange(1919, 1888);
        public readonly int QmdSpareM => BitRange(1951, 1920);
        public readonly int QmdSpareN => BitRange(1983, 1952);
        public readonly int DebugIdUpper => BitRange(2015, 1984);
        public readonly int DebugIdLower => BitRange(2047, 2016);

        /// <summary>
        /// Reads a single bit of the structure.
        /// </summary>
        /// <param name="bit">Absolute bit position, from 0 to 2047</param>
        /// <returns>True if the bit is set, false otherwise</returns>
        /// <exception cref="ArgumentOutOfRangeException"><paramref name="bit"/> is negative or not below 2048</exception>
        [MethodImpl(MethodImplOptions.AggressiveInlining)]
        private readonly bool Bit(int bit)
        {
            // The unsigned comparison rejects negative positions as well as too large ones.
            if ((uint)bit >= TotalBits)
            {
                throw new ArgumentOutOfRangeException(nameof(bit));
            }

            int wordIndex = bit >> 5;
            int bitInWord = bit & 31;

            // Bring the requested bit down to position 0 and test it there.
            return ((_words[wordIndex] >> bitInWord) & 1) != 0;
        }

        /// <summary>
        /// Reads a contiguous range of bits of the structure.
        /// </summary>
        /// <remarks>
        /// Only the word that contains <paramref name="lower"/> is read, so the whole range
        /// is expected to sit inside one 32-bit word. Only <paramref name="lower"/> is
        /// range checked; <paramref name="upper"/> is used solely to size the mask.
        /// </remarks>
        /// <param name="upper">Absolute position of the most significant bit of the range (inclusive)</param>
        /// <param name="lower">Absolute position of the least significant bit of the range (inclusive)</param>
        /// <returns>The value of the range, moved down so that <paramref name="lower"/> is bit 0</returns>
        /// <exception cref="ArgumentOutOfRangeException"><paramref name="lower"/> is negative or not below 2048</exception>
        [MethodImpl(MethodImplOptions.AggressiveInlining)]
        private readonly int BitRange(int upper, int lower)
        {
            // The unsigned comparison rejects negative positions as well as too large ones.
            if ((uint)lower >= TotalBits)
            {
                throw new ArgumentOutOfRangeException(nameof(lower));
            }

            int width = upper - lower + 1;

            // Built from an unsigned all-ones value so that a full 32-bit range keeps every bit.
            int mask = (int)(uint.MaxValue >> (32 - width));

            // The shift on a signed word may drag copies of the sign bit in from the top;
            // the mask removes anything above the requested width.
            int shifted = _words[lower >> 5] >> (lower & 31);

            return shifted & mask;
        }
    }
}