mlir.dialects._rocdl_ops_gen ============================ .. py:module:: mlir.dialects._rocdl_ops_gen Attributes ---------- .. autoapisummary:: mlir.dialects._rocdl_ops_gen._ods_ir Classes ------- .. autoapisummary:: mlir.dialects._rocdl_ops_gen._Dialect mlir.dialects._rocdl_ops_gen.BallotOp mlir.dialects._rocdl_ops_gen.BarrierInitOp mlir.dialects._rocdl_ops_gen.BarrierJoinOp mlir.dialects._rocdl_ops_gen.BarrierLeaveOp mlir.dialects._rocdl_ops_gen.BarrierOp mlir.dialects._rocdl_ops_gen.BarrierSignalIsfirstOp mlir.dialects._rocdl_ops_gen.BarrierSignalOp mlir.dialects._rocdl_ops_gen.BarrierSignalVarOp mlir.dialects._rocdl_ops_gen.BarrierWaitOp mlir.dialects._rocdl_ops_gen.BlockDimXOp mlir.dialects._rocdl_ops_gen.BlockDimYOp mlir.dialects._rocdl_ops_gen.BlockDimZOp mlir.dialects._rocdl_ops_gen.BlockIdXOp mlir.dialects._rocdl_ops_gen.BlockIdYOp mlir.dialects._rocdl_ops_gen.BlockIdZOp mlir.dialects._rocdl_ops_gen.CvtF32Bf8Op mlir.dialects._rocdl_ops_gen.CvtF32Fp8Op mlir.dialects._rocdl_ops_gen.CvtPkBf8F32Op mlir.dialects._rocdl_ops_gen.CvtPkF32Bf8Op mlir.dialects._rocdl_ops_gen.CvtPkF32Fp8Op mlir.dialects._rocdl_ops_gen.CvtPkFp8F32Op mlir.dialects._rocdl_ops_gen.CvtPkRtz mlir.dialects._rocdl_ops_gen.CvtPkScalePk8Bf16Bf8Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk8Bf16Fp4Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk8Bf16Fp8Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk8F16Bf8Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk8F16Fp4Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk8F16Fp8Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk8F32Bf8Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk8F32Fp4Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk8F32Fp8Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk16Bf16Bf6Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk16Bf16Fp6Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk16F16Bf6Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk16F16Fp6Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk16F32Bf6Op mlir.dialects._rocdl_ops_gen.CvtPkScalePk16F32Fp6Op 
mlir.dialects._rocdl_ops_gen.CvtScaleF32F16Bf8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32F16Fp8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32F32Bf8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32F32Fp8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Bf8Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Bf8F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Bf8F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Fp4Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Fp4F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Fp4F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Fp8Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Fp8F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk8Fp8F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk16Bf6Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk16Bf6F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk16Bf6F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk16Fp6Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk16Fp6F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk16Fp6F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32Bf6Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32Bf6F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32Bf16Bf6Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32Bf16Fp6Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32F16Bf6Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32F16Fp6Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32F32Bf6Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32F32Fp6Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32Fp6Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32Pk32Fp6F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkBf8Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkBf8F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkBf8F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkBf16Bf8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkBf16Fp4Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkBf16Fp8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkF16Bf8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkF16Fp4Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkF16Fp8Op 
mlir.dialects._rocdl_ops_gen.CvtScaleF32PkF32Bf8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkF32Fp4Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkF32Fp8Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkFp4Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkFp4F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkFp4F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkFp8Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkFp8F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32PkFp8F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrBf8BF16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrBf8F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrBf8F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrFp8BF16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrFp8F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrFp8F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Bf8Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Bf8F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Bf8F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Fp4Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Fp4F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Fp4F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Fp8Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Fp8F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk8Fp8F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk16Bf6Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk16Bf6F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk16Bf6F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk16Fp6Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk16Fp6F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk16Fp6F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk32Bf6Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk32Bf6F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk32Bf6F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk32Fp6Bf16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk32Fp6F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPk32Fp6F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPkFp4Bf16Op 
mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPkFp4F16Op mlir.dialects._rocdl_ops_gen.CvtScaleF32SrPkFp4F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF322xPk16Bf6F32Op mlir.dialects._rocdl_ops_gen.CvtScaleF322xPk16Fp6F32Op mlir.dialects._rocdl_ops_gen.CvtSrBf8F32Op mlir.dialects._rocdl_ops_gen.CvtSrFp8F32Op mlir.dialects._rocdl_ops_gen.DPPUpdateOp mlir.dialects._rocdl_ops_gen.DsBpermuteOp mlir.dialects._rocdl_ops_gen.DsLoadTr4_B64 mlir.dialects._rocdl_ops_gen.DsLoadTr6_B96 mlir.dialects._rocdl_ops_gen.DsLoadTr8_B64 mlir.dialects._rocdl_ops_gen.DsLoadTr16_B128 mlir.dialects._rocdl_ops_gen.DsSwizzleOp mlir.dialects._rocdl_ops_gen.FMed3Op mlir.dialects._rocdl_ops_gen.GetBarrierStateOp mlir.dialects._rocdl_ops_gen.GlobalLoadAsyncToLDSB8Op mlir.dialects._rocdl_ops_gen.GlobalLoadAsyncToLDSB32Op mlir.dialects._rocdl_ops_gen.GlobalLoadAsyncToLDSB64Op mlir.dialects._rocdl_ops_gen.GlobalLoadAsyncToLDSB128Op mlir.dialects._rocdl_ops_gen.GlobalLoadLDSOp mlir.dialects._rocdl_ops_gen.GlobalLoadTr4_B64 mlir.dialects._rocdl_ops_gen.GlobalLoadTr6_B96 mlir.dialects._rocdl_ops_gen.GlobalLoadTr8_B64 mlir.dialects._rocdl_ops_gen.GlobalLoadTr8_B128 mlir.dialects._rocdl_ops_gen.GridDimXOp mlir.dialects._rocdl_ops_gen.GridDimYOp mlir.dialects._rocdl_ops_gen.GridDimZOp mlir.dialects._rocdl_ops_gen.IglpOpt mlir.dialects._rocdl_ops_gen.LoadToLDSOp mlir.dialects._rocdl_ops_gen.MakeBufferRsrcOp mlir.dialects._rocdl_ops_gen.MbcntHiOp mlir.dialects._rocdl_ops_gen.MbcntLoOp mlir.dialects._rocdl_ops_gen.Permlane16SwapOp mlir.dialects._rocdl_ops_gen.Permlane32SwapOp mlir.dialects._rocdl_ops_gen.PermlaneX16Op mlir.dialects._rocdl_ops_gen.RawBufferAtomicCmpSwap mlir.dialects._rocdl_ops_gen.RawBufferAtomicFAddOp mlir.dialects._rocdl_ops_gen.RawBufferAtomicFMaxOp mlir.dialects._rocdl_ops_gen.RawBufferAtomicSMaxOp mlir.dialects._rocdl_ops_gen.RawBufferAtomicUMinOp mlir.dialects._rocdl_ops_gen.RawBufferLoadOp mlir.dialects._rocdl_ops_gen.RawBufferStoreOp mlir.dialects._rocdl_ops_gen.RawPtrBufferAtomicCmpSwap 
mlir.dialects._rocdl_ops_gen.RawPtrBufferAtomicFaddOp mlir.dialects._rocdl_ops_gen.RawPtrBufferAtomicFmaxOp mlir.dialects._rocdl_ops_gen.RawPtrBufferAtomicSmaxOp mlir.dialects._rocdl_ops_gen.RawPtrBufferAtomicUminOp mlir.dialects._rocdl_ops_gen.RawPtrBufferLoadLdsOp mlir.dialects._rocdl_ops_gen.RawPtrBufferLoadOp mlir.dialects._rocdl_ops_gen.RawPtrBufferStoreOp mlir.dialects._rocdl_ops_gen.ReadfirstlaneOp mlir.dialects._rocdl_ops_gen.ReadlaneOp mlir.dialects._rocdl_ops_gen.SBarrierOp mlir.dialects._rocdl_ops_gen.SSleepOp mlir.dialects._rocdl_ops_gen.SWaitcntOp mlir.dialects._rocdl_ops_gen.SchedBarrier mlir.dialects._rocdl_ops_gen.SchedGroupBarrier mlir.dialects._rocdl_ops_gen.SetPrioOp mlir.dialects._rocdl_ops_gen.TensorLoadToLDSD2Op mlir.dialects._rocdl_ops_gen.TensorLoadToLDSOp mlir.dialects._rocdl_ops_gen.TensorStoreFromLDSD2Op mlir.dialects._rocdl_ops_gen.TensorStoreFromLDSOp mlir.dialects._rocdl_ops_gen.ThreadIdXOp mlir.dialects._rocdl_ops_gen.ThreadIdYOp mlir.dialects._rocdl_ops_gen.ThreadIdZOp mlir.dialects._rocdl_ops_gen.WaitAsynccntOp mlir.dialects._rocdl_ops_gen.WaitDscntOp mlir.dialects._rocdl_ops_gen.WaitExpcntOp mlir.dialects._rocdl_ops_gen.WaitLoadcntOp mlir.dialects._rocdl_ops_gen.WaitStorecntOp mlir.dialects._rocdl_ops_gen.WaitTensorcntOp mlir.dialects._rocdl_ops_gen.WavefrontSizeOp mlir.dialects._rocdl_ops_gen.ds_read_tr4_b64 mlir.dialects._rocdl_ops_gen.ds_read_tr6_b96 mlir.dialects._rocdl_ops_gen.ds_read_tr8_b64 mlir.dialects._rocdl_ops_gen.ds_read_tr16_b64 mlir.dialects._rocdl_ops_gen.mfma_f32_4x4x1f32 mlir.dialects._rocdl_ops_gen.mfma_f32_4x4x2bf16 mlir.dialects._rocdl_ops_gen.mfma_f32_4x4x4bf16_1k mlir.dialects._rocdl_ops_gen.mfma_f32_4x4x4f16 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x1f32 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x2bf16 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x4bf16_1k mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x4f16 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x4f32 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x8_xf32 
mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x8bf16 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x16bf16_1k mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x16f16 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_bf8_bf8 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_bf8_fp8 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_bf16 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_f16 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_fp8_bf8 mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_fp8_fp8 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x1f32 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x2bf16 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x2f32 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x4_xf32 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x4bf16 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x4bf16_1k mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x4f16 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x8bf16_1k mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x8f16 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_bf8_bf8 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_bf8_fp8 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_bf16 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_f16 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_fp8_bf8 mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_fp8_fp8 mlir.dialects._rocdl_ops_gen.mfma_f64_4x4x4f64 mlir.dialects._rocdl_ops_gen.mfma_f64_16x16x4f64 mlir.dialects._rocdl_ops_gen.mfma_i32_4x4x4i8 mlir.dialects._rocdl_ops_gen.mfma_i32_16x16x4i8 mlir.dialects._rocdl_ops_gen.mfma_i32_16x16x16i8 mlir.dialects._rocdl_ops_gen.mfma_i32_16x16x32_i8 mlir.dialects._rocdl_ops_gen.mfma_i32_16x16x64_i8 mlir.dialects._rocdl_ops_gen.mfma_i32_32x32x4i8 mlir.dialects._rocdl_ops_gen.mfma_i32_32x32x8i8 mlir.dialects._rocdl_ops_gen.mfma_i32_32x32x16_i8 mlir.dialects._rocdl_ops_gen.mfma_i32_32x32x32_i8 mlir.dialects._rocdl_ops_gen.mfma_scale_f32_16x16x128_f8f6f4 mlir.dialects._rocdl_ops_gen.mfma_scale_f32_32x32x64_f8f6f4 mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x32_bf16 
mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x32_f16 mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x64_bf8_bf8 mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x64_bf8_fp8 mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x64_fp8_bf8 mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x64_fp8_fp8 mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x16_bf16 mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x16_f16 mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x32_bf8_bf8 mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x32_bf8_fp8 mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x32_fp8_bf8 mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x32_fp8_fp8 mlir.dialects._rocdl_ops_gen.smfmac_i32_16x16x64_i8 mlir.dialects._rocdl_ops_gen.smfmac_i32_32x32x32_i8 mlir.dialects._rocdl_ops_gen.wmma_bf16_16x16x16_bf16 mlir.dialects._rocdl_ops_gen.wmma_bf16_16x16x32_bf16 mlir.dialects._rocdl_ops_gen.wmma_bf16f32_16x16x32_bf16 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x16_f16 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x32_f16 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x64_bf8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x64_bf8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x64_fp8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x64_fp8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x128_bf8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x128_bf8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x128_fp8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x128_fp8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x4_f32 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_bf8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_bf8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_bf16 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_f16 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_fp8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_fp8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x32_bf16 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x32_f16 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x64_bf8_bf8 
mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x64_bf8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x64_fp8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x64_fp8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x128_bf8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x128_bf8_fp8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x128_fp8_bf8 mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x128_fp8_fp8 mlir.dialects._rocdl_ops_gen.wmma_i32_16x16x16_iu4 mlir.dialects._rocdl_ops_gen.wmma_i32_16x16x16_iu8 mlir.dialects._rocdl_ops_gen.wmma_i32_16x16x32_iu4 mlir.dialects._rocdl_ops_gen.wmma_i32_16x16x64_iu8 Functions --------- .. autoapisummary:: mlir.dialects._rocdl_ops_gen.ballot mlir.dialects._rocdl_ops_gen.s_barrier_init mlir.dialects._rocdl_ops_gen.s_barrier_join mlir.dialects._rocdl_ops_gen.s_barrier_leave mlir.dialects._rocdl_ops_gen.barrier mlir.dialects._rocdl_ops_gen.s_barrier_signal_isfirst mlir.dialects._rocdl_ops_gen.s_barrier_signal mlir.dialects._rocdl_ops_gen.s_barrier_signal_var mlir.dialects._rocdl_ops_gen.s_barrier_wait mlir.dialects._rocdl_ops_gen.workgroup_dim_x mlir.dialects._rocdl_ops_gen.workgroup_dim_y mlir.dialects._rocdl_ops_gen.workgroup_dim_z mlir.dialects._rocdl_ops_gen.workgroup_id_x mlir.dialects._rocdl_ops_gen.workgroup_id_y mlir.dialects._rocdl_ops_gen.workgroup_id_z mlir.dialects._rocdl_ops_gen.cvt_f32_bf8 mlir.dialects._rocdl_ops_gen.cvt_f32_fp8 mlir.dialects._rocdl_ops_gen.cvt_pk_bf8_f32 mlir.dialects._rocdl_ops_gen.cvt_pk_f32_bf8 mlir.dialects._rocdl_ops_gen.cvt_pk_f32_fp8 mlir.dialects._rocdl_ops_gen.cvt_pk_fp8_f32 mlir.dialects._rocdl_ops_gen.cvt_pkrtz mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_bf16_bf8 mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_bf16_fp4 mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_bf16_fp8 mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_f16_bf8 mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_f16_fp4 mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_f16_fp8 mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_f32_bf8 
mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_f32_fp4 mlir.dialects._rocdl_ops_gen.cvt_scale_pk8_f32_fp8 mlir.dialects._rocdl_ops_gen.cvt_scale_pk16_bf16_bf6 mlir.dialects._rocdl_ops_gen.cvt_scale_pk16_bf16_fp6 mlir.dialects._rocdl_ops_gen.cvt_scale_pk16_f16_bf6 mlir.dialects._rocdl_ops_gen.cvt_scale_pk16_f16_fp6 mlir.dialects._rocdl_ops_gen.cvt_scale_pk16_f32_bf6 mlir.dialects._rocdl_ops_gen.cvt_scale_pk16_f32_fp6 mlir.dialects._rocdl_ops_gen.cvt_scalef32_f16_bf8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_f16_fp8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_f32_bf8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_f32_fp8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_bf8_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_bf8_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_bf8_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_fp4_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_fp4_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_fp4_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_fp8_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_fp8_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk8_fp8_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk16_bf6_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk16_bf6_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk16_bf6_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk16_fp6_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk16_fp6_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk16_fp6_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_bf6_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_bf6_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_bf16_bf6 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_bf16_fp6 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_f16_bf6 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_f16_fp6 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_f32_bf6 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_f32_fp6 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_fp6_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk32_fp6_f16 
mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_bf8_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_bf8_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_bf8_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_bf16_bf8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_bf16_fp4 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_bf16_fp8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_f16_bf8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_f16_fp4 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_f16_fp8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_f32_bf8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_f32_fp4 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_f32_fp8 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_fp4_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_fp4_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_fp4_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_fp8_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_fp8_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_pk_fp8_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_bf8_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_bf8_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_bf8_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_fp8_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_fp8_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_fp8_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_bf8_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_bf8_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_bf8_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_fp4_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_fp4_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_fp4_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_fp8_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_fp8_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk8_fp8_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk16_bf6_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk16_bf6_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk16_bf6_f32 
mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk16_fp6_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk16_fp6_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk16_fp6_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk32_bf6_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk32_bf6_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk32_bf6_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk32_fp6_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk32_fp6_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk32_fp6_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk_fp4_bf16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk_fp4_f16 mlir.dialects._rocdl_ops_gen.cvt_scalef32_sr_pk_fp4_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_2xpk16_bf6_f32 mlir.dialects._rocdl_ops_gen.cvt_scalef32_2xpk16_fp6_f32 mlir.dialects._rocdl_ops_gen.cvt_sr_bf8_f32 mlir.dialects._rocdl_ops_gen.cvt_sr_fp8_f32 mlir.dialects._rocdl_ops_gen.update_dpp mlir.dialects._rocdl_ops_gen.ds_bpermute mlir.dialects._rocdl_ops_gen.ds_load_tr4_b64 mlir.dialects._rocdl_ops_gen.ds_load_tr6_b96 mlir.dialects._rocdl_ops_gen.ds_load_tr8_b64 mlir.dialects._rocdl_ops_gen.ds_load_tr16_b128 mlir.dialects._rocdl_ops_gen.ds_swizzle mlir.dialects._rocdl_ops_gen.fmed3 mlir.dialects._rocdl_ops_gen.s_get_barrier_state mlir.dialects._rocdl_ops_gen.global_load_async_to_lds_b8 mlir.dialects._rocdl_ops_gen.global_load_async_to_lds_b32 mlir.dialects._rocdl_ops_gen.global_load_async_to_lds_b64 mlir.dialects._rocdl_ops_gen.global_load_async_to_lds_b128 mlir.dialects._rocdl_ops_gen.global_load_lds mlir.dialects._rocdl_ops_gen.global_load_tr4_b64 mlir.dialects._rocdl_ops_gen.global_load_tr6_b96 mlir.dialects._rocdl_ops_gen.global_load_tr_b64 mlir.dialects._rocdl_ops_gen.global_load_tr_b128 mlir.dialects._rocdl_ops_gen.grid_dim_x mlir.dialects._rocdl_ops_gen.grid_dim_y mlir.dialects._rocdl_ops_gen.grid_dim_z mlir.dialects._rocdl_ops_gen.iglp_opt mlir.dialects._rocdl_ops_gen.load_to_lds mlir.dialects._rocdl_ops_gen.make_buffer_rsrc 
mlir.dialects._rocdl_ops_gen.mbcnt_hi mlir.dialects._rocdl_ops_gen.mbcnt_lo mlir.dialects._rocdl_ops_gen.permlane16_swap mlir.dialects._rocdl_ops_gen.permlane32_swap mlir.dialects._rocdl_ops_gen.permlanex16 mlir.dialects._rocdl_ops_gen.raw_buffer_atomic_cmpswap mlir.dialects._rocdl_ops_gen.raw_buffer_atomic_fadd mlir.dialects._rocdl_ops_gen.raw_buffer_atomic_fmax mlir.dialects._rocdl_ops_gen.raw_buffer_atomic_smax mlir.dialects._rocdl_ops_gen.raw_buffer_atomic_umin mlir.dialects._rocdl_ops_gen.raw_buffer_load mlir.dialects._rocdl_ops_gen.raw_buffer_store mlir.dialects._rocdl_ops_gen.raw_ptr_buffer_atomic_cmpswap mlir.dialects._rocdl_ops_gen.raw_ptr_buffer_atomic_fadd mlir.dialects._rocdl_ops_gen.raw_ptr_buffer_atomic_fmax mlir.dialects._rocdl_ops_gen.raw_ptr_buffer_atomic_smax mlir.dialects._rocdl_ops_gen.raw_ptr_buffer_atomic_umin mlir.dialects._rocdl_ops_gen.raw_ptr_buffer_load_lds mlir.dialects._rocdl_ops_gen.raw_ptr_buffer_load mlir.dialects._rocdl_ops_gen.raw_ptr_buffer_store mlir.dialects._rocdl_ops_gen.readfirstlane mlir.dialects._rocdl_ops_gen.readlane mlir.dialects._rocdl_ops_gen.s_barrier mlir.dialects._rocdl_ops_gen.s_sleep mlir.dialects._rocdl_ops_gen.s_waitcnt mlir.dialects._rocdl_ops_gen.sched_barrier mlir.dialects._rocdl_ops_gen.sched_group_barrier mlir.dialects._rocdl_ops_gen.s_setprio mlir.dialects._rocdl_ops_gen.tensor_load_to_lds_d2 mlir.dialects._rocdl_ops_gen.tensor_load_to_lds mlir.dialects._rocdl_ops_gen.tensor_store_from_lds_d2 mlir.dialects._rocdl_ops_gen.tensor_store_from_lds mlir.dialects._rocdl_ops_gen.workitem_id_x mlir.dialects._rocdl_ops_gen.workitem_id_y mlir.dialects._rocdl_ops_gen.workitem_id_z mlir.dialects._rocdl_ops_gen.s_wait_asynccnt mlir.dialects._rocdl_ops_gen.s_wait_dscnt mlir.dialects._rocdl_ops_gen.s_wait_expcnt mlir.dialects._rocdl_ops_gen.s_wait_loadcnt mlir.dialects._rocdl_ops_gen.s_wait_storecnt mlir.dialects._rocdl_ops_gen.s_wait_tensorcnt mlir.dialects._rocdl_ops_gen.wavefrontsize 
mlir.dialects._rocdl_ops_gen.ds_read_tr4_b64_ mlir.dialects._rocdl_ops_gen.ds_read_tr6_b96_ mlir.dialects._rocdl_ops_gen.ds_read_tr8_b64_ mlir.dialects._rocdl_ops_gen.ds_read_tr16_b64_ mlir.dialects._rocdl_ops_gen.mfma_f32_4x4x1f32_ mlir.dialects._rocdl_ops_gen.mfma_f32_4x4x2bf16_ mlir.dialects._rocdl_ops_gen.mfma_f32_4x4x4bf16_1k_ mlir.dialects._rocdl_ops_gen.mfma_f32_4x4x4f16_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x1f32_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x2bf16_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x4bf16_1k_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x4f16_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x4f32_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x8_xf32_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x8bf16_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x16bf16_1k_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x16f16_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_bf8_bf8_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_bf8_fp8_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_bf16_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_f16_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_fp8_bf8_ mlir.dialects._rocdl_ops_gen.mfma_f32_16x16x32_fp8_fp8_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x1f32_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x2bf16_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x2f32_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x4_xf32_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x4bf16_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x4bf16_1k_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x4f16_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x8bf16_1k_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x8f16_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_bf8_bf8_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_bf8_fp8_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_bf16_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_f16_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_fp8_bf8_ mlir.dialects._rocdl_ops_gen.mfma_f32_32x32x16_fp8_fp8_ 
mlir.dialects._rocdl_ops_gen.mfma_f64_4x4x4f64_ mlir.dialects._rocdl_ops_gen.mfma_f64_16x16x4f64_ mlir.dialects._rocdl_ops_gen.mfma_i32_4x4x4i8_ mlir.dialects._rocdl_ops_gen.mfma_i32_16x16x4i8_ mlir.dialects._rocdl_ops_gen.mfma_i32_16x16x16i8_ mlir.dialects._rocdl_ops_gen.mfma_i32_16x16x32_i8_ mlir.dialects._rocdl_ops_gen.mfma_i32_16x16x64_i8_ mlir.dialects._rocdl_ops_gen.mfma_i32_32x32x4i8_ mlir.dialects._rocdl_ops_gen.mfma_i32_32x32x8i8_ mlir.dialects._rocdl_ops_gen.mfma_i32_32x32x16_i8_ mlir.dialects._rocdl_ops_gen.mfma_i32_32x32x32_i8_ mlir.dialects._rocdl_ops_gen.mfma_scale_f32_16x16x128_f8f6f4_ mlir.dialects._rocdl_ops_gen.mfma_scale_f32_32x32x64_f8f6f4_ mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x32_bf16_ mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x32_f16_ mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x64_bf8_bf8_ mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x64_bf8_fp8_ mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x64_fp8_bf8_ mlir.dialects._rocdl_ops_gen.smfmac_f32_16x16x64_fp8_fp8_ mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x16_bf16_ mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x16_f16_ mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x32_bf8_bf8_ mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x32_bf8_fp8_ mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x32_fp8_bf8_ mlir.dialects._rocdl_ops_gen.smfmac_f32_32x32x32_fp8_fp8_ mlir.dialects._rocdl_ops_gen.smfmac_i32_16x16x64_i8_ mlir.dialects._rocdl_ops_gen.smfmac_i32_32x32x32_i8_ mlir.dialects._rocdl_ops_gen.wmma_bf16_16x16x16_bf16_ mlir.dialects._rocdl_ops_gen.wmma_bf16_16x16x32_bf16_ mlir.dialects._rocdl_ops_gen.wmma_bf16f32_16x16x32_bf16_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x16_f16_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x32_f16_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x64_bf8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x64_bf8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x64_fp8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x64_fp8_fp8_ 
mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x128_bf8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x128_bf8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x128_fp8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f16_16x16x128_fp8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x4_f32_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_bf8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_bf8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_bf16_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_f16_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_fp8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x16_fp8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x32_bf16_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x32_f16_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x64_bf8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x64_bf8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x64_fp8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x64_fp8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x128_bf8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x128_bf8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x128_fp8_bf8_ mlir.dialects._rocdl_ops_gen.wmma_f32_16x16x128_fp8_fp8_ mlir.dialects._rocdl_ops_gen.wmma_i32_16x16x16_iu4_ mlir.dialects._rocdl_ops_gen.wmma_i32_16x16x16_iu8_ mlir.dialects._rocdl_ops_gen.wmma_i32_16x16x32_iu4_ mlir.dialects._rocdl_ops_gen.wmma_i32_16x16x64_iu8_ Module Contents --------------- .. py:data:: _ods_ir .. py:class:: _Dialect(descriptor: object) Bases: :py:obj:`_ods_ir` .. py:attribute:: DIALECT_NAMESPACE :value: 'rocdl' .. py:class:: BallotOp(res, pred, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Ballot provides a bit mask containing the 1-bit predicate value from each lane. The nth bit of the result contains the 1 bit contributed by the nth warp lane. .. py:attribute:: OPERATION_NAME :value: 'rocdl.ballot' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: pred() -> _ods_ir .. py:method:: res() -> _ods_ir .. 
py:function:: ballot(res, pred, *, loc=None, ip=None) -> _ods_ir .. py:class:: BarrierInitOp(ptr, id, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.barrier.init' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: id() -> _ods_ir .. py:function:: s_barrier_init(ptr, id, *, loc=None, ip=None) -> BarrierInitOp .. py:class:: BarrierJoinOp(ptr, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.barrier.join' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:function:: s_barrier_join(ptr, *, loc=None, ip=None) -> BarrierJoinOp .. py:class:: BarrierLeaveOp(id, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.barrier.leave' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: id() -> _ods_ir .. py:function:: s_barrier_leave(id, *, loc=None, ip=None) -> BarrierLeaveOp .. py:class:: BarrierOp(*, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.barrier' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:function:: barrier(*, loc=None, ip=None) -> BarrierOp .. py:class:: BarrierSignalIsfirstOp(res, id, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.barrier.signal.isfirst' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: id() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: s_barrier_signal_isfirst(res, id, *, loc=None, ip=None) -> _ods_ir .. py:class:: BarrierSignalOp(id, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.barrier.signal' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: id() -> _ods_ir .. 
py:function:: s_barrier_signal(id, *, loc=None, ip=None) -> BarrierSignalOp .. py:class:: BarrierSignalVarOp(ptr, id, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.barrier.signal.var' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: id() -> _ods_ir .. py:function:: s_barrier_signal_var(ptr, id, *, loc=None, ip=None) -> BarrierSignalVarOp .. py:class:: BarrierWaitOp(id, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.barrier.wait' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: id() -> _ods_ir .. py:function:: s_barrier_wait(id, *, loc=None, ip=None) -> BarrierWaitOp .. py:class:: BlockDimXOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.workgroup.dim.x' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workgroup_dim_x(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: BlockDimYOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.workgroup.dim.y' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workgroup_dim_y(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: BlockDimZOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.workgroup.dim.z' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workgroup_dim_z(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: BlockIdXOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. 
py:attribute:: OPERATION_NAME :value: 'rocdl.workgroup.id.x' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workgroup_id_x(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: BlockIdYOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.workgroup.id.y' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workgroup_id_y(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: BlockIdZOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.workgroup.id.z' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workgroup_id_z(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: CvtF32Bf8Op(res, srcA, byteSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert the 8-bit bf8 value in the ``byteSel``-th byte of ``srcA`` to fp32. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.f32.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: srcA() -> _ods_ir .. py:method:: byteSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_f32_bf8(res, src_a, byte_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtF32Fp8Op(res, srcA, byteSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert the 8-bit fp8 value in the ``byteSel``-th byte of ``srcA`` to fp32. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.f32.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: srcA() -> _ods_ir .. py:method:: byteSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_f32_fp8(res, src_a, byte_sel, *, loc=None, ip=None) -> _ods_ir ..
py:class:: CvtPkBf8F32Op(res, srcA, srcB, old, wordSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert ``srcA`` and ``srcB`` to bf8 and store into the low/high word of ``old``, preserving the other word. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.pk.bf8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: srcA() -> _ods_ir .. py:method:: srcB() -> _ods_ir .. py:method:: old() -> _ods_ir .. py:method:: wordSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_pk_bf8_f32(res, src_a, src_b, old, word_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkF32Bf8Op(res, src, wordSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert ``src`` based on ``wordSel`` to packed fp32. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.pk.f32.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: wordSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_pk_f32_bf8(res, src, word_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkF32Fp8Op(res, src, wordSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert ``src`` based on ``wordSel`` to packed fp32. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.pk.f32.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: wordSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_pk_f32_fp8(res, src, word_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkFp8F32Op(res, srcA, srcB, old, wordSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert ``srcA`` and ``srcB`` to fp8 and store into the low/high word of ``old``, preserving the other word. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.pk.fp8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: srcA() -> _ods_ir .. py:method:: srcB() -> _ods_ir .. py:method:: old() -> _ods_ir .. py:method:: wordSel() -> _ods_ir .. py:method:: res() -> _ods_ir ..
py:function:: cvt_pk_fp8_f32(res, src_a, src_b, old, word_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkRtz(res, srcA, srcB, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two f32 values into a packed vector<2xf16>. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.pkrtz' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: srcA() -> _ods_ir .. py:method:: srcB() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_pkrtz(res, src_a, src_b, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk8Bf16Bf8Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.bf16.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_bf16_bf8(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk8Bf16Fp4Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.bf16.fp4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_bf16_fp4(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk8Bf16Fp8Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.bf16.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_bf16_fp8(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtPkScalePk8F16Bf8Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.f16.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_f16_bf8(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk8F16Fp4Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.f16.fp4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_f16_fp4(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk8F16Fp8Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.f16.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_f16_fp8(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk8F32Bf8Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.f32.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_f32_bf8(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtPkScalePk8F32Fp4Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.f32.fp4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_f32_fp4(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk8F32Fp8Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk8.f32.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk8_f32_fp8(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk16Bf16Bf6Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk16.bf16.bf6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk16_bf16_bf6(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk16Bf16Fp6Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk16.bf16.fp6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk16_bf16_fp6(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtPkScalePk16F16Bf6Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk16.f16.bf6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk16_f16_bf6(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk16F16Fp6Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk16.f16.fp6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk16_f16_fp6(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk16F32Bf6Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk16.f32.bf6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk16_f32_bf6(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtPkScalePk16F32Fp6Op(res, src, scale, scaleSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scale.pk16.f32.fp6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: scaleSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scale_pk16_f32_fp6(res, src, scale, scale_sel, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32F16Bf8Op(res, oldVdst, src, scale, srcSelIndex, dstLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert a bf8 byte from ``src``, selected by ``srcSelIndex``, to f16 while multiplying it by the exponent of ``scale``, and place it into the ``dstLoHiSel``-th element of ``oldVdst``, preserving the other element of that vector in the return value. The bytes are stored as an ``i32`` and not a ``<4 x i8>``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.f16.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcSelIndex() -> _ods_ir .. py:method:: dstLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_f16_bf8(res, old_vdst, src, scale, src_sel_index, dst_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32F16Fp8Op(res, oldVdst, src, scale, srcSelIndex, dstLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert a fp8 byte from ``src``, selected by ``srcSelIndex``, to f16 while multiplying it by the exponent of ``scale``, and place it into the ``dstLoHiSel``-th element of ``oldVdst``, preserving the other element of that vector in the return value. The bytes are stored as an ``i32`` and not a ``<4 x i8>``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.f16.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcSelIndex() -> _ods_ir .. py:method:: dstLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_f16_fp8(res, old_vdst, src, scale, src_sel_index, dst_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir ..
py:class:: CvtScaleF32F32Bf8Op(res, src, scale, srcSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert a bf8 byte from ``src``, selected by ``srcSelIndex``, to f32, multiplying it by the exponent of ``scale``. The bytes are stored in an ``i32``, not a ``<4 x i8>``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.f32.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_f32_bf8(res, src, scale, src_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32F32Fp8Op(res, src, scale, srcSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert a fp8 byte from ``src``, selected by ``srcSelIndex``, to f32, multiplying it by the exponent of ``scale``. The bytes are stored in an ``i32``, not a ``<4 x i8>``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.f32.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_f32_fp8(res, src, scale, src_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk8Bf8Bf16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed bf16 values to packed bf8, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.bf8.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_bf8_bf16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32Pk8Bf8F16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f16 values to packed bf8, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.bf8.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_bf8_f16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk8Bf8F32Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f32 values to packed bf8, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.bf8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_bf8_f32(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk8Fp4Bf16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed bf16 values to packed fp4, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.fp4.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_fp4_bf16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk8Fp4F16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f16 values to packed fp4, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.fp4.f16' .. 
py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_fp4_f16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk8Fp4F32Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f32 values to packed fp4, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.fp4.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_fp4_f32(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk8Fp8Bf16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed bf16 values to packed fp8, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.fp8.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_fp8_bf16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk8Fp8F16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f16 values to packed fp8, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.fp8.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_fp8_f16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32Pk8Fp8F32Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f32 values to packed fp8, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk8.fp8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk8_fp8_f32(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk16Bf6Bf16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed bf16 values to packed bf6, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk16.bf6.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk16_bf6_bf16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk16Bf6F16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed f16 values to packed bf6, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk16.bf6.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk16_bf6_f16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk16Bf6F32Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed f32 values to packed bf6, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk16.bf6.f32' ..
py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk16_bf6_f32(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk16Fp6Bf16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed bf16 values to packed fp6, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk16.fp6.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk16_fp6_bf16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk16Fp6F16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed f16 values to packed fp6, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk16.fp6.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk16_fp6_f16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk16Fp6F32Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed f32 values to packed fp6, multiplying by the exponent part of ``scale`` before doing so. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk16.fp6.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk16_fp6_f32(res, src, scale, *, loc=None, ip=None) -> _ods_ir ..
py:class:: CvtScaleF32Pk32Bf6Bf16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed bf16 values to packed bf6, dividing by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.bf6.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_bf6_bf16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32Bf6F16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed f16 values to packed bf6, dividing by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.bf6.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_bf6_f16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32Bf16Bf6Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed bf6 values to packed bf16, multiplying by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.bf16.bf6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_bf16_bf6(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32Bf16Fp6Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed fp6 values to packed bf16, multiplying by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.bf16.fp6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. 
py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_bf16_fp6(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32F16Bf6Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed bf6 values to packed f16, multiplying by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.f16.bf6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_f16_bf6(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32F16Fp6Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed fp6 values to packed f16, multiplying by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.f16.fp6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_f16_fp6(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32F32Bf6Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed bf6 values to packed f32, multiplying by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.f32.bf6' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_f32_bf6(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32F32Fp6Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed fp6 values to packed f32, multiplying by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.f32.fp6' .. 
py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_f32_fp6(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32Fp6Bf16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed bf16 values to packed fp6, dividing by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.fp6.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_fp6_bf16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32Pk32Fp6F16Op(res, src, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed f16 values to packed fp6, dividing by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk32.fp6.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk32_fp6_f16(res, src, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkBf8Bf16Op(res, oldVdst, src0, scale, dstLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two bf16 values in ``src0`` to two bf8 bytes, dividing by the exponent in ``scale``. The bytes are packed into a 16-bit value which is inserted into ``oldVdst`` at the ``dstLoHiSel`` position, with the entire updated vector being returned. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.bf8.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. 
py:function:: cvt_scalef32_pk_bf8_bf16(res, old_vdst, src0, scale, dst_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkBf8F16Op(res, oldVdst, src0, scale, dstLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two f16 values in ``src0`` to two bf8 bytes, dividing by the exponent in ``scale``. The bytes are packed into a 16-bit value which is inserted into ``oldVdst`` at the ``dstLoHiSel`` position, with the entire updated vector being returned. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.bf8.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_bf8_f16(res, old_vdst, src0, scale, dst_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkBf8F32Op(res, oldVdst, src0, src1, scale, dstLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two f32 values in ``src0`` and ``src1`` to two bf8 bytes, dividing by the exponent in ``scale``. The bytes are packed into a 16-bit value which is inserted into ``oldVdst`` at the ``dstLoHiSel`` position, with the entire updated vector being returned. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.bf8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: src1() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_bf8_f32(res, old_vdst, src0, src1, scale, dst_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkBf16Bf8Op(res, src, scale, srcLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed bf8 values in ``src`` to two bf16 values, multiplying by the exponent in ``scale``.
The two values to be converted are selected from the low or high half of ``src`` (a packed vector represented as an ``i32``) on the basis of ``srcLoHiSel``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.bf16.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_bf16_bf8(res, src, scale, src_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkBf16Fp4Op(res, src, scale, srcSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed fp4 (f4E2M1) values stored as one byte of a 32-bit integer to packed bf16, multiplying by the exponent part of ``scale`` before doing so. The byte to convert is chosen by ``srcSelIndex``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.bf16.fp4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_bf16_fp4(res, src, scale, src_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkBf16Fp8Op(res, src, scale, srcLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed fp8 values in ``src`` to two bf16 values, multiplying by the exponent in ``scale``. The two values to be converted are selected from the low or high half of ``src`` (a packed vector represented as an ``i32``) on the basis of ``srcLoHiSel``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.bf16.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_bf16_fp8(res, src, scale, src_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir ..
py:class:: CvtScaleF32PkF16Bf8Op(res, src, scale, srcLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed bf8 values in ``src0`` to two f16 values, multiplying by the exponent in ``scale``. The two values to be converted are selected from the low or high half of ``src`` (a packed vector represented as an ``i32``) on the basis of ``srcLoHiSel``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.f16.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_f16_bf8(res, src, scale, src_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkF16Fp4Op(res, src, scale, srcSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed fp4 (f4E2M1) values stored as one byte of a 32-bit integer to packed f16, multiplying by the exponent part of ``scale`` before doing so. The byte to convert is chosen by ``srcSelIndex``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.f16.fp4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_f16_fp4(res, src, scale, src_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkF16Fp8Op(res, src, scale, srcLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed fp8 values in ``src0`` to two f16 values, multiplying by the exponent in ``scale``. The two values to be converted are selected from the low or high half of ``src`` (a packed vector represented as an ``i32``) on the basis of ``srcLoHiSel``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.f16.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. 
py:method:: srcLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_f16_fp8(res, src, scale, src_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkF32Bf8Op(res, src, scale, srcLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed bf8 values in ``src0`` to two f32 values, multiplying by the exponent in ``scale``. The two values to be converted are selected from the low or high half of ``src`` (a packed vector represented as an ``i32``) on the basis of ``srcLoHiSel``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.f32.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_f32_bf8(res, src, scale, src_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkF32Fp4Op(res, src, scale, srcSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed fp4 (f4E2M1) values stored as one byte of a 32-bit integer to packed f32, multiplying by the exponent part of ``scale`` before doing so. The byte to convert is chosen by ``srcSelIndex``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.f32.fp4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_f32_fp4(res, src, scale, src_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkF32Fp8Op(res, src, scale, srcLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed fp8 values in ``src0`` to two f32 values, multiplying by the exponent in ``scale``. The two values to be converted are selected from the low or high half of ``src`` (a packed vector represented as an ``i32``) on the basis of ``srcLoHiSel``. .. 
py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.f32.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: srcLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_f32_fp8(res, src, scale, src_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkFp4Bf16Op(res, oldVdst, src, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed bf16 values to packed fp4, dividing by the exponent part of ``scale`` before doing so. The two scaled values are packed into a byte. That byte is used to update the ``dstSelIndex``-th byte of ``oldVdst``, which is returned in its entirety. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.fp4.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_fp4_bf16(res, old_vdst, src, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkFp4F16Op(res, oldVdst, src, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed f16 values to packed fp4, dividing by the exponent part of ``scale`` before doing so. The two scaled values are packed into a byte. That byte is used to update the ``dstSelIndex``-th byte of ``oldVdst``, which is returned in its entirety. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.fp4.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_fp4_f16(res, old_vdst, src, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32PkFp4F32Op(res, oldVdst, src0, src1, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two single-precision float values, passed in ``src0`` and ``src1``, into two fp4 values, dividing them by the exponent part of ``scale`` before doing so. The two scaled values are packed into a byte. That byte is used to update the ``dstSelIndex``-th byte of ``oldVdst``, which is returned in its entirety. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.fp4.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: src1() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_fp4_f32(res, old_vdst, src0, src1, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkFp8Bf16Op(res, oldVdst, src0, scale, dstLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two bf16 values in ``src0`` to two fp8 bytes, dividing by the exponent in ``scale``. The bytes are packed into a 16-bit value which is inserted into ``oldVdst`` at the ``dstLoHiSel`` position, with the entire updated vector being returned. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.fp8.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_fp8_bf16(res, old_vdst, src0, scale, dst_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkFp8F16Op(res, oldVdst, src0, scale, dstLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two f16 values in ``src0`` to two fp8 bytes, dividing by the exponent in ``scale``. 
The bytes are packed into a 16-bit value which is inserted into ``oldVdst`` at the ``dstLoHiSel`` position, with the entire updated vector being returned. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.fp8.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_fp8_f16(res, old_vdst, src0, scale, dst_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32PkFp8F32Op(res, oldVdst, src0, src1, scale, dstLoHiSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two f32 values in ``src0`` and ``src1`` to two fp8 bytes, dividing by the exponent in ``scale``. The bytes are packed into a 16-bit value which is inserted into ``oldVdst`` at the ``dstLoHiSel`` position, with the entire updated vector being returned. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.pk.fp8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: src1() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstLoHiSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_pk_fp8_f32(res, old_vdst, src0, src1, scale, dst_lo_hi_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrBf8BF16Op(res, oldVdst, src0, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert a bf16 value in ``src0`` to a bf8 byte, dividing by the exponent in ``scale`` and using ``seed`` for stochastic rounding. Place the resulting byte in the ``dstSelIndex``-th byte of ``oldVdst`` and return the entire packed vector, which is stored as an ``i32``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.bf8.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. 
py:method:: src0() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_bf8_bf16(res, old_vdst, src0, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrBf8F16Op(res, oldVdst, src0, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert an f16 value in ``src0`` to a bf8 byte, dividing by the exponent in ``scale`` and using ``seed`` for stochastic rounding. Place the resulting byte in the ``dstSelIndex``-th byte of ``oldVdst`` and return the entire packed vector, which is stored as an ``i32``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.bf8.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_bf8_f16(res, old_vdst, src0, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrBf8F32Op(res, oldVdst, src0, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert an f32 value in ``src0`` to a bf8 byte, dividing by the exponent in ``scale`` and using ``seed`` for stochastic rounding. Place the resulting byte in the ``dstSelIndex``-th byte of ``oldVdst`` and return the entire packed vector, which is stored as an ``i32``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.bf8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_bf8_f32(res, old_vdst, src0, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32SrFp8BF16Op(res, oldVdst, src0, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert a bf16 value in ``src0`` to an fp8 byte, dividing by the exponent in ``scale`` and using ``seed`` for stochastic rounding. Place the resulting byte in the ``dstSelIndex``-th byte of ``oldVdst`` and return the entire packed vector, which is stored as an ``i32``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.fp8.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_fp8_bf16(res, old_vdst, src0, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrFp8F16Op(res, oldVdst, src0, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert an f16 value in ``src0`` to an fp8 byte, dividing by the exponent in ``scale`` and using ``seed`` for stochastic rounding. Place the resulting byte in the ``dstSelIndex``-th byte of ``oldVdst`` and return the entire packed vector, which is stored as an ``i32``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.fp8.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_fp8_f16(res, old_vdst, src0, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrFp8F32Op(res, oldVdst, src0, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert an f32 value in ``src0`` to an fp8 byte, dividing by the exponent in ``scale`` and using ``seed`` for stochastic rounding. 
Place the resulting byte in the ``dstSelIndex``-th byte of ``oldVdst`` and return the entire packed vector, which is stored as an ``i32``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.fp8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_fp8_f32(res, old_vdst, src0, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk8Bf8Bf16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed bf16 values to packed bf8, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.bf8.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_bf8_bf16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk8Bf8F16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f16 values to packed bf8, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.bf8.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_bf8_f16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32SrPk8Bf8F32Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f32 values to packed bf8, multiplying by the exponent part of ``scale`` before doing so and apply stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.bf8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_bf8_f32(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk8Fp4Bf16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed bf16 values to packed fp4, multiplying by the exponent part of ``scale`` before doing so and apply stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.fp4.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_fp4_bf16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk8Fp4F16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f16 values to packed fp4, multiplying by the exponent part of ``scale`` before doing so and apply stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.fp4.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_fp4_f16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32SrPk8Fp4F32Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f32 values to packed fp4, multiplying by the exponent part of ``scale`` before doing so and apply stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.fp4.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_fp4_f32(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk8Fp8Bf16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed bf16 values to packed fp8, multiplying by the exponent part of ``scale`` before doing so and apply stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.fp8.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_fp8_bf16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk8Fp8F16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f16 values to packed fp8, multiplying by the exponent part of ``scale`` before doing so and apply stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.fp8.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_fp8_f16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32SrPk8Fp8F32Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 8 packed f32 values to packed fp8, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk8.fp8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk8_fp8_f32(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk16Bf6Bf16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed bf16 values to packed bf6, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk16.bf6.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk16_bf6_bf16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk16Bf6F16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed f16 values to packed bf6, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk16.bf6.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk16_bf6_f16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32SrPk16Bf6F32Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed f32 values to packed bf6, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk16.bf6.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk16_bf6_f32(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk16Fp6Bf16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed bf16 values to packed fp6, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk16.fp6.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk16_fp6_bf16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk16Fp6F16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed f16 values to packed fp6, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk16.fp6.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk16_fp6_f16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32SrPk16Fp6F32Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 16 packed f32 values to packed fp6, multiplying by the exponent part of ``scale`` before doing so and applying stochastic rounding. This op is for gfx1250+ arch. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk16.fp6.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk16_fp6_f32(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk32Bf6Bf16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed bf16 values to packed bf6, dividing by the exponent part of ``scale`` before doing so and applying random rounding derived from ``seed``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk32.bf6.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk32_bf6_bf16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk32Bf6F16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed f16 values to packed bf6, dividing by the exponent part of ``scale`` before doing so and applying random rounding derived from ``seed``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk32.bf6.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk32_bf6_f16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32SrPk32Bf6F32Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed f32 values to packed bf6, dividing by the exponent part of ``scale`` before doing so and applying random rounding derived from ``seed``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk32.bf6.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk32_bf6_f32(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk32Fp6Bf16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed bf16 values to packed fp6, dividing by the exponent part of ``scale`` before doing so and applying random rounding derived from ``seed``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk32.fp6.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk32_fp6_bf16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPk32Fp6F16Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed f16 values to packed fp6, dividing by the exponent part of ``scale`` before doing so and applying random rounding derived from ``seed``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk32.fp6.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk32_fp6_f16(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: CvtScaleF32SrPk32Fp6F32Op(res, src, seed, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 packed f32 values to packed fp6, dividing by the exponent part of ``scale`` before doing so and applying random rounding derived from ``seed``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk32.fp6.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk32_fp6_f32(res, src, seed, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPkFp4Bf16Op(res, oldVdst, src, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed bf16 values to packed fp4, dividing by the exponent part of ``scale`` before doing so and using ``seed`` as the random seed for stochastic rounding. The two scaled values are packed (little-endian) into a byte. That byte is used to update the ``dstSelIndex``-th byte of ``oldVdst``, which is returned in its entirety. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk.fp4.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk_fp4_bf16(res, old_vdst, src, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPkFp4F16Op(res, oldVdst, src, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed f16 values to packed fp4, dividing by the exponent part of ``scale`` before doing so and using ``seed`` as the random seed for stochastic rounding. The two scaled values are packed (little-endian) into a byte. 
That byte is used to update the ``dstSelIndex``-th byte of ``oldVdst``, which is returned in its entirety. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk.fp4.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk_fp4_f16(res, old_vdst, src, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF32SrPkFp4F32Op(res, oldVdst, src, seed, scale, dstSelIndex, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert two packed f32 values to packed fp4, dividing by the exponent part of ``scale`` before doing so and using ``seed`` as the random seed for stochastic rounding. The two scaled values are packed (little-endian) into a byte. That byte is used to update the ``dstSelIndex``-th byte of ``oldVdst``, which is returned in its entirety. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.sr.pk.fp4.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: oldVdst() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: seed() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: dstSelIndex() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_sr_pk_fp4_f32(res, old_vdst, src, seed, scale, dst_sel_index, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF322xPk16Bf6F32Op(res, src0, src1, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 single-precision float values, packed into two length-16 vectors that will be logically concatenated, to packed bf6, dividing by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.2xpk16.bf6.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src0() -> _ods_ir .. py:method:: src1() -> _ods_ir .. 
py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_2xpk16_bf6_f32(res, src0, src1, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtScaleF322xPk16Fp6F32Op(res, src0, src1, scale, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert 32 single-precision float values, packed into two length-16 vectors that will be logically concatenated, to packed fp6, dividing by the exponent part of ``scale`` before doing so. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.scalef32.2xpk16.fp6.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src0() -> _ods_ir .. py:method:: src1() -> _ods_ir .. py:method:: scale() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_scalef32_2xpk16_fp6_f32(res, src0, src1, scale, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtSrBf8F32Op(res, srcA, srcB, old, byteSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert ``srcA`` to bf8, adding the rounding factor from ``srcB``, and store into the ``byteSel``-th byte of ``old``, preserving the others. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.sr.bf8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: srcA() -> _ods_ir .. py:method:: srcB() -> _ods_ir .. py:method:: old() -> _ods_ir .. py:method:: byteSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: cvt_sr_bf8_f32(res, src_a, src_b, old, byte_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: CvtSrFp8F32Op(res, srcA, srcB, old, byteSel, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Convert ``srcA`` to fp8, adding the rounding factor from ``srcB``, and store into the ``byteSel``-th byte of ``old``, preserving the others. .. py:attribute:: OPERATION_NAME :value: 'rocdl.cvt.sr.fp8.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: srcA() -> _ods_ir .. py:method:: srcB() -> _ods_ir .. py:method:: old() -> _ods_ir .. py:method:: byteSel() -> _ods_ir .. py:method:: res() -> _ods_ir .. 
py:function:: cvt_sr_fp8_f32(res, src_a, src_b, old, byte_sel, *, loc=None, ip=None) -> _ods_ir .. py:class:: DPPUpdateOp(res, old, src, dppCtrl, rowMask, bankMask, boundCtrl, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.update.dpp' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: old() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: dppCtrl() -> _ods_ir .. py:method:: rowMask() -> _ods_ir .. py:method:: bankMask() -> _ods_ir .. py:method:: boundCtrl() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: update_dpp(res, old, src, dpp_ctrl, row_mask, bank_mask, bound_ctrl, *, loc=None, ip=None) -> _ods_ir .. py:class:: DsBpermuteOp(res, index, src, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds_bpermute' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: index() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: ds_bpermute(res, index, src, *, loc=None, ip=None) -> _ods_ir .. py:class:: DsLoadTr4_B64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Load a matrix of 4-bit data from the ds memory, transpose data between row-major and column-major order, and store the result into a 64-bit vector register. Available in gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds.load.tr4.b64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: ds_load_tr4_b64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. 
py:class:: DsLoadTr6_B96(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Load a matrix of 6-bit data from the ds memory, transpose data between row-major and column-major order, and store the result into a 96-bit vector register. Available in gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds.load.tr6.b96' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: ds_load_tr6_b96(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: DsLoadTr8_B64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Load a matrix of 8-bit data from the ds memory, transpose data between row-major and column-major order, and store the result into a 64-bit vector register. Available in gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds.load.tr8.b64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: ds_load_tr8_b64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: DsLoadTr16_B128(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Load a matrix of 16-bit data from the ds memory, transpose data between row-major and column-major order, and store the result into a 128-bit vector register. Available in gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds.load.tr16.b128' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. 
py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: ds_load_tr16_b128(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: DsSwizzleOp(res, src, offset, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds_swizzle' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: ds_swizzle(res, src, offset, *, loc=None, ip=None) -> _ods_ir .. py:class:: FMed3Op(res, src0, src1, src2, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Computes the median of three floating-point values using the AMDGPU fmed3 intrinsic. This operation is equivalent to ``max(min(a, b), min(max(a, b), c))`` but uses the hardware-accelerated V_MED3_F16/V_MED3_F32 instruction for better performance. The operation supports both scalar and vector floating-point types (f16, f32). Example: .. code:: mlir // Scalar f32 median %result = rocdl.fmed3 %a, %b, %c : f32 // Vector f16 median %result = rocdl.fmed3 %va, %vb, %vc : vector<4xf16> .. py:attribute:: OPERATION_NAME :value: 'rocdl.fmed3' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src0() -> _ods_ir .. py:method:: src1() -> _ods_ir .. py:method:: src2() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: fmed3(res, src0, src1, src2, *, loc=None, ip=None) -> _ods_ir .. py:class:: GetBarrierStateOp(res, id, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.get.barrier.state' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: id() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: s_get_barrier_state(res, id, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: GlobalLoadAsyncToLDSB8Op(globalPtr, ldsPtr, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Asynchronously loads 8 bits of data from a global memory pointer to a Local Data Share (LDS) pointer. Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.async.to.lds.b8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: globalPtr() -> _ods_ir .. py:method:: ldsPtr() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: global_load_async_to_lds_b8(global_ptr, lds_ptr, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> GlobalLoadAsyncToLDSB8Op .. py:class:: GlobalLoadAsyncToLDSB32Op(globalPtr, ldsPtr, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Asynchronously loads 32 bits of data from a global memory pointer to a Local Data Share (LDS) pointer. Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.async.to.lds.b32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: globalPtr() -> _ods_ir .. py:method:: ldsPtr() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: global_load_async_to_lds_b32(global_ptr, lds_ptr, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> GlobalLoadAsyncToLDSB32Op .. 
py:class:: GlobalLoadAsyncToLDSB64Op(globalPtr, ldsPtr, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Asynchronously loads 64 bits of data from a global memory pointer to a Local Data Share (LDS) pointer. Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.async.to.lds.b64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: globalPtr() -> _ods_ir .. py:method:: ldsPtr() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: global_load_async_to_lds_b64(global_ptr, lds_ptr, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> GlobalLoadAsyncToLDSB64Op .. py:class:: GlobalLoadAsyncToLDSB128Op(globalPtr, ldsPtr, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Asynchronously loads 128 bits of data from a global memory pointer to a Local Data Share (LDS) pointer. Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.async.to.lds.b128' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: globalPtr() -> _ods_ir .. py:method:: ldsPtr() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: global_load_async_to_lds_b128(global_ptr, lds_ptr, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> GlobalLoadAsyncToLDSB128Op .. py:class:: GlobalLoadLDSOp(globalPtr, ldsPtr, size, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. 
py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.lds' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: globalPtr() -> _ods_ir .. py:method:: ldsPtr() -> _ods_ir .. py:method:: size() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: global_load_lds(global_ptr, lds_ptr, size, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> GlobalLoadLDSOp .. py:class:: GlobalLoadTr4_B64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Load a matrix of 4-bit data from the global memory, transpose data between row-major and column-major order, and store the result into a 64-bit vector register. Available in gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.tr4.b64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: global_load_tr4_b64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: GlobalLoadTr6_B96(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Load a matrix of 6-bit data from the global memory, transpose data between row-major and column-major order, and store the result into a 96-bit vector register. Available in gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.tr6.b96' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. 
py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: global_load_tr6_b96(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: GlobalLoadTr8_B64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Load a matrix of 8-bit data from the global memory, transpose data between row-major and column-major order, and store the result into a 64-bit vector register. Available in gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.tr.b64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: global_load_tr_b64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: GlobalLoadTr8_B128(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Load a matrix of 16-bit data from the global memory, transpose data between row-major and column-major order, and store the result into a 128-bit vector register. Available in gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.global.load.tr.b128' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: global_load_tr_b128(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: GridDimXOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.grid.dim.x' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. 
py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: grid_dim_x(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: GridDimYOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.grid.dim.y' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: grid_dim_y(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: GridDimZOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.grid.dim.z' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: grid_dim_z(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: IglpOpt(variant, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.iglp.opt' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: variant() -> _ods_ir .. py:function:: iglp_opt(variant, *, loc=None, ip=None) -> IglpOpt .. py:class:: LoadToLDSOp(globalPtr, ldsPtr, size, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.load.to.lds' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: globalPtr() -> _ods_ir .. py:method:: ldsPtr() -> _ods_ir .. py:method:: size() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: load_to_lds(global_ptr, lds_ptr, size, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> LoadToLDSOp .. 
py:class:: MakeBufferRsrcOp(res, base, stride, numRecords, flags, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.make.buffer.rsrc' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: base() -> _ods_ir .. py:method:: stride() -> _ods_ir .. py:method:: numRecords() -> _ods_ir .. py:method:: flags() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: make_buffer_rsrc(res, base, stride, num_records, flags, *, loc=None, ip=None) -> _ods_ir .. py:class:: MbcntHiOp(res, in0, in1, *, arg_attrs=None, res_attrs=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mbcnt.hi' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: in0() -> _ods_ir .. py:method:: in1() -> _ods_ir .. py:method:: arg_attrs() -> Optional[_ods_ir] .. py:method:: res_attrs() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: mbcnt_hi(res, in0, in1, *, arg_attrs=None, res_attrs=None, loc=None, ip=None) -> _ods_ir .. py:class:: MbcntLoOp(res, in0, in1, *, arg_attrs=None, res_attrs=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mbcnt.lo' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: in0() -> _ods_ir .. py:method:: in1() -> _ods_ir .. py:method:: arg_attrs() -> Optional[_ods_ir] .. py:method:: res_attrs() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: mbcnt_lo(res, in0, in1, *, arg_attrs=None, res_attrs=None, loc=None, ip=None) -> _ods_ir .. py:class:: Permlane16SwapOp(res, old, src, fi, boundControl, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Performs a ``permlane16.swap`` operation with the given operands, applying the permutation specified by $fi to the provided inputs. .. py:attribute:: OPERATION_NAME :value: 'rocdl.permlane16.swap' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: old() -> _ods_ir .. py:method:: src() -> _ods_ir .. 
py:method:: fi() -> _ods_ir .. py:method:: boundControl() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: permlane16_swap(res, old, src, fi, bound_control, *, loc=None, ip=None) -> _ods_ir .. py:class:: Permlane32SwapOp(res, old, src, fi, boundControl, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Performs a ``permlane32.swap`` operation with the given operands, applying the permutation specified by $fi to the provided inputs. .. py:attribute:: OPERATION_NAME :value: 'rocdl.permlane32.swap' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: old() -> _ods_ir .. py:method:: src() -> _ods_ir .. py:method:: fi() -> _ods_ir .. py:method:: boundControl() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: permlane32_swap(res, old, src, fi, bound_control, *, loc=None, ip=None) -> _ods_ir .. py:class:: PermlaneX16Op(res, old, src0, src1, src2, fi, boundControl, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Performs a ``permlanex16`` operation with the given operands, applying the permutation specified by $fi to the provided inputs. .. py:attribute:: OPERATION_NAME :value: 'rocdl.permlanex16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: old() -> _ods_ir .. py:method:: src0() -> _ods_ir .. py:method:: src1() -> _ods_ir .. py:method:: src2() -> _ods_ir .. py:method:: fi() -> _ods_ir .. py:method:: boundControl() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: permlanex16(res, old, src0, src1, src2, fi, bound_control, *, loc=None, ip=None) -> _ods_ir .. py:class:: RawBufferAtomicCmpSwap(res, src, cmp, rsrc, offset, soffset, aux, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.buffer.atomic.cmpswap' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: cmp() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. 
py:method:: res() -> _ods_ir .. py:function:: raw_buffer_atomic_cmpswap(res, src, cmp, rsrc, offset, soffset, aux, *, loc=None, ip=None) -> _ods_ir .. py:class:: RawBufferAtomicFAddOp(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.buffer.atomic.fadd' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:function:: raw_buffer_atomic_fadd(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) -> RawBufferAtomicFAddOp .. py:class:: RawBufferAtomicFMaxOp(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.buffer.atomic.fmax' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:function:: raw_buffer_atomic_fmax(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) -> RawBufferAtomicFMaxOp .. py:class:: RawBufferAtomicSMaxOp(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.buffer.atomic.smax' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:function:: raw_buffer_atomic_smax(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) -> RawBufferAtomicSMaxOp .. py:class:: RawBufferAtomicUMinOp(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.buffer.atomic.umin' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. 
py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:function:: raw_buffer_atomic_umin(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) -> RawBufferAtomicUMinOp .. py:class:: RawBufferLoadOp(res, rsrc, offset, soffset, aux, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.buffer.load' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: raw_buffer_load(res, rsrc, offset, soffset, aux, *, loc=None, ip=None) -> _ods_ir .. py:class:: RawBufferStoreOp(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.buffer.store' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:function:: raw_buffer_store(vdata, rsrc, offset, soffset, aux, *, loc=None, ip=None) -> RawBufferStoreOp .. py:class:: RawPtrBufferAtomicCmpSwap(res, src, cmp, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.ptr.buffer.atomic.cmpswap' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: cmp() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. 
py:function:: raw_ptr_buffer_atomic_cmpswap(res, src, cmp, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: RawPtrBufferAtomicFaddOp(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.ptr.buffer.atomic.fadd' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: raw_ptr_buffer_atomic_fadd(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> RawPtrBufferAtomicFaddOp .. py:class:: RawPtrBufferAtomicFmaxOp(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.ptr.buffer.atomic.fmax' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: raw_ptr_buffer_atomic_fmax(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> RawPtrBufferAtomicFmaxOp .. py:class:: RawPtrBufferAtomicSmaxOp(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. 
py:attribute:: OPERATION_NAME :value: 'rocdl.raw.ptr.buffer.atomic.smax' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: raw_ptr_buffer_atomic_smax(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> RawPtrBufferAtomicSmaxOp .. py:class:: RawPtrBufferAtomicUminOp(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.ptr.buffer.atomic.umin' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: raw_ptr_buffer_atomic_umin(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> RawPtrBufferAtomicUminOp .. py:class:: RawPtrBufferLoadLdsOp(rsrc, ldsPtr, size, voffset, soffset, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.ptr.buffer.load.lds' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: rsrc() -> _ods_ir .. py:method:: ldsPtr() -> _ods_ir .. py:method:: size() -> _ods_ir .. py:method:: voffset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. 
py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: raw_ptr_buffer_load_lds(rsrc, lds_ptr, size, voffset, soffset, offset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> RawPtrBufferLoadLdsOp .. py:class:: RawPtrBufferLoadOp(res, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.ptr.buffer.load' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: raw_ptr_buffer_load(res, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: RawPtrBufferStoreOp(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.raw.ptr.buffer.store' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: vdata() -> _ods_ir .. py:method:: rsrc() -> _ods_ir .. py:method:: offset() -> _ods_ir .. py:method:: soffset() -> _ods_ir .. py:method:: aux() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: raw_ptr_buffer_store(vdata, rsrc, offset, soffset, aux, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> RawPtrBufferStoreOp .. 
py:class:: ReadfirstlaneOp(res, src, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Returns the value in the lowest active lane of the input operand. .. py:attribute:: OPERATION_NAME :value: 'rocdl.readfirstlane' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: readfirstlane(res, src, *, loc=None, ip=None) -> _ods_ir .. py:class:: ReadlaneOp(res, src0, src1, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Get the value in lane ``src1`` from input ``src0``. .. py:attribute:: OPERATION_NAME :value: 'rocdl.readlane' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: src0() -> _ods_ir .. py:method:: src1() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: readlane(res, src0, src1, *, loc=None, ip=None) -> _ods_ir .. py:class:: SBarrierOp(*, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.barrier' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:function:: s_barrier(*, loc=None, ip=None) -> SBarrierOp .. py:class:: SSleepOp(count, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.sleep' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: count() -> _ods_ir .. py:function:: s_sleep(count, *, loc=None, ip=None) -> SSleepOp .. py:class:: SWaitcntOp(bitfield, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.waitcnt' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: bitfield() -> _ods_ir .. py:function:: s_waitcnt(bitfield, *, loc=None, ip=None) -> SWaitcntOp .. py:class:: SchedBarrier(mask, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.sched.barrier' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: mask() -> _ods_ir .. py:function:: sched_barrier(mask, *, loc=None, ip=None) -> SchedBarrier .. 
py:class:: SchedGroupBarrier(mask, size, groupId, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.sched.group.barrier' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: mask() -> _ods_ir .. py:method:: size() -> _ods_ir .. py:method:: groupId() -> _ods_ir .. py:function:: sched_group_barrier(mask, size, group_id, *, loc=None, ip=None) -> SchedGroupBarrier .. py:class:: SetPrioOp(priority, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.setprio' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: priority() -> _ods_ir .. py:function:: s_setprio(priority, *, loc=None, ip=None) -> SetPrioOp .. py:class:: TensorLoadToLDSD2Op(dgroup0, dgroup1, cachePolicy, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Moves tiles of tensor data between global memory and LDS. The tile is described by the $dgroup descriptors. 2 $dgroup descriptors allow for movement of up to 2D tensors. $cachePolicy describes the memory scope and an indicator of expected data re-use. This op is for gfx1250+ architectures. .. py:attribute:: OPERATION_NAME :value: 'rocdl.tensor.load.to.lds.d2' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: dgroup0() -> _ods_ir .. py:method:: dgroup1() -> _ods_ir .. py:method:: cachePolicy() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: tensor_load_to_lds_d2(dgroup0, dgroup1, cache_policy, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> TensorLoadToLDSD2Op .. py:class:: TensorLoadToLDSOp(dgroup0, dgroup1, dgroup2, dgroup3, cachePolicy, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Moves tiles of tensor data between global memory and LDS.
The tile is described by the ``dgroup`` descriptors. Four ``dgroup`` descriptors allow movement of up to 5D tensors. ``cachePolicy`` describes the memory scope and an indicator of expected data re-use. This op is for gfx1250+ architectures. .. py:attribute:: OPERATION_NAME :value: 'rocdl.tensor.load.to.lds' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: dgroup0() -> _ods_ir .. py:method:: dgroup1() -> _ods_ir .. py:method:: dgroup2() -> _ods_ir .. py:method:: dgroup3() -> _ods_ir .. py:method:: cachePolicy() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: tensor_load_to_lds(dgroup0, dgroup1, dgroup2, dgroup3, cache_policy, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> TensorLoadToLDSOp .. py:class:: TensorStoreFromLDSD2Op(dgroup0, dgroup1, cachePolicy, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Moves tiles of tensor data between global memory and LDS. The tile is described by the ``dgroup`` descriptors. Two ``dgroup`` descriptors allow movement of up to 2D tensors. ``cachePolicy`` describes the memory scope and an indicator of expected data re-use. This op is for gfx1250+ architectures. .. py:attribute:: OPERATION_NAME :value: 'rocdl.tensor.store.from.lds.d2' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: dgroup0() -> _ods_ir .. py:method:: dgroup1() -> _ods_ir .. py:method:: cachePolicy() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: tensor_store_from_lds_d2(dgroup0, dgroup1, cache_policy, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> TensorStoreFromLDSD2Op .. 
py:class:: TensorStoreFromLDSOp(dgroup0, dgroup1, dgroup2, dgroup3, cachePolicy, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Moves tiles of tensor data between global memory and LDS. The tile is described by the ``dgroup`` descriptors. Four ``dgroup`` descriptors allow movement of up to 5D tensors. ``cachePolicy`` describes the memory scope and an indicator of expected data re-use. This op is for gfx1250+ architectures. .. py:attribute:: OPERATION_NAME :value: 'rocdl.tensor.store.from.lds' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: dgroup0() -> _ods_ir .. py:method:: dgroup1() -> _ods_ir .. py:method:: dgroup2() -> _ods_ir .. py:method:: dgroup3() -> _ods_ir .. py:method:: cachePolicy() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:function:: tensor_store_from_lds(dgroup0, dgroup1, dgroup2, dgroup3, cache_policy, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> TensorStoreFromLDSOp .. py:class:: ThreadIdXOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.workitem.id.x' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workitem_id_x(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: ThreadIdYOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.workitem.id.y' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workitem_id_y(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: ThreadIdZOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.workitem.id.z' .. 
py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: workitem_id_z(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: WaitAsynccntOp(count, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Wait for the specified counter to be less than or equal to ``count`` before continuing. Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.wait.asynccnt' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: count() -> _ods_ir .. py:function:: s_wait_asynccnt(count, *, loc=None, ip=None) -> WaitAsynccntOp .. py:class:: WaitDscntOp(count, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Wait for the specified counter to be less than or equal to ``count`` before continuing. Available on gfx12+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.wait.dscnt' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: count() -> _ods_ir .. py:function:: s_wait_dscnt(count, *, loc=None, ip=None) -> WaitDscntOp .. py:class:: WaitExpcntOp(count, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Wait for the specified counter to be less than or equal to ``count`` before continuing. Available on gfx12+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.wait.expcnt' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: count() -> _ods_ir .. py:function:: s_wait_expcnt(count, *, loc=None, ip=None) -> WaitExpcntOp .. py:class:: WaitLoadcntOp(count, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Wait for the specified counter to be less than or equal to ``count`` before continuing. Available on gfx12+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.wait.loadcnt' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: count() -> _ods_ir .. py:function:: s_wait_loadcnt(count, *, loc=None, ip=None) -> WaitLoadcntOp .. 
py:class:: WaitStorecntOp(count, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Wait for the specified counter to be less than or equal to ``count`` before continuing. Available on gfx12+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.wait.storecnt' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: count() -> _ods_ir .. py:function:: s_wait_storecnt(count, *, loc=None, ip=None) -> WaitStorecntOp .. py:class:: WaitTensorcntOp(count, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` Wait for the specified counter to be less than or equal to ``count`` before continuing. Available on gfx1250+. .. py:attribute:: OPERATION_NAME :value: 'rocdl.s.wait.tensorcnt' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: count() -> _ods_ir .. py:function:: s_wait_tensorcnt(count, *, loc=None, ip=None) -> WaitTensorcntOp .. py:class:: WavefrontSizeOp(res, *, range=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wavefrontsize' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: range() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: wavefrontsize(res, *, range=None, loc=None, ip=None) -> _ods_ir .. py:class:: ds_read_tr4_b64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds.read.tr4.b64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: ds_read_tr4_b64_(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: ds_read_tr6_b96(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. 
py:attribute:: OPERATION_NAME :value: 'rocdl.ds.read.tr6.b96' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: ds_read_tr6_b96_(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: ds_read_tr8_b64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds.read.tr8.b64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: ds_read_tr8_b64_(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: ds_read_tr16_b64(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.ds.read.tr16.b64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: ptr() -> _ods_ir .. py:method:: alias_scopes() -> Optional[_ods_ir] .. py:method:: noalias_scopes() -> Optional[_ods_ir] .. py:method:: tbaa() -> Optional[_ods_ir] .. py:method:: res() -> _ods_ir .. py:function:: ds_read_tr16_b64_(res, ptr, *, alias_scopes=None, noalias_scopes=None, tbaa=None, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_4x4x1f32(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.4x4x1f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_4x4x1f32_(res, args, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: mfma_f32_4x4x2bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.4x4x2bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_4x4x2bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_4x4x4bf16_1k(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.4x4x4bf16.1k' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_4x4x4bf16_1k_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_4x4x4f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.4x4x4f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_4x4x4f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x1f32(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x1f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x1f32_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x2bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x2bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x2bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x4bf16_1k(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x4bf16.1k' .. 
py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x4bf16_1k_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x4f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x4f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x4f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x4f32(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x4f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x4f32_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x8_xf32(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x8.xf32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x8_xf32_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x8bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x8bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x8bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x16bf16_1k(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x16bf16.1k' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. 
py:function:: mfma_f32_16x16x16bf16_1k_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x16f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x16f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x16f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x32_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x32.bf8.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x32_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x32_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x32.bf8.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x32_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x32_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x32.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x32_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x32_f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x32.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x32_f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: mfma_f32_16x16x32_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x32.fp8.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x32_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_16x16x32_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.16x16x32.fp8.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_16x16x32_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x1f32(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x1f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x1f32_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x2bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x2bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x2bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x2f32(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x2f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x2f32_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x4_xf32(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x4.xf32' .. 
py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x4_xf32_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x4bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x4bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x4bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x4bf16_1k(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x4bf16.1k' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x4bf16_1k_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x4f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x4f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x4f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x8bf16_1k(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x8bf16.1k' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x8bf16_1k_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x8f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x8f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. 
py:function:: mfma_f32_32x32x8f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x16_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x16.bf8.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x16_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x16_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x16.bf8.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x16_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x16_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x16.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x16_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x16_f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x16.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x16_f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f32_32x32x16_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x16.fp8.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x16_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: mfma_f32_32x32x16_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f32.32x32x16.fp8.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f32_32x32x16_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f64_4x4x4f64(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f64.4x4x4f64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f64_4x4x4f64_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_f64_16x16x4f64(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.f64.16x16x4f64' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_f64_16x16x4f64_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_i32_4x4x4i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.4x4x4i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_4x4x4i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_i32_16x16x4i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.16x16x4i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_16x16x4i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_i32_16x16x16i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.16x16x16i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. 
py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_16x16x16i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_i32_16x16x32_i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.16x16x32.i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_16x16x32_i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_i32_16x16x64_i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.16x16x64.i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_16x16x64_i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_i32_32x32x4i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.32x32x4i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_32x32x4i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_i32_32x32x8i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.32x32x8i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_32x32x8i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_i32_32x32x16_i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.32x32x16.i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_32x32x16_i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: mfma_i32_32x32x32_i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.i32.32x32x32.i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_i32_32x32x32_i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_scale_f32_16x16x128_f8f6f4(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.scale.f32.16x16x128.f8f6f4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_scale_f32_16x16x128_f8f6f4_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: mfma_scale_f32_32x32x64_f8f6f4(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.mfma.scale.f32.32x32x64.f8f6f4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: mfma_scale_f32_32x32x64_f8f6f4_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_16x16x32_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.16x16x32.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_16x16x32_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_16x16x32_f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.16x16x32.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_16x16x32_f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_16x16x64_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. 
py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.16x16x64.bf8.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_16x16x64_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_16x16x64_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.16x16x64.bf8.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_16x16x64_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_16x16x64_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.16x16x64.fp8.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_16x16x64_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_16x16x64_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.16x16x64.fp8.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_16x16x64_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_32x32x16_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.32x32x16.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_32x32x16_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_32x32x16_f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.32x32x16.f16' .. 
py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_32x32x16_f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_32x32x32_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.32x32x32.bf8.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_32x32x32_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_32x32x32_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.32x32x32.bf8.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_32x32x32_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_32x32x32_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.32x32x32.fp8.bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_32x32x32_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_f32_32x32x32_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.f32.32x32x32.fp8.fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_f32_32x32x32_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_i32_16x16x64_i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.i32.16x16x64.i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. 
py:method:: res() -> _ods_ir .. py:function:: smfmac_i32_16x16x64_i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: smfmac_i32_32x32x32_i8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.smfmac.i32.32x32x32.i8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: smfmac_i32_32x32x32_i8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_bf16_16x16x16_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.bf16.16x16x16.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_bf16_16x16x16_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_bf16_16x16x32_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.bf16.16x16x32.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_bf16_16x16x32_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_bf16f32_16x16x32_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.bf16f32.16x16x32.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_bf16f32_16x16x32_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x16_f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x16.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x16_f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: wmma_f16_16x16x32_f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x32.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x32_f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x64_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x64.bf8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x64_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x64_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x64.bf8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x64_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x64_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x64.fp8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x64_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x64_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x64.fp8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x64_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x128_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. 
py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x128.bf8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x128_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x128_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x128.bf8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x128_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x128_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x128.fp8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x128_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f16_16x16x128_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f16.16x16x128.fp8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f16_16x16x128_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x4_f32(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x4.f32' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x4_f32_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x16_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x16.bf8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. 
py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x16_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x16_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x16.bf8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x16_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x16_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x16.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x16_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x16_f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x16.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x16_f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x16_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x16.fp8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x16_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x16_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x16.fp8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. 
py:function:: wmma_f32_16x16x16_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x32_bf16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x32.bf16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x32_bf16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x32_f16(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x32.f16' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x32_f16_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x64_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x64.bf8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x64_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x64_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x64.bf8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x64_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x64_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x64.fp8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x64_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. 
py:class:: wmma_f32_16x16x64_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x64.fp8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x64_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x128_bf8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x128.bf8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x128_bf8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x128_bf8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x128.bf8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x128_bf8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x128_fp8_bf8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x128.fp8_bf8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x128_fp8_bf8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_f32_16x16x128_fp8_fp8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.f32.16x16x128.fp8_fp8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_f32_16x16x128_fp8_fp8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_i32_16x16x16_iu4(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. 
py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.i32.16x16x16.iu4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_i32_16x16x16_iu4_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_i32_16x16x16_iu8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.i32.16x16x16.iu8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_i32_16x16x16_iu8_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_i32_16x16x32_iu4(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.i32.16x16x32.iu4' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_i32_16x16x32_iu4_(res, args, *, loc=None, ip=None) -> _ods_ir .. py:class:: wmma_i32_16x16x64_iu8(res, args, *, loc=None, ip=None) Bases: :py:obj:`_ods_ir` .. py:attribute:: OPERATION_NAME :value: 'rocdl.wmma.i32.16x16x64.iu8' .. py:attribute:: _ODS_REGIONS :value: (0, True) .. py:method:: args() -> _ods_ir .. py:method:: res() -> _ods_ir .. py:function:: wmma_i32_16x16x64_iu8_(res, args, *, loc=None, ip=None) -> _ods_ir