From 5e66fb6ff4e92814cd2728055f630b0b5f086fe2 Mon Sep 17 00:00:00 2001 From: YangWen Huang Date: Thu, 26 Jun 2025 22:52:17 +0000 Subject: [PATCH] Update gfx1150 library to new format --- .../gfx1150_Cijk_Ailk_Bjlk_DB_UserArgs.yaml | 296 +- ...jk_Ailk_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml | 296 +- .../gfx1150_Cijk_Ailk_Bljk_DB_UserArgs.yaml | 296 +- ...jk_Ailk_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml | 296 +- .../gfx1150_Cijk_Alik_Bjlk_DB_UserArgs.yaml | 296 +- ...jk_Alik_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml | 296 +- .../gfx1150_Cijk_Alik_Bljk_DB_UserArgs.yaml | 296 +- ...jk_Alik_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml | 296 +- ...jlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml | 3727 +--------- ...ilk_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml | 3727 +--------- ...fx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAH.yaml | 258 +- ...ilk_Bjlk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml | 436 +- ...jlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml | 3727 +--------- ...ilk_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml | 3727 +--------- ...fx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAH.yaml | 258 +- ...ilk_Bjlk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml | 508 +- ..._Cijk_Ailk_Bjlk_I8BH_HAI_SAV_UserArgs.yaml | 364 +- ...jk_Ailk_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml | 292 +- ...ljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml | 5333 +-------------- ...ilk_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml | 5333 +-------------- ...fx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAH.yaml | 258 +- ...ilk_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml | 436 +- ...ljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml | 5114 +------------- ...ilk_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml | 5114 +------------- ...fx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAH.yaml | 258 +- ...ilk_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml | 436 +- ..._Cijk_Ailk_Bljk_I8BH_HAI_SAV_UserArgs.yaml | 364 +- ...jk_Ailk_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml | 436 +- ...jlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml | 5333 +-------------- ...lik_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml | 5333 +-------------- ...ijk_Alik_Bjlk_BSS_BH_HAS_SAV_UserArgs.yaml | 364 +- ...jlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml | 5990 +---------------- ...lik_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml | 5990 +---------------- ...ijk_Alik_Bjlk_HSS_BH_HAS_SAV_UserArgs.yaml | 580 +- ..._Cijk_Alik_Bjlk_I8BH_HAI_SAV_UserArgs.yaml | 508 +- ...jk_Alik_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml | 436 +- ...ljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml | 4676 +------------ ...lik_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml | 4676 +------------ ...fx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAH.yaml | 258 +- ...lik_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml | 364 +- ...ljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml | 5333 +-------------- ...lik_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml | 5333 +-------------- ...fx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAH.yaml | 258 +- ...lik_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml | 220 +- ..._Cijk_Alik_Bljk_I8BH_HAI_SAV_UserArgs.yaml | 580 +- ...jk_Alik_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml | 436 +- 46 files changed, 86 insertions(+), 89056 deletions(-) diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bjlk_DB_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bjlk_DB_UserArgs.yaml index f73ea7c51e1..e849da0abea 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bjlk_DB_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bjlk_DB_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 0 UseScaleCD: false - - 1LDSBuffer: 0 @@ -190,79 +190,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -433,79 +360,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -676,79 +530,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -919,79 +700,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml index 6df39a22943..6f9df3c1e06 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -190,79 +190,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -433,79 +360,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -676,79 +530,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -919,79 +700,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bljk_DB_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bljk_DB_UserArgs.yaml index 6734c58f72f..d7165a7c69e 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bljk_DB_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bljk_DB_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 0 UseScaleCD: false - - 1LDSBuffer: 0 @@ -190,79 +190,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -433,79 +360,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -676,79 +530,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -919,79 +700,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml index 40a25acedca..9fe04de5853 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Ailk_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -190,79 +190,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -433,79 +360,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -676,79 +530,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -919,79 +700,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bjlk_DB_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bjlk_DB_UserArgs.yaml index 3232eea2048..f7340957073 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bjlk_DB_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bjlk_DB_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 0 UseScaleCD: false - - 1LDSBuffer: 0 @@ -190,79 +190,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: true - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -433,79 +360,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: true - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -676,79 +530,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: true - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -919,79 +700,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: true - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml index d87ff009cec..2288fe1f864 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bjlk_SB_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -190,79 +190,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -433,79 +360,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -676,79 +530,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -919,79 +700,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bljk_DB_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bljk_DB_UserArgs.yaml index ec4027ac6a9..176a3c5fece 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bljk_DB_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bljk_DB_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 0 UseScaleCD: false - - 1LDSBuffer: 0 @@ -190,79 +190,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -433,79 +360,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -676,79 +530,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -919,79 +700,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: false - ActivationComputeDataType: 1 - ActivationNoGuard: false - ActivationType: none - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [1] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 1 - DataType: 1 - DataTypeA: 1 - DataTypeB: 1 - DataTypeE: 1 - DestDataType: 1 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 0 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml index 76f2831048b..2c540541cee 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/Equality/gfx1150_Cijk_Alik_Bljk_SB_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -190,79 +190,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -433,79 +360,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -676,79 +530,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 @@ -919,79 +700,6 @@ PrefetchGlobalRead: 1 PrefetchLocalRead: 0 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 0 - DataTypeA: 0 - DataTypeB: 0 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: false - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 1 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml index 6a15eafefb8..8acce3ea09f 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: true UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml index d6ead8dc821..952809cb6a7 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAH.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAH.yaml index ac9bcfe8a5c..79dcf5ed258 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAH.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAH.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -189,70 +189,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -430,70 +366,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -671,70 +543,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -912,70 +720,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml index b1e8cc8792a..42f9540a618 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -204,78 +204,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -461,78 +389,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -718,78 +574,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -975,78 +759,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1232,78 +944,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1489,78 +1129,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml index 297675b1a23..a00a7c2372c 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: true UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml index b2f59487a77..8a97b7da13d 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAH.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAH.yaml index b7792b0b4b7..5dcc6ab5896 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAH.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAH.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -189,70 +189,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -430,70 +366,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -671,70 +543,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -912,70 +720,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: true - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml index d8f6354d8bb..25bab52c420 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -204,78 +204,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -461,78 +389,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -718,78 +574,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -975,78 +759,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1232,78 +944,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1489,78 +1129,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1746,78 +1314,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_I8BH_HAI_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_I8BH_HAI_SAV_UserArgs.yaml index 88ef0468131..686d481e97a 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_I8BH_HAI_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_I8BH_HAI_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -198,78 +198,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -449,78 +377,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -700,78 +556,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -951,78 +735,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1202,78 +914,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml index 190bce6d2ab..51165bbb10e 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -198,78 +198,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -449,78 +377,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -700,78 +556,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -951,78 +735,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml index 08c374345a9..a903fdc3271 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: true UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18407,79 +13297,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18667,79 +13484,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18927,79 +13671,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml index e6343cc6fb0..26594fe7558 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18407,79 +13297,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18667,79 +13484,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18927,79 +13671,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAH.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAH.yaml index 283ece2bacf..df0b8dd225c 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAH.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAH.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -189,70 +189,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -430,70 +366,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -671,70 +543,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -912,70 +720,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml index 194912b2fb0..6902099e0cf 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -204,78 +204,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -461,78 +389,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -718,78 +574,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -975,78 +759,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1232,78 +944,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1489,78 +1129,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml index ec217d9c5c5..a734590311f 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: true UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml index e5b5dd3ca8c..e1336748fc6 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAH.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAH.yaml index 492d8b0ec27..48f69e2742c 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAH.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAH.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -189,70 +189,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -430,70 +366,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -671,70 +543,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -912,70 +720,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: false - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml index e33d4da75dc..a1e531ccf05 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -204,78 +204,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -461,78 +389,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -718,78 +574,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -975,78 +759,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1232,78 +944,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1489,78 +1129,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_I8BH_HAI_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_I8BH_HAI_SAV_UserArgs.yaml index 5d728271e89..d0defac74fb 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_I8BH_HAI_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_I8BH_HAI_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -198,78 +198,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -449,78 +377,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -700,78 +556,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -951,78 +735,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1202,78 +914,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml index e4091d4bfa2..d4d86dd3277 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Ailk_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -198,78 +198,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -449,78 +377,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -700,78 +556,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -951,78 +735,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1202,78 +914,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1453,78 +1093,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [0, 3, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 1 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: true - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 0 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml index 8cb191757c7..33d46ec4c1b 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: true UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18407,79 +13297,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18667,79 +13484,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18927,79 +13671,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml index ba49a884cdd..a325ff908cb 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18407,79 +13297,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18667,79 +13484,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18927,79 +13671,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BSS_BH_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BSS_BH_HAS_SAV_UserArgs.yaml index ece0d84ed39..eb381272271 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BSS_BH_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_BSS_BH_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -204,78 +204,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -461,78 +389,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -718,78 +574,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -975,78 +759,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1232,78 +944,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml index 747bc6b2e34..a6739f684f6 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: true UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18407,79 +13297,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18667,79 +13484,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18927,79 +13671,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -19187,79 +13858,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -19447,79 +14045,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -19707,79 +14232,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -19967,79 +14419,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -20227,79 +14606,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -20487,79 +14793,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -20747,79 +14980,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -21007,79 +15167,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -21267,79 +15354,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml index 9fd8a77f4be..71d5e57334b 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18407,79 +13297,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18667,79 +13484,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18927,79 +13671,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -19187,79 +13858,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -19447,79 +14045,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -19707,79 +14232,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -19967,79 +14419,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -20227,79 +14606,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -20487,79 +14793,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -20747,79 +14980,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -21007,79 +15167,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -21267,79 +15354,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HSS_BH_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HSS_BH_HAS_SAV_UserArgs.yaml index e378a9bbd16..d09fad2ad57 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HSS_BH_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_HSS_BH_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -204,78 +204,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -461,78 +389,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -718,78 +574,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -975,78 +759,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1232,78 +944,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1489,78 +1129,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1746,78 +1314,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2003,78 +1499,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_I8BH_HAI_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_I8BH_HAI_SAV_UserArgs.yaml index f99b7ecde2f..3393a5960c7 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_I8BH_HAI_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_I8BH_HAI_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -198,78 +198,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -449,78 +377,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -700,78 +556,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -951,78 +735,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1202,78 +914,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1453,78 +1093,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1704,78 +1272,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml index 92530638bd7..a91b677d165 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bjlk_I8II_BH_HAI_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -198,78 +198,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -449,78 +377,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -700,78 +556,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -951,78 +735,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1202,78 +914,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1453,78 +1093,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [1, 3, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 1 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: true - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 1 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml index 429da7c6368..64d42e6bbce 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BBS_BH_Bias_AuxB_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: true UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml index 6dc515c5b6d..0b47af2257f 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BBS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 7 - DestDataType: 7 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAH.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAH.yaml index 637e21ab6ac..fba4555a0fd 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAH.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAH.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -189,70 +189,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -430,70 +366,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -671,70 +543,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -912,70 +720,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml index 979bbad67dd..059fa1e660d 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_BSS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -204,78 +204,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -461,78 +389,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -718,78 +574,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -975,78 +759,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1232,78 +944,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 7] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 7 - DataTypeA: 7 - DataTypeB: 7 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml index eef50297039..2e26196c0b2 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HHS_BH_Bias_AuxH_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: true UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18407,79 +13297,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18667,79 +13484,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18927,79 +13671,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: true - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml index cd886b9b0ec..3926694cc12 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HHS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -71,7 +71,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -207,79 +207,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -467,79 +394,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -727,79 +581,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -987,79 +768,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1247,79 +955,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1507,79 +1142,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1767,79 +1329,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2027,79 +1516,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2287,79 +1703,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2547,79 +1890,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -2807,79 +2077,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3067,79 +2264,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3327,79 +2451,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3587,79 +2638,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -3847,79 +2825,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4107,79 +3012,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4367,79 +3199,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4627,79 +3386,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -4887,79 +3573,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5147,79 +3760,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5407,79 +3947,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5667,79 +4134,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -5927,79 +4321,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6187,79 +4508,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6447,79 +4695,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6707,79 +4882,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -6967,79 +5069,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7227,79 +5256,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7487,79 +5443,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -7747,79 +5630,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8007,79 +5817,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8267,79 +6004,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8527,79 +6191,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -8787,79 +6378,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9047,79 +6565,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9307,79 +6752,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9567,79 +6939,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -9827,79 +7126,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10087,79 +7313,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10347,79 +7500,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10607,79 +7687,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -10867,79 +7874,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11127,79 +8061,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11387,79 +8248,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11647,79 +8435,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -11907,79 +8622,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12167,79 +8809,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12427,79 +8996,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12687,79 +9183,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -12947,79 +9370,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13207,79 +9557,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13467,79 +9744,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13727,79 +9931,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -13987,79 +10118,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14247,79 +10305,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14507,79 +10492,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -14767,79 +10679,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15027,79 +10866,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15287,79 +11053,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15547,79 +11240,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -15807,79 +11427,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16067,79 +11614,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16327,79 +11801,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16587,79 +11988,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -16847,79 +12175,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17107,79 +12362,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17367,79 +12549,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17627,79 +12736,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -17887,79 +12923,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18147,79 +13110,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18407,79 +13297,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18667,79 +13484,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -18927,79 +13671,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 4 - DestDataType: 4 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StochasticRounding: false - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAH.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAH.yaml index f8811500cea..b87b801df02 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAH.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAH.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -189,70 +189,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -430,70 +366,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -671,70 +543,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -912,70 +720,6 @@ PackedC1IndicesX: [1] PrefetchGlobalRead: 2 PrefetchLocalRead: 3 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: true - TransposeB: false - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml index b519c6f54d1..8fb69bb4dac 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_HSS_BH_Bias_HAS_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -204,78 +204,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -461,78 +389,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -718,78 +574,6 @@ PrefetchGlobalRead: 2 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 0 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: true - BiasDataTypeList: [0, 4] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 0 - DataType: 4 - DataTypeA: 4 - DataTypeB: 4 - DataTypeE: 0 - DestDataType: 0 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 1 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_I8BH_HAI_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_I8BH_HAI_SAV_UserArgs.yaml index 359783b694b..4d8f9f019db 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_I8BH_HAI_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_I8BH_HAI_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -198,78 +198,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -449,78 +377,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -700,78 +556,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -951,78 +735,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1202,78 +914,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1453,78 +1093,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1704,78 +1272,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1955,78 +1451,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 8 - DestDataType: 8 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 diff --git a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml index 1e1c8920de0..afcd7931d2a 100644 --- a/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml +++ b/projects/hipblaslt/library/src/amd_detail/rocblaslt/src/Tensile/Logic/asm_full/gfx1150/GridBased/gfx1150_Cijk_Alik_Bljk_I8II_BH_HAI_SAV_UserArgs.yaml @@ -1,4 +1,4 @@ -- {MinimumRequiredVersion: 4.33.0} +- {MinimumRequiredVersion: 5.0.0} - gfx1150 - gfx1150 - [Device 150e] @@ -70,7 +70,7 @@ UseE: false UseInitialStridesAB: false UseInitialStridesCD: false - UseScaleAB: "" + UseScaleAB: '' UseScaleAlphaVec: 1 UseScaleCD: false - - 1LDSBuffer: 0 @@ -198,78 +198,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -449,78 +377,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -700,78 +556,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -951,78 +735,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1202,78 +914,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1 @@ -1453,78 +1093,6 @@ PrefetchGlobalRead: 0 PrefetchLocalRead: 1 PreloadKernArgs: 0 - ProblemType: - Activation: true - ActivationComputeDataType: 6 - ActivationNoGuard: false - ActivationType: hipblaslt_all - AllowNoFreeDims: false - AssignedDerivedParameters: true - Batched: true - BetaOnlyUseBias: false - BiasDataTypeList: [6] - BiasSrc: D - ComplexConjugateA: false - ComplexConjugateB: false - ComputeDataType: 6 - DataType: 8 - DataTypeA: 8 - DataTypeB: 8 - DataTypeE: 6 - DestDataType: 6 - F32XdlMathOp: 0 - Gradient: false - GroupedGemm: false - HighPrecisionAccumulate: true - Index0: 0 - Index01A: 0 - Index01B: 1 - Index1: 1 - IndexAssignmentsA: [3, 0, 2] - IndexAssignmentsB: [3, 1, 2] - IndexAssignmentsLD: [4, 5, 6, 7] - IndexAssignmentsMetadata: [3, 0, 2] - IndexUnroll: 3 - IndexUnrollA: 0 - IndexUnrollB: 0 - IndexUnrollM: 0 - IndicesBatch: [2] - IndicesFree: [0, 1] - IndicesSummation: [3] - MirrorDimsA: [] - MirrorDimsB: [] - MirrorDimsMetadata: [] - NumIndicesBatch: 1 - NumIndicesC: 3 - NumIndicesFree: 2 - NumIndicesLD: 4 - NumIndicesSummation: 1 - OperationType: GEMM - SetConstStrideA: [] - SetConstStrideB: [] - SetConstStrideBias: [] - SilentHighPrecisionAccumulate: false - Sparse: 0 - StridedBatched: true - SupportUserArgs: true - TLUA: false - TLUB: false - Tensor0: 0 - Tensor1: 1 - TileA: 0 - TileAwareSelection: false - TileB: 1 - TotalIndices: 4 - TransposeA: 1 - TransposeB: 0 - UseBeta: true - UseBias: 0 - UseE: false - UseInitialStridesAB: false - UseInitialStridesCD: false - UseScaleAB: "" - UseScaleAlphaVec: 1 - UseScaleCD: false ScheduleGlobalRead: 1 ScheduleIterAlg: 3 ScheduleLocalWrite: 1