Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
27 changes: 26 additions & 1 deletion include/slang.h
Original file line number Diff line number Diff line change
Expand Up @@ -857,6 +857,23 @@ typedef uint32_t SlangSizeT;
SLANG_STAGE_PIXEL = SLANG_STAGE_FRAGMENT,
};
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

🟡 Gap: New public API enums lack documentation comments

The neighboring enums in slang.h (e.g., SlangDebugInfoLevel, SlangOptimizationLevel, SlangStage) have documentation comments describing their purpose. These two new enums — SlangCooperativeMatrixUse and SlangCooperativeVectorMatrixLayout — are added without any doc comments. Since they're part of the public API consumed by downstream tools and language bindings, documentation would help users understand their role without needing to read the SPIR-V or HLSL specs.

Suggestion:

/// Specifies the role of a cooperative matrix in a multiply-accumulate operation.
typedef SlangUInt32 SlangCooperativeMatrixUseIntegral;
enum SlangCooperativeMatrixUse : SlangCooperativeMatrixUseIntegral
{
    SLANG_COOPERATIVE_MATRIX_USE_A,           ///< Left-hand matrix (A in D = A*B + C)
    SLANG_COOPERATIVE_MATRIX_USE_B,           ///< Right-hand matrix (B in D = A*B + C)
    SLANG_COOPERATIVE_MATRIX_USE_ACCUMULATOR, ///< Accumulator matrix (C or D in D = A*B + C)
};

/// Memory layout for cooperative vector matrix data in device memory.
typedef SlangUInt32 SlangCooperativeVectorMatrixLayoutIntegral;
enum SlangCooperativeVectorMatrixLayout : SlangCooperativeVectorMatrixLayoutIntegral
{
    SLANG_COOPERATIVE_VECTOR_MATRIX_LAYOUT_ROW_MAJOR,           ///< Standard row-major layout
    SLANG_COOPERATIVE_VECTOR_MATRIX_LAYOUT_COLUMN_MAJOR,        ///< Standard column-major layout
    SLANG_COOPERATIVE_VECTOR_MATRIX_LAYOUT_INFERENCING_OPTIMAL, ///< Layout optimized for inference
    SLANG_COOPERATIVE_VECTOR_MATRIX_LAYOUT_TRAINING_OPTIMAL,    ///< Layout optimized for training
};


/// Specifies the role a cooperative matrix plays in a multiply-accumulate
/// operation (the operand names suggest the A, B, or accumulator slot of
/// D = A*B + C, following the SPIR-V CooperativeMatrixUse convention —
/// confirm against the SPIR-V cooperative-matrix spec).
typedef SlangUInt32 SlangCooperativeMatrixUseIntegral;
enum SlangCooperativeMatrixUse : SlangCooperativeMatrixUseIntegral
{
SLANG_COOPERATIVE_MATRIX_USE_A,           ///< Left-hand matrix operand (A)
SLANG_COOPERATIVE_MATRIX_USE_B,           ///< Right-hand matrix operand (B)
SLANG_COOPERATIVE_MATRIX_USE_ACCUMULATOR, ///< Accumulator operand (C/D)
};

/// Memory layout used for cooperative-vector matrix data in device memory.
typedef SlangUInt32 SlangCooperativeVectorMatrixLayoutIntegral;
enum SlangCooperativeVectorMatrixLayout : SlangCooperativeVectorMatrixLayoutIntegral
{
SLANG_COOPERATIVE_VECTOR_MATRIX_LAYOUT_ROW_MAJOR,           ///< Standard row-major layout
SLANG_COOPERATIVE_VECTOR_MATRIX_LAYOUT_COLUMN_MAJOR,        ///< Standard column-major layout
SLANG_COOPERATIVE_VECTOR_MATRIX_LAYOUT_INFERENCING_OPTIMAL, ///< Implementation-chosen layout optimized for inferencing
SLANG_COOPERATIVE_VECTOR_MATRIX_LAYOUT_TRAINING_OPTIMAL,    ///< Implementation-chosen layout optimized for training
};
Comment thread
jkwak-work marked this conversation as resolved.

typedef SlangUInt32 SlangDebugInfoLevelIntegral;
enum SlangDebugInfoLevel : SlangDebugInfoLevelIntegral
{
Comment on lines 858 to 879
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

🟡 Gap: New public API enums and scalar types lack inline documentation

SlangCooperativeMatrixUse and SlangCooperativeVectorMatrixLayout (here) plus the new scalar types SLANG_SCALAR_TYPE_BFLOAT16, SLANG_SCALAR_TYPE_FLOAT_E4M3, SLANG_SCALAR_TYPE_FLOAT_E5M2 (line 1988) are user-facing API additions in a public header consumed by downstream tools and bindings. Other enums in this header (e.g., SlangDebugInfoLevel) include documentation comments.

Suggestion: Add brief Doxygen-style comments:

/** Specifies which role a cooperative matrix plays in multiply-accumulate. */
typedef SlangUInt32 SlangCooperativeMatrixUseIntegral;
enum SlangCooperativeMatrixUse : SlangCooperativeMatrixUseIntegral
{
    SLANG_COOPERATIVE_MATRIX_USE_A,            ///< Left-hand matrix (A) in D = A*B+C
    SLANG_COOPERATIVE_MATRIX_USE_B,            ///< Right-hand matrix (B) in D = A*B+C
    SLANG_COOPERATIVE_MATRIX_USE_ACCUMULATOR,  ///< Accumulator matrix (C/D) in D = A*B+C
};

And for the scalar types:

SLANG_SCALAR_TYPE_BFLOAT16,    ///< Brain Float 16: 1 sign + 8 exp + 7 mantissa
SLANG_SCALAR_TYPE_FLOAT_E4M3,  ///< FP8 E4M3: 1 sign + 4 exp + 3 mantissa
SLANG_SCALAR_TYPE_FLOAT_E5M2,  ///< FP8 E5M2: 1 sign + 5 exp + 2 mantissa

Expand Down Expand Up @@ -1964,7 +1981,10 @@ public: \
SLANG_SCALAR_TYPE_INT16,
SLANG_SCALAR_TYPE_UINT16,
SLANG_SCALAR_TYPE_INTPTR,
SLANG_SCALAR_TYPE_UINTPTR
SLANG_SCALAR_TYPE_UINTPTR,
SLANG_SCALAR_TYPE_BFLOAT16,
SLANG_SCALAR_TYPE_FLOAT_E4M3,
SLANG_SCALAR_TYPE_FLOAT_E5M2,
};

// abstract decl reflection
Expand Down Expand Up @@ -2349,6 +2369,11 @@ struct TypeReflection
UInt8 = SLANG_SCALAR_TYPE_UINT8,
Int16 = SLANG_SCALAR_TYPE_INT16,
UInt16 = SLANG_SCALAR_TYPE_UINT16,
IntPtr = SLANG_SCALAR_TYPE_INTPTR,
UIntPtr = SLANG_SCALAR_TYPE_UINTPTR,
BFloat16 = SLANG_SCALAR_TYPE_BFLOAT16,
FloatE4M3 = SLANG_SCALAR_TYPE_FLOAT_E4M3,
FloatE5M2 = SLANG_SCALAR_TYPE_FLOAT_E5M2,
};
Comment thread
coderabbitai[bot] marked this conversation as resolved.

Kind getKind() { return (Kind)spReflectionType_GetKind((SlangReflectionType*)this); }
Expand Down
111 changes: 20 additions & 91 deletions prelude/slang-cuda-prelude.h
Original file line number Diff line number Diff line change
Expand Up @@ -6461,63 +6461,6 @@ _slang_waveClusteredRotate(bool4 value, unsigned int delta, unsigned int cluster

#if (OPTIX_VERSION >= 90000)

// Maps a Slang component-type enum value onto the corresponding OptiX
// cooperative-vector element type. Any value without an explicit mapping
// degrades to FLOAT32.
__host__ __device__ constexpr OptixCoopVecElemType slangToOptixComponentType(unsigned slangEnum)
{
    if (slangEnum == 0)
        return OPTIX_COOP_VEC_ELEM_TYPE_FLOAT8_E4M3; // FloatE4M3
    if (slangEnum == 1)
        return OPTIX_COOP_VEC_ELEM_TYPE_FLOAT8_E5M2; // FloatE5M2
    if (slangEnum == 2)
        return OPTIX_COOP_VEC_ELEM_TYPE_FLOAT16; // Float16
    if (slangEnum == 3)
        return OPTIX_COOP_VEC_ELEM_TYPE_FLOAT32; // Float32
    if (slangEnum == 5)
        return OPTIX_COOP_VEC_ELEM_TYPE_INT8; // SignedInt8
    if (slangEnum == 7)
        return OPTIX_COOP_VEC_ELEM_TYPE_INT32; // SignedInt32
    if (slangEnum == 10)
        return OPTIX_COOP_VEC_ELEM_TYPE_UINT8; // UnsignedInt8
    if (slangEnum == 12)
        return OPTIX_COOP_VEC_ELEM_TYPE_UINT32; // UnsignedInt32
    return OPTIX_COOP_VEC_ELEM_TYPE_FLOAT32; // Default
}

// Maps a Slang matrix-layout enum value onto the corresponding OptiX
// cooperative-vector matrix layout. Unrecognized values fall back to
// row-major, mirroring the component-type mapper's default behavior.
__host__ __device__ constexpr OptixCoopVecMatrixLayout slangToOptixMatrixLayout(unsigned slangEnum)
{
    switch (slangEnum)
    {
    case 1:
        return OPTIX_COOP_VEC_MATRIX_LAYOUT_COLUMN_MAJOR; // ColumnMajor
    case 2:
        return OPTIX_COOP_VEC_MATRIX_LAYOUT_INFERENCING_OPTIMAL; // InferencingOptimal
    case 3:
        return OPTIX_COOP_VEC_MATRIX_LAYOUT_TRAINING_OPTIMAL; // TrainingOptimal
    case 0: // RowMajor
    default: // Fallback
        return OPTIX_COOP_VEC_MATRIX_LAYOUT_ROW_MAJOR;
    }
}

// Wrapper structs preserving the existing template-based interface: each one
// surfaces the matching constexpr mapping function as a `::value` member so
// template call sites written against the old traits keep compiling.
template<unsigned TSlangEnum>
struct SlangToOptixComponentType
{
    static constexpr OptixCoopVecElemType value = slangToOptixComponentType(TSlangEnum);
};

template<unsigned TSlangEnum>
struct SlangToOptixMatrixLayout
{
    static constexpr OptixCoopVecMatrixLayout value = slangToOptixMatrixLayout(TSlangEnum);
};

// Template trait to extract vector size from OptixCoopVec<T, N>
// Conditional compilation for NVRTC compatibility
template<typename T>
Expand All @@ -6537,9 +6480,9 @@ struct OptixCoopVecTraits<OptixCoopVec<T, N>>
template<
typename VecTOut,
typename VecTIn,
unsigned inputInterpretation,
unsigned matrixInterpretation,
unsigned matrixLayout>
OptixCoopVecElemType inputInterpretation,
OptixCoopVecElemType matrixInterpretation,
OptixCoopVecMatrixLayout matrixLayout>
Comment thread
coderabbitai[bot] marked this conversation as resolved.
__forceinline__ __device__ VecTOut slangOptixCoopVecMatMul(
const VecTIn& inputVector,
CUdeviceptr matrix,
Expand All @@ -6553,26 +6496,22 @@ __forceinline__ __device__ VecTOut slangOptixCoopVecMatMul(
return optixCoopVecMatMul<
VecTOut,
VecTIn,
SlangToOptixComponentType<inputInterpretation>::value,
SlangToOptixMatrixLayout<matrixLayout>::value,
inputInterpretation,
matrixLayout,
false,
Comment thread
jkwak-work marked this conversation as resolved.
N,
K,
SlangToOptixComponentType<matrixInterpretation>::value>(
inputVector,
matrix,
matrixOffset,
matrixStride);
matrixInterpretation>(inputVector, matrix, matrixOffset, matrixStride);
Comment thread
jkwak-work marked this conversation as resolved.
}

// OptiX cooperative vector matrix multiplication wrapper (WITH bias - 6 runtime params)
template<
typename VecTOut,
typename VecTIn,
unsigned inputInterpretation,
unsigned matrixInterpretation,
unsigned matrixLayout,
unsigned biasInterpretation>
OptixCoopVecElemType inputInterpretation,
OptixCoopVecElemType matrixInterpretation,
OptixCoopVecMatrixLayout matrixLayout,
OptixCoopVecElemType biasInterpretation>
__forceinline__ __device__ VecTOut slangOptixCoopVecMatMul(
const VecTIn& inputVector,
CUdeviceptr matrix,
Expand All @@ -6588,29 +6527,23 @@ __forceinline__ __device__ VecTOut slangOptixCoopVecMatMul(
return optixCoopVecMatMul<
VecTOut,
VecTIn,
SlangToOptixComponentType<inputInterpretation>::value,
SlangToOptixMatrixLayout<matrixLayout>::value,
inputInterpretation,
matrixLayout,
false,
N,
K,
SlangToOptixComponentType<matrixInterpretation>::value,
SlangToOptixComponentType<biasInterpretation>::value>(
inputVector,
matrix,
matrixOffset,
bias,
biasOffset,
matrixStride);
matrixInterpretation,
biasInterpretation>(inputVector, matrix, matrixOffset, bias, biasOffset, matrixStride);
}

// OptiX cooperative vector matrix multiplication wrapper (WITHOUT bias, 4 runtime params -
// StructuredBuffer variant)
template<
typename VecTOut,
typename VecTIn,
unsigned inputInterpretation,
unsigned matrixInterpretation,
unsigned matrixLayout>
OptixCoopVecElemType inputInterpretation,
OptixCoopVecElemType matrixInterpretation,
OptixCoopVecMatrixLayout matrixLayout>
__forceinline__ __device__ VecTOut slangOptixCoopVecMatMul(
const VecTIn& inputVector,
CUdeviceptr matrix,
Expand All @@ -6624,16 +6557,12 @@ __forceinline__ __device__ VecTOut slangOptixCoopVecMatMul(
return optixCoopVecMatMul<
VecTOut,
VecTIn,
SlangToOptixComponentType<inputInterpretation>::value,
SlangToOptixMatrixLayout<matrixLayout>::value,
inputInterpretation,
matrixLayout,
false,
N,
K,
SlangToOptixComponentType<matrixInterpretation>::value>(
inputVector,
matrix,
matrixOffset,
matrixStride);
matrixInterpretation>(inputVector, matrix, matrixOffset, matrixStride);
}

#endif // (OPTIX_VERSION >= 90000)
Expand Down
7 changes: 6 additions & 1 deletion source/core/slang-type-text-util.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,12 @@ namespace
x(Int64, int64_t) \
x(UInt64, uint64_t) \
x(Float32, float) \
x(Float64, double)
x(Float64, double) \
x(IntPtr, intptr_t) \
x(UIntPtr, uintptr_t) \
x(BFloat16, bfloat16) \
x(FloatE4M3, float_e4m3) \
x(FloatE5M2, float_e5m2)
Comment thread
coderabbitai[bot] marked this conversation as resolved.
// clang-format on

struct ScalarTypeInfo
Expand Down
7 changes: 6 additions & 1 deletion source/slang-wasm/slang-wasm-bindings.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -157,7 +157,12 @@ EMSCRIPTEN_BINDINGS(slang)
.value("Int8", slang::TypeReflection::ScalarType::Int8)
.value("UInt8", slang::TypeReflection::ScalarType::UInt8)
.value("Int16", slang::TypeReflection::ScalarType::Int16)
.value("UInt16", slang::TypeReflection::ScalarType::UInt16);
.value("UInt16", slang::TypeReflection::ScalarType::UInt16)
.value("IntPtr", slang::TypeReflection::ScalarType::IntPtr)
.value("UIntPtr", slang::TypeReflection::ScalarType::UIntPtr)
.value("BFloat16", slang::TypeReflection::ScalarType::BFloat16)
.value("FloatE4M3", slang::TypeReflection::ScalarType::FloatE4M3)
.value("FloatE5M2", slang::TypeReflection::ScalarType::FloatE5M2);

class_<slang::wgsl::TypeReflection>("TypeReflection")
.function("getScalarType", &slang::wgsl::TypeReflection::getScalarType)
Expand Down
Loading
Loading