We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 74e6232 commit eba0837 Copy full SHA for eba0837
csrc/quantization/marlin/sparse/common/mma.h
@@ -17,6 +17,7 @@
17
18
#pragma once
19
#include "base.h"
20
+#include <cudaTypedefs.h>
21
22
namespace marlin_24 {
23
@@ -26,7 +27,7 @@ namespace marlin_24 {
26
27
// | Advisory: Modifier ‘.sp::ordered_metadata’ should be used on instruction
28
// | ‘mma’ instead of modifier ‘.sp’ as it is expected to have substantially
29
// | reduced performance on some future architectures
-#if defined CUDA_VERSION && CUDA_VERSION >= 12500
30
+#if defined CUDA_VERSION && CUDA_VERSION >= 12050
31
#define MMA_SP_INST \
32
"mma.sp::ordered_metadata.sync.aligned.m16n8k32.row.col.f32.f16.f16.f32 "
33
#else
0 commit comments