Set CUDA minimum versions for hopper/blackwell cutlass kernels
Browse files
- build.toml +2 -0
- flake.lock +4 -3
- flake.nix +1 -1
build.toml
CHANGED
|
@@ -127,6 +127,7 @@ src = [
|
|
| 127 |
[kernel.cutlass_w8a8_hopper]
|
| 128 |
backend = "cuda"
|
| 129 |
cuda-capabilities = ["9.0a"]
|
|
|
|
| 130 |
depends = [
|
| 131 |
"cutlass_3_9",
|
| 132 |
"torch",
|
|
@@ -167,6 +168,7 @@ cuda-capabilities = [
|
|
| 167 |
"10.1a",
|
| 168 |
"12.0a",
|
| 169 |
]
|
|
|
|
| 170 |
depends = [
|
| 171 |
"cutlass_3_9",
|
| 172 |
"torch",
|
|
|
|
| 127 |
[kernel.cutlass_w8a8_hopper]
|
| 128 |
backend = "cuda"
|
| 129 |
cuda-capabilities = ["9.0a"]
|
| 130 |
+
cuda-minver = "12.0"
|
| 131 |
depends = [
|
| 132 |
"cutlass_3_9",
|
| 133 |
"torch",
|
|
|
|
| 168 |
"10.1a",
|
| 169 |
"12.0a",
|
| 170 |
]
|
| 171 |
+
cuda-minver = "12.9"
|
| 172 |
depends = [
|
| 173 |
"cutlass_3_9",
|
| 174 |
"torch",
|
flake.lock
CHANGED
|
@@ -98,15 +98,16 @@
|
|
| 98 |
]
|
| 99 |
},
|
| 100 |
"locked": {
|
| 101 |
-
"lastModified":
|
| 102 |
-
"narHash": "sha256-
|
| 103 |
"owner": "huggingface",
|
| 104 |
"repo": "kernel-builder",
|
| 105 |
-
"rev": "
|
| 106 |
"type": "github"
|
| 107 |
},
|
| 108 |
"original": {
|
| 109 |
"owner": "huggingface",
|
|
|
|
| 110 |
"repo": "kernel-builder",
|
| 111 |
"type": "github"
|
| 112 |
}
|
|
|
|
| 98 |
]
|
| 99 |
},
|
| 100 |
"locked": {
|
| 101 |
+
"lastModified": 1751544642,
|
| 102 |
+
"narHash": "sha256-WZC/9SO3a92pH5AjvPn3GXSdupysFI6JglF+t4o/TYQ=",
|
| 103 |
"owner": "huggingface",
|
| 104 |
"repo": "kernel-builder",
|
| 105 |
+
"rev": "e12cd4ae24b7315af65db72483e6578909f3dac8",
|
| 106 |
"type": "github"
|
| 107 |
},
|
| 108 |
"original": {
|
| 109 |
"owner": "huggingface",
|
| 110 |
+
"ref": "kernel-cuda-minver",
|
| 111 |
"repo": "kernel-builder",
|
| 112 |
"type": "github"
|
| 113 |
}
|
flake.nix
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
description = "Flake for quantization kernels";
|
| 3 |
|
| 4 |
inputs = {
|
| 5 |
-
kernel-builder.url = "github:huggingface/kernel-builder";
|
| 6 |
};
|
| 7 |
|
| 8 |
outputs =
|
|
|
|
| 2 |
description = "Flake for quantization kernels";
|
| 3 |
|
| 4 |
inputs = {
|
| 5 |
+
kernel-builder.url = "github:huggingface/kernel-builder/kernel-cuda-minver";
|
| 6 |
};
|
| 7 |
|
| 8 |
outputs =
|