We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6c728f7 commit d621cf6 (Copy full SHA for d621cf6)
vllm/platforms/rocm.py
@@ -199,6 +199,9 @@ class RocmPlatform(Platform):
199
"petit_nvfp4",
200
"torchao",
201
]
202
+ # bitsandbytes is not supported on GPUs with warp size 64 (gfx9)
203
+ if not on_gfx9():
204
+ supported_quantization += ["bitsandbytes"]
205
206
@classmethod
207
def get_vit_attn_backend(cls, head_size: int, dtype: torch.dtype) -> "_Backend":
0 commit comments