diff --git a/python/pyproject.toml b/python/pyproject.toml
index fee1b6e7ae8b..5acd2704bc26 100755
--- a/python/pyproject.toml
+++ b/python/pyproject.toml
@@ -9,7 +9,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "sglang"
-version = "0.5.5.post3+hs5"
+version = "0.5.5.post3+hs7"
 description = "SGLang is a fast serving framework for large language models and vision language models."
 readme = "README.md"
 requires-python = ">=3.10"
diff --git a/python/sglang/srt/layers/deep_gemm_wrapper/configurer.py b/python/sglang/srt/layers/deep_gemm_wrapper/configurer.py
index 9bb34046d51c..494b884261d5 100644
--- a/python/sglang/srt/layers/deep_gemm_wrapper/configurer.py
+++ b/python/sglang/srt/layers/deep_gemm_wrapper/configurer.py
@@ -18,8 +18,36 @@ def _compute_enable_deep_gemm():
 
     return envs.SGLANG_ENABLE_JIT_DEEPGEMM.get()
 
 
-ENABLE_JIT_DEEPGEMM = _compute_enable_deep_gemm()
+# DeepGEMM needs a CUDA toolkit at runtime. Without one, its initialization
+# fails (seen on a Blackwell GPU) with:
+#   File "/.pyenv/versions/3.12.7/lib/python3.12/site-packages/deep_gemm/__init__.py", line 42, in _ensure_initialized
+#     torch.ops.deep_gemm.init(library_root, _find_cuda_home())
+#   File "/.pyenv/versions/3.12.7/lib/python3.12/site-packages/deep_gemm/__init__.py", line 30, in _find_cuda_home
+#     assert cuda_home is not None
+def _cuda_toolkit_available():
+    """Return True if a CUDA toolkit installation appears to be present.
+
+    Checks the CUDA_HOME / CUDA_PATH environment variables, then `nvcc` on
+    PATH, then the conventional /usr/local/cuda directory.
+    NOTE(review): this is meant to approximate deep_gemm's `_find_cuda_home`
+    lookup -- confirm against the deep_gemm version that is installed.
+    """
+    # Function-local imports so this change needs no edit to the import block.
+    import os
+    import shutil
+
+    if os.environ.get("CUDA_HOME") or os.environ.get("CUDA_PATH"):
+        return True
+    if shutil.which("nvcc") is not None:
+        return True
+    return os.path.isdir("/usr/local/cuda")
+
+
+# The toolkit check runs first: when no toolkit is found, DeepGEMM is disabled
+# and _compute_enable_deep_gemm() is never called. When a toolkit is found, the
+# SGLANG_ENABLE_JIT_DEEPGEMM setting decides as before.
+ENABLE_JIT_DEEPGEMM = _cuda_toolkit_available() and _compute_enable_deep_gemm()
 
 DEEPGEMM_BLACKWELL = ENABLE_JIT_DEEPGEMM and is_blackwell()
 DEEPGEMM_SCALE_UE8M0 = DEEPGEMM_BLACKWELL