[UX] Add FlashInfer as default CUDA dependency (#26443)

Signed-off-by: mgoin <mgoin64@gmail.com>
Co-authored-by: Wentao Ye <44945378+yewentao256@users.noreply.github.com>
2025-10-20 23:03:52 +08:00 · 2025-10-09 17:10:02 -04:00
parent 2e54db4d2b
commit c9d33c60dc
4 changed files with 19 additions and 71 deletions
--- a/setup.py
+++ b/setup.py
@@ -714,8 +714,7 @@ setup(
            "mistral_common[audio]",
        ],  # Required for audio processing
        "video": [],  # Kept for backwards compatibility
-        # FlashInfer should be updated together with the Dockerfile
-        "flashinfer": ["flashinfer-python==0.4.0"],
+        "flashinfer": [],  # Kept for backwards compatibility
        # Optional deps for AMD FP4 quantization support
        "petit-kernel": ["petit-kernel"],
    },