Use float32 for test_completion.py (#22385)

Signed-off-by: Michael Goin <mgoin64@gmail.com>
This commit is contained in:
Michael Goin
2025-08-06 23:07:47 -04:00
committed by GitHub
parent 04cf435d95
commit a00d8b236f

View File

@@ -20,9 +20,8 @@ MODEL_NAME = "facebook/opt-125m"
@pytest.fixture(scope="module")
def default_server_args():
return [
-# use half precision for speed and memory savings in CI environment
"--dtype",
-"bfloat16",
+"float32",
"--max-model-len",
"2048",
"--max-num-seqs",