QAT and quantization w/torchao
This commit is contained in:
salman
2025-05-28 12:35:47 +01:00
committed by GitHub
parent 20fda75917
commit 5fca214108
26 changed files with 1372 additions and 13 deletions

View File

@@ -4,7 +4,6 @@ GRPO test suite
import os
import random
import shutil
import subprocess # nosec B404
import sys
import tempfile
@@ -118,7 +117,10 @@ def start_vllm(
recursive_kill(process)
with open("/tmp/vllm.log", "r", encoding="utf-8") as log_file:
print(log_file.read())
shutil.rmtree("/tmp/vllm.log")
try:
os.remove("/tmp/vllm.log")
except FileNotFoundError:
pass
raise RuntimeError(f"VLLM server process did not start within {wait} seconds.")
# return the process