Skip to content

Commit

Permalink
fix flashinfer version with sglang
Browse files Browse the repository at this point in the history
  • Loading branch information
ZX-ModelCloud committed Jul 30, 2024
1 parent bd0765a commit f25d848
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions tests/test_sglang.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,8 +16,8 @@ class TestLoadSglang(unittest.TestCase):
@classmethod
def setUpClass(self):
# sglang still imports flashinfer even when disable_flashinfer=True is set, so flashinfer is installed explicitly
subprocess.check_call([sys.executable, "-m", "pip", "install", "flashinfer", "-i", f"https://flashinfer.ai/whl/cu{torch.version.cuda.replace('.', '')}/torch{'.'.join(torch.__version__.split('.')[:2])}"])
subprocess.check_call([sys.executable, "-m", "pip", "install", "sglang[srt]>=0.1.19"])
subprocess.check_call([sys.executable, "-m", "pip", "install", "flashinfer==0.1.2", "-i", f"https://flashinfer.ai/whl/cu{torch.version.cuda.replace('.', '')}/torch{'.'.join(torch.__version__.split('.')[:2])}"])
subprocess.check_call([sys.executable, "-m", "pip", "install", "sglang[srt]>=0.2.7"])

self.MODEL_ID = "LnL-AI/TinyLlama-1.1B-Chat-v1.0-GPTQ-4bit"
self.prompt = "The capital of France is"
Expand Down

0 comments on commit f25d848

Please sign in to comment.