johnbridges committed on
Commit
7e2c46b
·
1 Parent(s): 76f1775
Files changed (1) hide show
  1. vllm_backend.py +1 -2
vllm_backend.py CHANGED
@@ -25,8 +25,7 @@ class VLLMChatBackend(ChatBackend):
25
 
26
  params = SamplingParams(
27
  temperature=float(request.get("temperature", 0.7)),
28
- max_tokens=int(request.get("max_tokens", 512)),
29
- stream=False, # we want full text only
30
  )
31
 
32
  rid = f"chatcmpl-local-{int(time.time())}"
 
25
 
26
  params = SamplingParams(
27
  temperature=float(request.get("temperature", 0.7)),
28
+ max_tokens=int(request.get("max_tokens", 512))
 
29
  )
30
 
31
  rid = f"chatcmpl-local-{int(time.time())}"