Commit
·
7e2c46b
1
Parent(s):
76f1775
- vllm_backend.py +1 -2
vllm_backend.py
CHANGED
|
@@ -25,8 +25,7 @@ class VLLMChatBackend(ChatBackend):
|
|
| 25 |
|
| 26 |
params = SamplingParams(
|
| 27 |
temperature=float(request.get("temperature", 0.7)),
|
| 28 |
-
max_tokens=int(request.get("max_tokens", 512))
|
| 29 |
-
stream=False, # we want full text only
|
| 30 |
)
|
| 31 |
|
| 32 |
rid = f"chatcmpl-local-{int(time.time())}"
|
|
|
|
| 25 |
|
| 26 |
params = SamplingParams(
|
| 27 |
temperature=float(request.get("temperature", 0.7)),
|
| 28 |
+
max_tokens=int(request.get("max_tokens", 512))
|
|
|
|
| 29 |
)
|
| 30 |
|
| 31 |
rid = f"chatcmpl-local-{int(time.time())}"
|