Spaces:

inclusionAI
/

Ling-lite-1.5

Running

雷娃 committed on Jun 24, 2025

Commit

b3dfe3c

1 Parent(s): 291372b

modify output length

Files changed (2) hide show

app.py CHANGED Viewed

@@ -12,7 +12,7 @@ client = OpenAI(
 )
 # define chat function
-def chat(user_input, max_new_tokens=20480):
     # chat history
     messages_template = [
   #      {"role": "system", "content": "You are Ling, an assistant created by inclusionAI"},
@@ -22,7 +22,7 @@ def chat(user_input, max_new_tokens=20480):
     response = client.chat.completions.create(
         model="Ling-lite-1.5-250604",
         messages=messages_template,
-        max_tokens=11264,
         temperature=0.01,
         top_p=1,
     )
@@ -47,7 +47,7 @@ with gr.Blocks(css="""
     )
     with gr.Row():
-        max_tokens_slider = gr.Slider(minimum=128, maximum=20480, step=160, label="Generated length")
 #    output_box = gr.Textbox(lines=10, label="Response")
     output_box = gr.Markdown(label="Response", elem_id="markdown-output")

 )
 # define chat function
+def chat(user_input, max_tokens=11264):
     # chat history
     messages_template = [
   #      {"role": "system", "content": "You are Ling, an assistant created by inclusionAI"},
     response = client.chat.completions.create(
         model="Ling-lite-1.5-250604",
         messages=messages_template,
+        max_tokens=max_tokens,
         temperature=0.01,
         top_p=1,
     )
     )
     with gr.Row():
+        max_tokens_slider = gr.Slider(minimum=100, maximum=10000, step=100, label="Generated length")
 #    output_box = gr.Textbox(lines=10, label="Response")
     output_box = gr.Markdown(label="Response", elem_id="markdown-output")

app_api.py CHANGED Viewed

@@ -12,21 +12,23 @@ client = OpenAI(
 )
 # define chat function
-def chat(user_input, max_new_tokens=2048):
     # chat history
     messages_template = [
- #       {"role": "system", "content": "You are Ling, an assistant created by inclusionAI"},
         {"role": "user", "content": user_input}
     ]
     response = client.chat.completions.create(
         model="Ling-lite-1.5-250604",
         messages=messages_template,
-        max_tokens=11264,
         temperature=0.01,
         top_p=1,
     )
-    yield response.choices[0].message.content
@@ -45,7 +47,7 @@ with gr.Blocks(css="""
     )
     with gr.Row():
-        max_tokens_slider = gr.Slider(minimum=128, maximum=2048, step=16, label="Generated length")
 #    output_box = gr.Textbox(lines=10, label="Response")
     output_box = gr.Markdown(label="Response", elem_id="markdown-output")

 )
 # define chat function
+def chat(user_input, max_tokens=11264):
     # chat history
     messages_template = [
+  #      {"role": "system", "content": "You are Ling, an assistant created by inclusionAI"},
         {"role": "user", "content": user_input}
     ]
     response = client.chat.completions.create(
         model="Ling-lite-1.5-250604",
         messages=messages_template,
+        max_tokens=max_tokens,
         temperature=0.01,
         top_p=1,
     )
+    resp_text = response.choices[0].message.content
+    print(resp_text)
+    yield resp_text
     )
     with gr.Row():
+        max_tokens_slider = gr.Slider(minimum=100, maximum=10000, step=100, label="Generated length")
 #    output_box = gr.Textbox(lines=10, label="Response")
     output_box = gr.Markdown(label="Response", elem_id="markdown-output")