Spaces:

inclusionAI
/

ling-mini-2.0-local

Sleeping

雷娃 committed 29 days ago

Commit

06a57b1

1 Parent(s): fd5c246

add install.sh

Files changed (1) hide show

app.py CHANGED Viewed

@@ -76,11 +76,15 @@ def respond(
     model_inputs = tokenizer([text], return_tensors="pt", return_token_type_ids=False).to(model.device)
-    model_inputs.update(dict(max_new_tokens=max_tokens,
-                             temperature = temperature,
-                             top_p = top_p,
                              presence_penalty = 1.5,
-                             streamer=streamer))
     # Start a separate thread for model generation to allow streaming output
     thread = Thread(

     model_inputs = tokenizer([text], return_tensors="pt", return_token_type_ids=False).to(model.device)
+    print(f"max_new_tokens={max_tokens}, temperature={temperature}, top_p={top_p}")
+    model_inputs.update(
+        dict(max_new_tokens=max_tokens,
+                             streamer = streamer,
+                             temperature = float(temperature),
+                             top_p = float(top_p),
                              presence_penalty = 1.5,
+             )
+    )
     # Start a separate thread for model generation to allow streaming output
     thread = Thread(