Gary committed on
Commit
c384c23
·
1 Parent(s): 27e1332

reduce new token length

Browse files
Files changed (1) hide show
  1. indexer.py +3 -3
indexer.py CHANGED
@@ -15,7 +15,7 @@ def load_raw_dataset():
15
 
16
  df["combined"] = df["input"] + " " + df["output"]
17
 
18
- df = df.sample(n=min(5000, len(df)), random_state=42).reset_index(drop=True)
19
 
20
  docs = [
21
  Document(
@@ -44,8 +44,8 @@ def get_llm(model_name):
44
  "text2text-generation",
45
  model=model,
46
  tokenizer=tokenizer,
47
- max_new_tokens=1024,
48
- temperature=0.7,
49
  do_sample=True,
50
  )
51
 
 
15
 
16
  df["combined"] = df["input"] + " " + df["output"]
17
 
18
+ df = df.sample(n=min(5000, len(df)), random_state=42)
19
 
20
  docs = [
21
  Document(
 
44
  "text2text-generation",
45
  model=model,
46
  tokenizer=tokenizer,
47
+ max_new_tokens=512,
48
+ temperature=1,
49
  do_sample=True,
50
  )
51