Spaces:

AmiyendraOP
/

llama3-legal-chat

Runtime error

AmiyendraOP committed 13 days ago

Commit

51202ff

verified ·

1 Parent(s): 1aa692c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,20 +1,20 @@
-from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
-import torch
 import gradio as gr
 model_id = "AmiyendraOP/llama3-legal-finetuned"
-# Load tokenizer and model
 tokenizer = AutoTokenizer.from_pretrained(model_id)
-model = AutoModelForCausalLM.from_pretrained(model_id)
-# Set device properly
 device = 0 if torch.cuda.is_available() else -1
-# Use pipeline for text generation
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, device=device)
-# Define chat function
 def chat(prompt):
     """Generate a reply for ``prompt`` with the module-level text-generation pipeline.

     Runs ``pipe`` with sampling enabled (temperature 0.7) and at most 256 new
     tokens, then returns the ``"generated_text"`` field of the first result.
     """
     generations = pipe(
         prompt,
         max_new_tokens=256,
         do_sample=True,
         temperature=0.7,
     )
     first_generation = generations[0]
     return first_generation["generated_text"]
@@ -24,5 +24,5 @@ gr.Interface(
     fn=chat,
     inputs=gr.Textbox(lines=4, placeholder="Enter legal question...", label="Your Question"),
     outputs=gr.Textbox(label="Response"),
-    title="LLaMA 3 Legal Chatbot (Fine-tuned)",
 ).launch()

+from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
 import gradio as gr
+import torch
 model_id = "AmiyendraOP/llama3-legal-finetuned"
+# Load tokenizer and model without quantization or bitsandbytes
 tokenizer = AutoTokenizer.from_pretrained(model_id)
+model = AutoModelForCausalLM.from_pretrained(model_id, low_cpu_mem_usage=True, torch_dtype=torch.float32)
+# Set device
 device = 0 if torch.cuda.is_available() else -1
+# Use the text-generation pipeline
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, device=device)
+# Define a chat function
 def chat(prompt):
     """Generate a reply for ``prompt`` with the module-level text-generation pipeline.

     Runs ``pipe`` with sampling enabled (temperature 0.7) and at most 256 new
     tokens, then returns the ``"generated_text"`` field of the first result.
     """
     generations = pipe(
         prompt,
         max_new_tokens=256,
         do_sample=True,
         temperature=0.7,
     )
     first_generation = generations[0]
     return first_generation["generated_text"]
     fn=chat,
     inputs=gr.Textbox(lines=4, placeholder="Enter legal question...", label="Your Question"),
     outputs=gr.Textbox(label="Response"),
+    title="LLaMA 3 Legal Chatbot (Fine-tuned)"
 ).launch()