Spaces:

tosin2013
/

autogen-agent-gen

Runtime error

tosin2013 committed on Jan 2

Commit

eb872b8

1 Parent(s): 7e1e3c5

adding zerogpu

Files changed (1) hide show

app.py CHANGED Viewed

@@ -37,18 +37,23 @@ if model_provider.lower() == "openai":
     )
 else:
     MODEL_NAME = "meta-llama/Llama-3.3-70B-Instruct"
-    # Initialize Hugging Face InferenceClient
     hf_client = InferenceClient(
         model=MODEL_NAME,
-        api_key=os.environ.get("HF_TOKEN")
     )
 # Load the Hugging Face dataset
 dataset = load_dataset('tosin2013/autogen', streaming=True)
 dataset = Dataset.from_list(list(dataset['train']))
-# Initialize embeddings
-embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
 # Extract texts from the dataset
 texts = dataset['input']

     )
 else:
     MODEL_NAME = "meta-llama/Llama-3.3-70B-Instruct"
+    # Initialize Hugging Face InferenceClient with GPU support
     hf_client = InferenceClient(
         model=MODEL_NAME,
+        api_key=os.environ.get("HF_TOKEN"),
+        timeout=120  # Increased timeout for GPU inference
     )
 # Load the Hugging Face dataset
 dataset = load_dataset('tosin2013/autogen', streaming=True)
 dataset = Dataset.from_list(list(dataset['train']))
+# Initialize embeddings with GPU support if available
+device = "cuda" if torch.cuda.is_available() else "cpu"
+embeddings = HuggingFaceEmbeddings(
+    model_name="sentence-transformers/all-MiniLM-L6-v2",
+    model_kwargs={"device": device}
+)
 # Extract texts from the dataset
 texts = dataset['input']