Use `huggingface_hub.InferenceClient` instead of `openai` to call Sambanova

#1
Opened by Wauplin (HF staff)
Files changed (2)
  1. app.py +4 -4
  2. requirements.txt +1 -1
app.py CHANGED
@@ -5,7 +5,7 @@ from pathlib import Path
5
 
6
  import gradio as gr
7
  import numpy as np
8
- import openai
9
  from dotenv import load_dotenv
10
  from fastapi import FastAPI
11
  from fastapi.responses import HTMLResponse, StreamingResponse
@@ -25,9 +25,9 @@ load_dotenv()
25
  curr_dir = Path(__file__).parent
26
 
27
 
28
- client = openai.OpenAI(
29
  api_key=os.environ.get("SAMBANOVA_API_KEY"),
30
- base_url="https://api.sambanova.ai/v1",
31
  )
32
  stt_model = get_stt_model()
33
 
@@ -52,7 +52,7 @@ def response(
52
  raise WebRTCError("test")
53
 
54
  request = client.chat.completions.create(
55
- model="Meta-Llama-3.2-3B-Instruct",
56
  messages=conversation_state, # type: ignore
57
  temperature=0.1,
58
  top_p=0.1,
 
5
 
6
  import gradio as gr
7
  import numpy as np
8
+ import huggingface_hub
9
  from dotenv import load_dotenv
10
  from fastapi import FastAPI
11
  from fastapi.responses import HTMLResponse, StreamingResponse
 
25
  curr_dir = Path(__file__).parent
26
 
27
 
28
+ client = huggingface_hub.InferenceClient(
29
  api_key=os.environ.get("SAMBANOVA_API_KEY"),
30
+ provider="sambanova",
31
  )
32
  stt_model = get_stt_model()
33
 
 
52
  raise WebRTCError("test")
53
 
54
  request = client.chat.completions.create(
55
+ model="meta-llama/Llama-3.2-3B-Instruct",
56
  messages=conversation_state, # type: ignore
57
  temperature=0.1,
58
  top_p=0.1,
requirements.txt CHANGED
@@ -1,4 +1,4 @@
1
  fastrtc[vad, stt]
2
  python-dotenv
3
- openai
4
  twilio
 
1
  fastrtc[vad, stt]
2
  python-dotenv
3
+ huggingface_hub
4
  twilio