daniel-dona committed on
Commit
b2d905e
·
verified ·
1 Parent(s): 2067c10

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -12
app.py CHANGED
@@ -1,8 +1,8 @@
1
  import gradio as gr
2
- from huggingface_hub import InferenceClient
3
 
4
-
5
- client = InferenceClient("daniel-dona/google-gemma-3-270m")
6
 
7
 
8
  def respond(
@@ -25,19 +25,17 @@ def respond(
25
 
26
  messages.append({"role": "user", "content": message})
27
 
28
- response = ""
29
-
30
- for message in client.chat_completion(
31
  messages,
32
- max_tokens=max_tokens,
33
- stream=True,
34
  temperature=temperature,
35
  top_p=top_p,
36
- ):
37
- token = message.choices[0].delta.content
 
 
38
 
39
- response += token
40
- yield response
41
 
42
 
43
  """
 
1
  import gradio as gr
2
+ from transformers import pipeline
3
 
4
+ model = "daniel-dona/google-gemma-3-270m-it"
5
+ pipe = pipeline("text-generation", model=model)
6
 
7
 
8
  def respond(
 
25
 
26
  messages.append({"role": "user", "content": message})
27
 
28
+ response = pipe(
 
 
29
  messages,
30
+ max_new_tokens=max_tokens,
 
31
  temperature=temperature,
32
  top_p=top_p,
33
+ return_full_text=False,
34
+ )
35
+
36
+ generated_text = response[0]['generated_text']
37
 
38
+ yield generated_text
 
39
 
40
 
41
  """