xulh
committed on
Commit
·
df22e8a
1
Parent(s):
1e5f011
代码初始化
Browse files
- inference/inference.py +1 -1
inference/inference.py
CHANGED
@@ -95,7 +95,7 @@ async def chat_completion(token: str = Body(...), messages: list = Body(...)):
|
|
95 |
|
96 |
# 使用 chat API 请求生成模型的回答 备选模型 google/gemma-2-2b-it
|
97 |
completion = client.chat.completions.create(
|
98 |
-
model="
|
99 |
messages=messages,
|
100 |
max_tokens=500
|
101 |
)
|
|
|
95 |
|
96 |
# 使用 chat API 请求生成模型的回答 备选模型 google/gemma-2-2b-it
|
97 |
completion = client.chat.completions.create(
|
98 |
+
model="google/gemma-2-2b-it",
|
99 |
messages=messages,
|
100 |
max_tokens=500
|
101 |
)
|