Update app.py
Browse files
app.py
CHANGED
@@ -57,7 +57,7 @@ CHUTES_KEY = os.getenv("CHUTES_KEY")
|
|
57 |
# GEMINI=os.getenv("GEMINI_API_KEY")
|
58 |
|
59 |
|
60 |
-
embeddings = HuggingFaceEmbeddings(model_name="
|
61 |
|
62 |
try:
|
63 |
client = QdrantClient(
|
@@ -163,9 +163,9 @@ def log_to_qdrant(question: str, answer: str):
|
|
163 |
|
164 |
llm = ChatOpenAI(
|
165 |
base_url="https://openrouter.ai/api/v1",
|
166 |
-
model="
|
167 |
api_key=OPENAPI_KEY,# if you prefer to pass the API key in directly instead of using env vars
|
168 |
-
temperature=0.
|
169 |
max_tokens=None,
|
170 |
timeout=None,
|
171 |
max_retries=3,
|
|
|
57 |
# GEMINI=os.getenv("GEMINI_API_KEY")
|
58 |
|
59 |
|
60 |
+
embeddings = HuggingFaceEmbeddings(model_name="ibm-granite/granite-embedding-small-english-r2")
|
61 |
|
62 |
try:
|
63 |
client = QdrantClient(
|
|
|
163 |
|
164 |
llm = ChatOpenAI(
|
165 |
base_url="https://openrouter.ai/api/v1",
|
166 |
+
model="z-ai/glm-4.5-air:free",
|
167 |
api_key=OPENAPI_KEY,# if you prefer to pass the API key in directly instead of using env vars
|
168 |
+
temperature=0.2,
|
169 |
max_tokens=None,
|
170 |
timeout=None,
|
171 |
max_retries=3,
|