Spaces:
Runtime error
Runtime error
--no-warmup
Browse files
app.py
CHANGED
@@ -93,6 +93,7 @@ def start_llama_server():
|
|
93 |
"-c", "2048",
|
94 |
"-t", "8",
|
95 |
"--port", "8081",
|
|
|
96 |
"-ngl", "999" # <--- CRUCIAL: GPU offload instruction
|
97 |
]
|
98 |
|
@@ -101,7 +102,7 @@ def start_llama_server():
|
|
101 |
print(f"Llama-server process started with PID {llama_process.pid}")
|
102 |
|
103 |
# You might need a small sleep here to wait for the server to initialize
|
104 |
-
|
105 |
|
106 |
|
107 |
custom_theme = ResearchMonochrome()
|
|
|
93 |
"-c", "2048",
|
94 |
"-t", "8",
|
95 |
"--port", "8081",
|
96 |
+
"--no-warmup",
|
97 |
"-ngl", "999" # <--- CRUCIAL: GPU offload instruction
|
98 |
]
|
99 |
|
|
|
102 |
print(f"Llama-server process started with PID {llama_process.pid}")
|
103 |
|
104 |
# You might need a small sleep here to wait for the server to initialize
|
105 |
+
time.sleep(5)
|
106 |
|
107 |
|
108 |
custom_theme = ResearchMonochrome()
|