TobDeBer committed on
Commit
7c96a88
·
verified ·
1 Parent(s): 58cc8dc

--no-warmup

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -93,6 +93,7 @@ def start_llama_server():
93
  "-c", "2048",
94
  "-t", "8",
95
  "--port", "8081",
 
96
  "-ngl", "999" # <--- CRUCIAL: GPU offload instruction
97
  ]
98
 
@@ -101,7 +102,7 @@ def start_llama_server():
101
  print(f"Llama-server process started with PID {llama_process.pid}")
102
 
103
  # You might need a small sleep here to wait for the server to initialize
104
- # time.sleep(5)
105
 
106
 
107
  custom_theme = ResearchMonochrome()
 
93
  "-c", "2048",
94
  "-t", "8",
95
  "--port", "8081",
96
+ "--no-warmup",
97
  "-ngl", "999" # <--- CRUCIAL: GPU offload instruction
98
  ]
99
 
 
102
  print(f"Llama-server process started with PID {llama_process.pid}")
103
 
104
  # You might need a small sleep here to wait for the server to initialize
105
+ time.sleep(5)
106
 
107
 
108
  custom_theme = ResearchMonochrome()