simone-papicchio commited on
Commit
ab37bbe
·
1 Parent(s): a1a2a18

fix: correct path for together AI model

Browse files
Files changed (1) hide show
  1. prediction.py +8 -8
prediction.py CHANGED
@@ -25,14 +25,14 @@ from tqdm import tqdm
25
  import subprocess
26
 
27
  # https://huggingface.co/spaces/zero-gpu-explorers/README/discussions/132
28
- subprocess.run("rm -rf /data-nvme/zerogpu-offload/*", env={}, shell=True)
29
 
30
- pipeline = hf_pipeline(
31
- "text-generation",
32
- model="meta-llama/Meta-Llama-3.1-8B-Instruct",
33
- model_kwargs={"torch_dtype": 'bfloat16'},
34
- device_map="auto",
35
- )
36
 
37
 
38
  class ModelPrediction:
@@ -140,7 +140,7 @@ class ModelPrediction:
140
  elif "DeepSeek-R1-Distill-Llama-70B" in model_name:
141
  model_name = "together_ai/deepseek-ai/DeepSeek-R1-Distill-Llama-70B"
142
  elif "llama-8" in model_name:
143
- model_name = "together_ai/meta-llama/Meta-Llama-3-8B-Instruct"
144
  else:
145
  raise ValueError("Model forbidden")
146
 
 
25
  import subprocess
26
 
27
  # https://huggingface.co/spaces/zero-gpu-explorers/README/discussions/132
28
+ # subprocess.run("rm -rf /data-nvme/zerogpu-offload/*", env={}, shell=True)
29
 
30
+ # pipeline = hf_pipeline(
31
+ # "text-generation",
32
+ # model="meta-llama/Meta-Llama-3.1-8B-Instruct",
33
+ # model_kwargs={"torch_dtype": 'bfloat16'},
34
+ # device_map="auto",
35
+ # )
36
 
37
 
38
  class ModelPrediction:
 
140
  elif "DeepSeek-R1-Distill-Llama-70B" in model_name:
141
  model_name = "together_ai/deepseek-ai/DeepSeek-R1-Distill-Llama-70B"
142
  elif "llama-8" in model_name:
143
+ model_name = "together_ai/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo"
144
  else:
145
  raise ValueError("Model forbidden")
146