Spaces: Running on CPU Upgrade
merge with 'main'
- README.md +2 -2
- src/backend/model_operations.py +2 -2
README.md CHANGED
@@ -4,12 +4,12 @@ emoji: 🥇
 colorFrom: green
 colorTo: indigo
 sdk: gradio
-sdk_version: 4.
+sdk_version: 4.37.1
 app_file: app.py
 pinned: true
 license: apache-2.0
 tags:
-
+- leaderboard
 ---
 
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
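The two README edits pin the Gradio SDK to an explicit release and tag the Space as a leaderboard. For reference, the resulting front matter assembled from the new side of the diff (fields above line 4 are outside the hunk; the emoji comes from the hunk header):

```yaml
emoji: 🥇
colorFrom: green
colorTo: indigo
sdk: gradio
sdk_version: 4.37.1
app_file: app.py
pinned: true
license: apache-2.0
tags:
- leaderboard
---
```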
src/backend/model_operations.py CHANGED
@@ -328,7 +328,7 @@ class SummaryGenerator:
         try: # try use HuggingFace API
             print('using huggingface api')
             response = litellm.completion(
-                model='command-r-plus' if 'command' in self.
+                model='command-r-plus' if 'command' in self.model_id else self.model_id,
                 messages=[{"role": "system", "content": system_prompt},
                           {"role": "user", "content": user_prompt}],
                 temperature=0.0,
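The patched call routes any model id containing 'command' to litellm as 'command-r-plus' and passes every other id through unchanged. A minimal standalone sketch of that routing (the helper name and the prompt strings are illustrative, not from the repo):

```python
import litellm

def route_model(model_id: str) -> str:
    # Mirror the patched expression: every Cohere Command variant is sent
    # to the 'command-r-plus' endpoint; other ids pass through unchanged.
    return 'command-r-plus' if 'command' in model_id else model_id

response = litellm.completion(
    model=route_model('command-r'),  # resolves to 'command-r-plus'
    messages=[{"role": "system", "content": "You are a careful summarizer."},
              {"role": "user", "content": "Summarize: ..."}],
    temperature=0.0,  # deterministic decoding, matching the Space
)
print(response.choices[0].message.content)
```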
@@ -347,7 +347,7 @@ class SummaryGenerator:
         else:
             self.tokenizer = AutoTokenizer.from_pretrained("meta-llama/Llama-2-7b-hf" if 'openelm' in self.model_id.lower() else self.model_id, trust_remote_code=True)
             print("Tokenizer loaded")
-            self.local_model = AutoModelForCausalLM.from_pretrained(self.model_id, trust_remote_code=True, device_map="auto", torch_dtype="auto")
+            self.local_model = AutoModelForCausalLM.from_pretrained(self.model_id, trust_remote_code=True, device_map="auto", torch_dtype="auto", cache_dir='/home/paperspace/cache')
             print("Local model loaded")
 
             # Using local model
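This hunk only adds a cache_dir, so model weights land on the mounted Paperspace volume rather than the default ~/.cache/huggingface location. A standalone sketch of the same loading pattern, with the cache path made overridable (the HF_MODEL_CACHE variable and the example model id are assumptions, not part of the patch):

```python
import os

from transformers import AutoModelForCausalLM, AutoTokenizer

# Where downloaded weights are stored; the patch hard-codes the Paperspace path.
cache_dir = os.environ.get("HF_MODEL_CACHE", "/home/paperspace/cache")

model_id = "meta-llama/Llama-2-7b-hf"  # illustrative id, not fixed by the patch

# As in the surrounding code, OpenELM checkpoints borrow the Llama-2 tokenizer.
tokenizer = AutoTokenizer.from_pretrained(
    "meta-llama/Llama-2-7b-hf" if "openelm" in model_id.lower() else model_id,
    trust_remote_code=True,
)

model = AutoModelForCausalLM.from_pretrained(
    model_id,
    trust_remote_code=True,  # allow repos that ship custom modeling code
    device_map="auto",       # spread weights across the available devices
    torch_dtype="auto",      # keep the checkpoint's native dtype
    cache_dir=cache_dir,     # download and read weights under this directory
)
```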