AIArchitect23
/

qwen2-0.5b-arxiv-300

Text Generation

text-generation-inference

Model card Files and versions

AIArchitect23 committed on Mar 30

Commit

6228932

·

verified ·

1 Parent(s): 2af4a10

Upload Qwen2ForCausalLM

Files changed (3) hide show

README.md +21 -21
config.json +2 -2
generation_config.json +1 -1

README.md CHANGED Viewed

@@ -1,29 +1,29 @@
 ---
 language:
-  - en
-license: apache-2.0
-tags:
-  - qwen
-  - arxiv
-  - science
-  - research
-  - causal-lm
 library_name: transformers
 pipeline_tag: text-generation
-base_model: Qwen/Qwen2-0.5B-Instruct
 model-index:
-  - name: Qwen2-0.5B-ArXiv
-    results:
-      - task:
-          type: text-generation
-          name: Scientific text generation
-        dataset:
-          type: arxiv
-          name: ArXiv
-        metrics:
-          - type: loss
-            value: 1.76
-            name: training loss
 ---
 # 🌌 The Qwen2-0.5B-ArXiv Oracle 🌌

 ---
+base_model: Qwen/Qwen2-0.5B-Instruct
 language:
+- en
 library_name: transformers
+license: apache-2.0
 pipeline_tag: text-generation
+tags:
+- qwen
+- arxiv
+- science
+- research
+- causal-lm
 model-index:
+- name: Qwen2-0.5B-ArXiv
+  results:
+  - task:
+      type: text-generation
+      name: Scientific text generation
+    dataset:
+      name: ArXiv
+      type: arxiv
+    metrics:
+    - type: loss
+      value: 1.76
+      name: training loss
 ---
 # 🌌 The Qwen2-0.5B-ArXiv Oracle 🌌

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "./qwen2-0.5b-arxiv-300",
   "architectures": [
     "Qwen2ForCausalLM"
   ],
@@ -21,7 +21,7 @@
   "sliding_window": null,
   "tie_word_embeddings": true,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.48.3",
   "use_cache": false,
   "use_sliding_window": false,
   "vocab_size": 151936

 {
+  "_name_or_path": "/home/nicknames/SN80/axolotl/qwen2-0.5b-arxiv-300-safetensors/",
   "architectures": [
     "Qwen2ForCausalLM"
   ],
   "sliding_window": null,
   "tie_word_embeddings": true,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.44.1",
   "use_cache": false,
   "use_sliding_window": false,
   "vocab_size": 151936

generation_config.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "_from_model_config": true,
   "eos_token_id": 151645,
-  "transformers_version": "4.48.3",
   "use_cache": false
 }

 {
   "_from_model_config": true,
   "eos_token_id": 151645,
+  "transformers_version": "4.44.1",
   "use_cache": false
 }