Buggod committed on
Commit
9cc53ff
·
verified ·
1 Parent(s): 22a8539

Training in progress, step 50

Browse files
.ipynb_checkpoints/all_results-checkpoint.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "total_flos": 0.0,
3
+ "train_loss": 0.16526810049655613,
4
+ "train_runtime": 49656.4521,
5
+ "train_samples": 7000,
6
+ "train_samples_per_second": 0.483,
7
+ "train_steps_per_second": 0.01
8
+ }
.ipynb_checkpoints/generation_config-checkpoint.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 151646,
4
+ "do_sample": true,
5
+ "eos_token_id": 151643,
6
+ "temperature": 0.6,
7
+ "top_p": 0.95,
8
+ "transformers_version": "4.50.0"
9
+ }
.ipynb_checkpoints/train_results-checkpoint.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "total_flos": 0.0,
3
+ "train_loss": 0.16526810049655613,
4
+ "train_runtime": 49656.4521,
5
+ "train_samples": 7000,
6
+ "train_samples_per_second": 0.483,
7
+ "train_steps_per_second": 0.01
8
+ }
config.json CHANGED
@@ -22,7 +22,7 @@
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "bfloat16",
24
  "transformers_version": "4.50.0",
25
- "use_cache": true,
26
  "use_mrope": false,
27
  "use_sliding_window": false,
28
  "vocab_size": 151936
 
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "bfloat16",
24
  "transformers_version": "4.50.0",
25
+ "use_cache": false,
26
  "use_mrope": false,
27
  "use_sliding_window": false,
28
  "vocab_size": 151936
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51c29c6ff6aa4c71fa2667d4813595081aaeb49489769e7df8845cd682538d2a
3
  size 3554214752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5802e312c34f55feb031067c11668f23a4d765ebb4b8b2f8022360c38c4228e4
3
  size 3554214752
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59a3c6b46281b4adeff4678921308ef393abea46e619b88e7865c81196c32f86
3
- size 8568
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77372817777ee57a39496dcf790c82cf535ccb75d7e464e4f98eb6cf7d9fece5
3
+ size 8376