arthurwangheng committed on
Commit
dce4092
·
verified ·
1 Parent(s): 1d1487f

Training in progress, step 300

Browse files
Files changed (3) hide show
  1. config.json +1 -1
  2. model.safetensors +1 -1
  3. training_args.bin +1 -1
config.json CHANGED
@@ -23,7 +23,7 @@
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.49.0",
26
- "use_cache": true,
27
  "use_mrope": false,
28
  "use_sliding_window": false,
29
  "vocab_size": 151936
 
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.49.0",
26
+ "use_cache": false,
27
  "use_mrope": false,
28
  "use_sliding_window": false,
29
  "vocab_size": 151936
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf624d362d25a4b73337556a85ceeecf5fe6e5b3c1d75b1cf30cd876edf75266
3
  size 3554214752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07322ee26419ce5e5f9d31a8717407d7f812d3f73b802a7630b0e68859685cf5
3
  size 3554214752
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b51a3d92ccf4f5f2c5e66cc8c2503d6e4434dd3b78a96957c3ba0cc21074925
3
  size 8696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:854c535ab358fbb80a81ef44bb4c8d2f3b0a80c459642d2360048c6921aab90a
3
  size 8696