fauzansalim committed on
Commit
efbafdd
·
verified ·
1 Parent(s): 34ea616

Training in progress, epoch 0

Browse files
Files changed (3) hide show
  1. config.json +5 -5
  2. generation_config.json +1 -1
  3. model.safetensors +2 -2
config.json CHANGED
@@ -22,16 +22,16 @@
22
  "init_std": 0.02,
23
  "is_decoder": true,
24
  "is_encoder_decoder": false,
25
- "max_length": 768,
26
- "max_position_embeddings": 768,
27
  "model_type": "mbart",
28
  "num_hidden_layers": 12,
29
  "scale_embedding": true,
30
  "torch_dtype": "float32",
31
  "use_cache": true,
32
- "vocab_size": 57627
33
  },
34
- "decoder_start_token_id": 57626,
35
  "encoder": {
36
  "attention_probs_dropout_prob": 0.0,
37
  "depths": [
@@ -46,7 +46,7 @@
46
  "hidden_dropout_prob": 0.0,
47
  "hidden_size": 1024,
48
  "image_size": [
49
- 1280,
50
  960
51
  ],
52
  "initializer_range": 0.02,
 
22
  "init_std": 0.02,
23
  "is_decoder": true,
24
  "is_encoder_decoder": false,
25
+ "max_length": 1024,
26
+ "max_position_embeddings": 1536,
27
  "model_type": "mbart",
28
  "num_hidden_layers": 12,
29
  "scale_embedding": true,
30
  "torch_dtype": "float32",
31
  "use_cache": true,
32
+ "vocab_size": 57572
33
  },
34
+ "decoder_start_token_id": 57571,
35
  "encoder": {
36
  "attention_probs_dropout_prob": 0.0,
37
  "depths": [
 
46
  "hidden_dropout_prob": 0.0,
47
  "hidden_size": 1024,
48
  "image_size": [
49
+ 960,
50
  960
51
  ],
52
  "initializer_range": 0.02,
generation_config.json CHANGED
@@ -3,7 +3,7 @@
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
  "forced_eos_token_id": 2,
6
- "max_length": 768,
7
  "pad_token_id": 1,
8
  "transformers_version": "4.51.3"
9
  }
 
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
  "forced_eos_token_id": 2,
6
+ "max_length": 1024,
7
  "pad_token_id": 1,
8
  "transformers_version": "4.51.3"
9
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab61ebc6e55a44570085d89e955630b0d8bbd985cd5224a1c4156e9f4dc7418c
3
- size 806342808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddc6ed20531fa637ee73b9a60b269795c1671552a73b120c46b93fbc08be3c53
3
+ size 809263256