jatinshah committed on
Commit
b28ca2c
·
1 Parent(s): 69b6f30

Training in progress, epoch 1

Browse files
Files changed (23) hide show
  1. .gitignore +1 -0
  2. config.json +60 -0
  3. pytorch_model.bin +3 -0
  4. runs/Feb14_04-25-37_n4dps79gja/1644813729.5560415/events.out.tfevents.1644813729.n4dps79gja.1520.1 +3 -0
  5. runs/Feb14_04-25-37_n4dps79gja/events.out.tfevents.1644813686.n4dps79gja.1520.0 +3 -0
  6. runs/Feb14_04-42-17_n4dps79gja/1644813751.910177/events.out.tfevents.1644813751.n4dps79gja.1520.3 +3 -0
  7. runs/Feb14_04-42-17_n4dps79gja/events.out.tfevents.1644813751.n4dps79gja.1520.2 +3 -0
  8. runs/Feb14_04-42-46_n4dps79gja/1644813774.0708055/events.out.tfevents.1644813774.n4dps79gja.1520.5 +3 -0
  9. runs/Feb14_04-42-46_n4dps79gja/events.out.tfevents.1644813774.n4dps79gja.1520.4 +3 -0
  10. runs/Feb14_04-43-07_n4dps79gja/1644813795.6215308/events.out.tfevents.1644813795.n4dps79gja.1520.7 +3 -0
  11. runs/Feb14_04-43-07_n4dps79gja/events.out.tfevents.1644813795.n4dps79gja.1520.6 +3 -0
  12. runs/Feb14_04-44-09_n4dps79gja/1644813864.8714516/events.out.tfevents.1644813864.n4dps79gja.1947.1 +3 -0
  13. runs/Feb14_04-44-09_n4dps79gja/events.out.tfevents.1644813864.n4dps79gja.1947.0 +3 -0
  14. runs/Feb14_04-45-19_n4dps79gja/1644813930.040967/events.out.tfevents.1644813930.n4dps79gja.2056.1 +3 -0
  15. runs/Feb14_04-45-19_n4dps79gja/events.out.tfevents.1644813930.n4dps79gja.2056.0 +3 -0
  16. runs/Feb14_04-46-00_n4dps79gja/1644813971.4850163/events.out.tfevents.1644813971.n4dps79gja.2154.1 +3 -0
  17. runs/Feb14_04-46-00_n4dps79gja/events.out.tfevents.1644813971.n4dps79gja.2154.0 +3 -0
  18. source.spm +0 -0
  19. special_tokens_map.json +1 -0
  20. target.spm +0 -0
  21. tokenizer_config.json +1 -0
  22. training_args.bin +3 -0
  23. vocab.json +0 -0
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Helsinki-NLP/opus-mt-en-fr",
3
+ "_num_labels": 3,
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "swish",
6
+ "add_bias_logits": false,
7
+ "add_final_layer_norm": false,
8
+ "architectures": [
9
+ "MarianMTModel"
10
+ ],
11
+ "attention_dropout": 0.0,
12
+ "bad_words_ids": [
13
+ [
14
+ 59513
15
+ ]
16
+ ],
17
+ "bos_token_id": 0,
18
+ "classif_dropout": 0.0,
19
+ "classifier_dropout": 0.0,
20
+ "d_model": 512,
21
+ "decoder_attention_heads": 8,
22
+ "decoder_ffn_dim": 2048,
23
+ "decoder_layerdrop": 0.0,
24
+ "decoder_layers": 6,
25
+ "decoder_start_token_id": 59513,
26
+ "dropout": 0.1,
27
+ "encoder_attention_heads": 8,
28
+ "encoder_ffn_dim": 2048,
29
+ "encoder_layerdrop": 0.0,
30
+ "encoder_layers": 6,
31
+ "eos_token_id": 0,
32
+ "forced_eos_token_id": 0,
33
+ "gradient_checkpointing": false,
34
+ "id2label": {
35
+ "0": "LABEL_0",
36
+ "1": "LABEL_1",
37
+ "2": "LABEL_2"
38
+ },
39
+ "init_std": 0.02,
40
+ "is_encoder_decoder": true,
41
+ "label2id": {
42
+ "LABEL_0": 0,
43
+ "LABEL_1": 1,
44
+ "LABEL_2": 2
45
+ },
46
+ "max_length": 512,
47
+ "max_position_embeddings": 512,
48
+ "model_type": "marian",
49
+ "normalize_before": false,
50
+ "normalize_embedding": false,
51
+ "num_beams": 4,
52
+ "num_hidden_layers": 6,
53
+ "pad_token_id": 59513,
54
+ "scale_embedding": true,
55
+ "static_position_embeddings": true,
56
+ "torch_dtype": "float32",
57
+ "transformers_version": "4.16.2",
58
+ "use_cache": true,
59
+ "vocab_size": 59514
60
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf196d0cd4f25bae5fb6dd2d010466de4f778bab2e743e38b11451a78f22057
3
+ size 298771077
runs/Feb14_04-25-37_n4dps79gja/1644813729.5560415/events.out.tfevents.1644813729.n4dps79gja.1520.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8052ed2814707ffd060e9bcaea76f8623211c4a1610d6c1ccac112a6144eb7f2
3
+ size 5028
runs/Feb14_04-25-37_n4dps79gja/events.out.tfevents.1644813686.n4dps79gja.1520.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8634fe5c3d86388dd20f5ef499faefa01565b36c09566bd85c3d1c62e6972d3
3
+ size 4539
runs/Feb14_04-42-17_n4dps79gja/1644813751.910177/events.out.tfevents.1644813751.n4dps79gja.1520.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d97492847c0dd3a03de7187c95206b0bb1be6cb270f495e34944e8c0f212463
3
+ size 5028
runs/Feb14_04-42-17_n4dps79gja/events.out.tfevents.1644813751.n4dps79gja.1520.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18e3a8d09cbb81a2e058e23ef00a858e27afbbcc4c7e10160f90902a73820934
3
+ size 4147
runs/Feb14_04-42-46_n4dps79gja/1644813774.0708055/events.out.tfevents.1644813774.n4dps79gja.1520.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10c25bfdf407d7821a150f9dad8f67a48e28ae5de862e717582d600319261eb9
3
+ size 5028
runs/Feb14_04-42-46_n4dps79gja/events.out.tfevents.1644813774.n4dps79gja.1520.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccee7fe6ab2d6047b6ba506bcba34009440dd11e41c8a95ef8b09023673bb390
3
+ size 4146
runs/Feb14_04-43-07_n4dps79gja/1644813795.6215308/events.out.tfevents.1644813795.n4dps79gja.1520.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ad7ae3601814089b3bd3e05fef57956ea01d2da1d6cf1e2d3bd3601d05ab66a
3
+ size 5028
runs/Feb14_04-43-07_n4dps79gja/events.out.tfevents.1644813795.n4dps79gja.1520.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e54268fd7785f3841f72fddeb4b05fa901a8aa0accdd8a18b78638b801e936f2
3
+ size 4145
runs/Feb14_04-44-09_n4dps79gja/1644813864.8714516/events.out.tfevents.1644813864.n4dps79gja.1947.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c00f93da896368e173d484574ebd05d1e6efdbc05cd9a59bb1d1889c000dcb1
3
+ size 5028
runs/Feb14_04-44-09_n4dps79gja/events.out.tfevents.1644813864.n4dps79gja.1947.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6b992c88770bb66f177bda6bc9c4d5da179cd2bfadbf4045d07469063f308ed
3
+ size 4145
runs/Feb14_04-45-19_n4dps79gja/1644813930.040967/events.out.tfevents.1644813930.n4dps79gja.2056.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b006d4c8e80d5ed06e40fb6351b944c6c96d0650b5f216347fff5c3ed9ad9ecb
3
+ size 5028
runs/Feb14_04-45-19_n4dps79gja/events.out.tfevents.1644813930.n4dps79gja.2056.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:083437bc3fd84bd04762af5de1aac23952096a414f36fb0b17f5bd0899ebe615
3
+ size 4146
runs/Feb14_04-46-00_n4dps79gja/1644813971.4850163/events.out.tfevents.1644813971.n4dps79gja.2154.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:834d0e8f19fa3a2ffdaab34703a28c68d51afc5a2ea55c216f95b5fa501a7137
3
+ size 5028
runs/Feb14_04-46-00_n4dps79gja/events.out.tfevents.1644813971.n4dps79gja.2154.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e49ec20d4cfac3271212bbb9f1f11558c1127ece0899afebc0945fafd6966335
3
+ size 4930
source.spm ADDED
Binary file (778 kB). View file
 
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}
target.spm ADDED
Binary file (802 kB). View file
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"source_lang": "en", "target_lang": "fr", "unk_token": "<unk>", "eos_token": "</s>", "pad_token": "<pad>", "model_max_length": 512, "sp_model_kwargs": {}, "return_tensors": "tf", "special_tokens_map_file": null, "tokenizer_file": null, "name_or_path": "Helsinki-NLP/opus-mt-en-fr", "tokenizer_class": "MarianTokenizer"}
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2e0e4d6bda108f91243d7523ce75afc2a6047b4c9381565333523dae947125a
3
+ size 3247
vocab.json ADDED
The diff for this file is too large to render. See raw diff