Ketskapow committed on Feb 27, 2024

Commit

7122882

verified ·

1 Parent(s): 48c5f3f

Training in progress, epoch 2

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-4/checkpoint-214/config.json +25 -0
run-4/checkpoint-214/model.safetensors +3 -0
run-4/checkpoint-214/optimizer.pt +3 -0
run-4/checkpoint-214/rng_state.pth +3 -0
run-4/checkpoint-214/scheduler.pt +3 -0
run-4/checkpoint-214/special_tokens_map.json +7 -0
run-4/checkpoint-214/tokenizer.json +0 -0
run-4/checkpoint-214/tokenizer_config.json +55 -0
run-4/checkpoint-214/trainer_state.json +44 -0
run-4/checkpoint-214/training_args.bin +3 -0
run-4/checkpoint-214/vocab.txt +0 -0
run-4/checkpoint-321/config.json +25 -0
run-4/checkpoint-321/model.safetensors +3 -0
run-4/checkpoint-321/optimizer.pt +3 -0
run-4/checkpoint-321/rng_state.pth +3 -0
run-4/checkpoint-321/scheduler.pt +3 -0
run-4/checkpoint-321/special_tokens_map.json +7 -0
run-4/checkpoint-321/tokenizer.json +0 -0
run-4/checkpoint-321/tokenizer_config.json +55 -0
run-4/checkpoint-321/trainer_state.json +53 -0
run-4/checkpoint-321/training_args.bin +3 -0
run-4/checkpoint-321/vocab.txt +0 -0
run-8/checkpoint-108/config.json +25 -0
run-8/checkpoint-108/model.safetensors +3 -0
run-8/checkpoint-108/optimizer.pt +3 -0
run-8/checkpoint-108/rng_state.pth +3 -0
run-8/checkpoint-108/scheduler.pt +3 -0
run-8/checkpoint-108/special_tokens_map.json +7 -0
run-8/checkpoint-108/tokenizer.json +0 -0
run-8/checkpoint-108/tokenizer_config.json +55 -0
run-8/checkpoint-108/trainer_state.json +62 -0
run-8/checkpoint-108/training_args.bin +3 -0
run-8/checkpoint-108/vocab.txt +0 -0
run-8/checkpoint-135/config.json +25 -0
run-8/checkpoint-135/model.safetensors +3 -0
run-8/checkpoint-135/optimizer.pt +3 -0
run-8/checkpoint-135/rng_state.pth +3 -0
run-8/checkpoint-135/scheduler.pt +3 -0
run-8/checkpoint-135/special_tokens_map.json +7 -0
run-8/checkpoint-135/tokenizer.json +0 -0
run-8/checkpoint-135/tokenizer_config.json +55 -0
run-8/checkpoint-135/trainer_state.json +71 -0
run-8/checkpoint-135/training_args.bin +3 -0
run-8/checkpoint-135/vocab.txt +0 -0
run-8/checkpoint-27/config.json +25 -0
run-8/checkpoint-27/model.safetensors +3 -0
run-8/checkpoint-27/optimizer.pt +3 -0
run-8/checkpoint-27/rng_state.pth +3 -0
run-8/checkpoint-27/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:abae716af60ef08df4cfda8630d61b2a17e55b01951217054670529e3ef70248
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:77c2b7529d0fc011f1b68431931d2abd099e58914e531726ff0d1d6e228bf763
 size 267832560

run-4/checkpoint-214/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-4/checkpoint-214/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e4f0139b7c3cdc552269a802a493048ead5da175b3107303662e7b32c7882e0
+size 267832560

run-4/checkpoint-214/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be58717a40696dded28f6d1f3ec856fd22a3ef9d249bac0a8f343ff2ba786aae
+size 535727290

run-4/checkpoint-214/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c1e684b224f52ebe6d621443c80e405395f81e1d76627f9c4e29b63d527940e4
+size 14308

run-4/checkpoint-214/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8040697797fc04e139c6db45c3deb11e44d2e8d790bf2037c11c71d63361ed0e
+size 1064

run-4/checkpoint-214/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-214/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-214/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-214/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.22572628843417145,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-214",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 214,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6111112833023071,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6707,
+      "eval_samples_per_second": 1555.045,
+      "eval_steps_per_second": 98.402,
+      "step": 107
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.650396466255188,
+      "eval_matthews_correlation": 0.22572628843417145,
+      "eval_runtime": 0.753,
+      "eval_samples_per_second": 1385.204,
+      "eval_steps_per_second": 87.654,
+      "step": 214
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 321,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 9.050087494888513e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 8,
+    "seed": 24
+  }
+}

run-4/checkpoint-214/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e59fc4da2d33b8f536673ffdc9385a7429d46124b8cb2a495dc6969510ec995d
+size 4984

run-4/checkpoint-214/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-321/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-4/checkpoint-321/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0508bdffc60258a68e62e759a60e6f8d636d93435f85b55b0c24f94878f79f55
+size 267832560

run-4/checkpoint-321/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:97a0c1273d1694d2b9b59f596c3eec6c59d00b6e775ae27c7d0dc7a28a844f00
+size 535727290

run-4/checkpoint-321/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4fdcf411aa064e6835685d69d21c63e9b81392a6ec2fadcce4e9d337b1fbdae2
+size 14308

run-4/checkpoint-321/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e70c2b185b8264cccd10b048a578ff29a46b36b24a1975b4b906ba570662ad88
+size 1064

run-4/checkpoint-321/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-321/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-4/checkpoint-321/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-4/checkpoint-321/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.22572628843417145,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-214",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 321,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6111112833023071,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6707,
+      "eval_samples_per_second": 1555.045,
+      "eval_steps_per_second": 98.402,
+      "step": 107
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.650396466255188,
+      "eval_matthews_correlation": 0.22572628843417145,
+      "eval_runtime": 0.753,
+      "eval_samples_per_second": 1385.204,
+      "eval_steps_per_second": 87.654,
+      "step": 214
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 1.3015365600585938,
+      "eval_matthews_correlation": 0.21894626694065988,
+      "eval_runtime": 0.7997,
+      "eval_samples_per_second": 1304.27,
+      "eval_steps_per_second": 82.533,
+      "step": 321
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 321,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 9.050087494888513e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 8,
+    "seed": 24
+  }
+}

run-4/checkpoint-321/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e59fc4da2d33b8f536673ffdc9385a7429d46124b8cb2a495dc6969510ec995d
+size 4984

run-4/checkpoint-321/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-108/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-108/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aaef06a1cc1d4e112e67871fca687aafa3d24657847fa0c22c205d25b7c775ae
+size 267832560

run-8/checkpoint-108/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b245908c522b88cb8f7f2a511e1b243dff201706782fc4456f53df8704b2d8cb
+size 535727290

run-8/checkpoint-108/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8371dc77c66ec96b24e07becbfd23d83184b32b0a0b84acb61d7a72d8d68afb9
+size 14180

run-8/checkpoint-108/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77ca4ce0092abbb024680e1b49996d2783572933a476354c0f90e7bc9a33a0ac
+size 1064

run-8/checkpoint-108/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-108/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-108/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-108/trainer_state.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-8/checkpoint-27",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.633733332157135,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6697,
+      "eval_samples_per_second": 1557.488,
+      "eval_steps_per_second": 98.556,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6165023446083069,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7416,
+      "eval_samples_per_second": 1406.449,
+      "eval_steps_per_second": 88.999,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6124085187911987,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.1629,
+      "eval_samples_per_second": 896.912,
+      "eval_steps_per_second": 56.756,
+      "step": 81
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.6108661890029907,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7826,
+      "eval_samples_per_second": 1332.656,
+      "eval_steps_per_second": 84.329,
+      "step": 108
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 3.31601991514513e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 10
+  }
+}

run-8/checkpoint-108/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:876f865852373c961be6839854711de35bf3d97e08e0fde070ac6f4b53432187
+size 4984

run-8/checkpoint-108/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-135/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-135/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a97b8b070c5c3ed33550d8d9c98ac0f5b717087c304e2d27c075b647f127147f
+size 267832560

run-8/checkpoint-135/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4d6efd5841a5acf584c47deed17fefdf3f785072873976e655342182e65313b5
+size 535727290

run-8/checkpoint-135/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1cd53b90dd5a4c271bf3850d8fe3d9864fcd30be7cb64af7d81ffd526a334aa4
+size 14180

run-8/checkpoint-135/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b6cb31490cf03be26cb0df4d192cf8a6d29826537255b2c44e6ae1923421423f
+size 1064

run-8/checkpoint-135/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-135/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-135/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-135/trainer_state.json ADDED Viewed

	@@ -0,0 +1,71 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-8/checkpoint-27",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 135,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.633733332157135,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6697,
+      "eval_samples_per_second": 1557.488,
+      "eval_steps_per_second": 98.556,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6165023446083069,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7416,
+      "eval_samples_per_second": 1406.449,
+      "eval_steps_per_second": 88.999,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6124085187911987,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.1629,
+      "eval_samples_per_second": 896.912,
+      "eval_steps_per_second": 56.756,
+      "step": 81
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.6108661890029907,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7826,
+      "eval_samples_per_second": 1332.656,
+      "eval_steps_per_second": 84.329,
+      "step": 108
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 0.6103748679161072,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.0941,
+      "eval_samples_per_second": 953.3,
+      "eval_steps_per_second": 60.324,
+      "step": 135
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 3.31601991514513e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 10
+  }
+}

run-8/checkpoint-135/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:876f865852373c961be6839854711de35bf3d97e08e0fde070ac6f4b53432187
+size 4984

run-8/checkpoint-135/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-27/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-27/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:86cab5e1e8bf70cc615f5e3eab427a5d30df34194b2a7d193ccee770db5eabe3
+size 267832560

run-8/checkpoint-27/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:724aaaa5536cfc3ae2a3b5ddb577bdf4e90876847e63f45f9dca48dc7cb3801b
+size 535727290

run-8/checkpoint-27/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be2e61cfb32bd0131c8524d0f66b7881e91890fc6d136be5e1c3e92c518e8271
+size 14180

run-8/checkpoint-27/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:70d1d5e7125cc0cda6a38bbc08512bb9d0ed1e6f604b45d474557ef44cdb6824
+size 1064