kbberendsen committed on Feb 27, 2024

Commit

962ee1d

verified ·

1 Parent(s): cdc1a22

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-5/checkpoint-108/config.json +25 -0
run-5/checkpoint-108/model.safetensors +3 -0
run-5/checkpoint-108/optimizer.pt +3 -0
run-5/checkpoint-108/rng_state.pth +3 -0
run-5/checkpoint-108/scheduler.pt +3 -0
run-5/checkpoint-108/special_tokens_map.json +7 -0
run-5/checkpoint-108/tokenizer.json +0 -0
run-5/checkpoint-108/tokenizer_config.json +55 -0
run-5/checkpoint-108/trainer_state.json +44 -0
run-5/checkpoint-108/training_args.bin +3 -0
run-5/checkpoint-108/vocab.txt +0 -0
run-6/checkpoint-14/config.json +25 -0
run-6/checkpoint-14/model.safetensors +3 -0
run-6/checkpoint-14/optimizer.pt +3 -0
run-6/checkpoint-14/rng_state.pth +3 -0
run-6/checkpoint-14/scheduler.pt +3 -0
run-6/checkpoint-14/special_tokens_map.json +7 -0
run-6/checkpoint-14/tokenizer.json +0 -0
run-6/checkpoint-14/tokenizer_config.json +55 -0
run-6/checkpoint-14/trainer_state.json +35 -0
run-6/checkpoint-14/training_args.bin +3 -0
run-6/checkpoint-14/vocab.txt +0 -0
run-6/checkpoint-28/config.json +25 -0
run-6/checkpoint-28/model.safetensors +3 -0
run-6/checkpoint-28/optimizer.pt +3 -0
run-6/checkpoint-28/rng_state.pth +3 -0
run-6/checkpoint-28/scheduler.pt +3 -0
run-6/checkpoint-28/special_tokens_map.json +7 -0
run-6/checkpoint-28/tokenizer.json +0 -0
run-6/checkpoint-28/tokenizer_config.json +55 -0
run-6/checkpoint-28/trainer_state.json +44 -0
run-6/checkpoint-28/training_args.bin +3 -0
run-6/checkpoint-28/vocab.txt +0 -0
run-6/checkpoint-42/config.json +25 -0
run-6/checkpoint-42/model.safetensors +3 -0
run-6/checkpoint-42/optimizer.pt +3 -0
run-6/checkpoint-42/rng_state.pth +3 -0
run-6/checkpoint-42/scheduler.pt +3 -0
run-6/checkpoint-42/special_tokens_map.json +7 -0
run-6/checkpoint-42/tokenizer.json +0 -0
run-6/checkpoint-42/tokenizer_config.json +55 -0
run-6/checkpoint-42/trainer_state.json +53 -0
run-6/checkpoint-42/training_args.bin +3 -0
run-6/checkpoint-42/vocab.txt +0 -0
run-6/checkpoint-56/config.json +25 -0
run-6/checkpoint-56/model.safetensors +3 -0
run-6/checkpoint-56/optimizer.pt +3 -0
run-6/checkpoint-56/rng_state.pth +3 -0
run-6/checkpoint-56/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0bbf877073a9713d16c87b087bcc1bebfe560f12c2c9cba91b180f7cc275c7b1
+oid sha256:8df23a34fff6106c674cfa449cebe353dc52f8e19e68422c6659c24d3d691429
 size 267832560

run-5/checkpoint-108/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-5/checkpoint-108/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9c7f4488b2b748037f98e7a6c9feeda7f406b46de98484670c7288f25f5a84f5
+size 267832560

run-5/checkpoint-108/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5a1adedb23733924ac3975c626f5c71af781780ac53becee41a9396509d1d11e
+size 535727290

run-5/checkpoint-108/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2a976334fa343d2f8eb913d35a4116d1ea2c1500747f22b688e8d43721d7f320
+size 14244

run-5/checkpoint-108/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d4928d1fae39492f272735df0c2c91e218ae336a6337eaef8e871a259ea447f1
+size 1064

run-5/checkpoint-108/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-5/checkpoint-108/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-5/checkpoint-108/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-5/checkpoint-108/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-5/checkpoint-54",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6223766207695007,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7165,
+      "eval_samples_per_second": 1455.603,
+      "eval_steps_per_second": 92.109,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6125382781028748,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8176,
+      "eval_samples_per_second": 1275.667,
+      "eval_steps_per_second": 80.723,
+      "step": 108
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.6586381863896615e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 16,
+    "seed": 23
+  }
+}

run-5/checkpoint-108/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bf05262a2ee600d4bc72f4472c7df009ef0f8da02a622b920dc4c1da59d98947
+size 4984

run-5/checkpoint-108/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-14/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-14/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:80bffceba74fadd0cd12bb130b52708bce3d6eecc45e229ecbaad092ab341815
+size 267832560

run-6/checkpoint-14/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:82e7303162e105ea68f9b4facdee2c83141ca69bb414d512eafd9d1e8954ac0b
+size 535727290

run-6/checkpoint-14/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e4ed288cd1d7f33983e156ebb2b0d229399c8436f09fc8fec974bc8a222d9801
+size 14308

run-6/checkpoint-14/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ded82efe92faf57d0e25b15a8d053639d82890ef5465631ae57a94232cdaed3
+size 1064

run-6/checkpoint-14/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-14/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-14/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-14/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.01845565733408863,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-14",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 14,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6778180599212646,
+      "eval_matthews_correlation": 0.01845565733408863,
+      "eval_runtime": 1.2856,
+      "eval_samples_per_second": 811.291,
+      "eval_steps_per_second": 51.338,
+      "step": 14
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 56,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.3409355672779142e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 64,
+    "seed": 17
+  }
+}

run-6/checkpoint-14/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7482407793d8c83d435fc746c3a21bf6bca34e9902d1310a394eabf83b64a64f
+size 4984

run-6/checkpoint-14/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-28/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-28/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:95bcefdb8592f1e75fd6019533cefec74ca422d130c6e597f384566e9f1a0c72
+size 267832560

run-6/checkpoint-28/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:36559365d77d92eb77ece2ff98ac759fdd35809d1e137aa7797c33953aa77b73
+size 535727290

run-6/checkpoint-28/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2fc36f9eb920a6c89e2fa6d5af3217dfa8b6a4addb2fd9e3640535336f63d888
+size 14308

run-6/checkpoint-28/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:abb1cdfb3c19d7f5275897a998405cbea9156f4c717f85133ddc956ea6841756
+size 1064

run-6/checkpoint-28/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-28/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-28/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-28/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.01845565733408863,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-14",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 28,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6778180599212646,
+      "eval_matthews_correlation": 0.01845565733408863,
+      "eval_runtime": 1.2856,
+      "eval_samples_per_second": 811.291,
+      "eval_steps_per_second": 51.338,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.669923722743988,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7843,
+      "eval_samples_per_second": 1329.908,
+      "eval_steps_per_second": 84.155,
+      "step": 28
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 56,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.3409355672779142e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 64,
+    "seed": 17
+  }
+}

run-6/checkpoint-28/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7482407793d8c83d435fc746c3a21bf6bca34e9902d1310a394eabf83b64a64f
+size 4984

run-6/checkpoint-28/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-42/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-42/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5995045e3f170944280bd5bb43d6dd7930e42372b6fcd49af1f359b815d2299e
+size 267832560

run-6/checkpoint-42/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8c2d9df33a06d7912823e286252a2179125bac489225d0f23f670b7723d2481b
+size 535727290

run-6/checkpoint-42/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4351b22bdcc61e76de8acd65d8fb65e5aa258557cf250f57ae4aace13f907a65
+size 14308

run-6/checkpoint-42/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ceb8ae7c9e28abf885706548b41b1abccbbac37cbed073aa9a0f8948b69ee74
+size 1064

run-6/checkpoint-42/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-42/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-42/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-42/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.01845565733408863,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-14",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 42,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6778180599212646,
+      "eval_matthews_correlation": 0.01845565733408863,
+      "eval_runtime": 1.2856,
+      "eval_samples_per_second": 811.291,
+      "eval_steps_per_second": 51.338,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.669923722743988,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7843,
+      "eval_samples_per_second": 1329.908,
+      "eval_steps_per_second": 84.155,
+      "step": 28
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6650601625442505,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.4023,
+      "eval_samples_per_second": 743.777,
+      "eval_steps_per_second": 47.065,
+      "step": 42
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 56,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.3409355672779142e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 64,
+    "seed": 17
+  }
+}

run-6/checkpoint-42/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7482407793d8c83d435fc746c3a21bf6bca34e9902d1310a394eabf83b64a64f
+size 4984

run-6/checkpoint-42/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-56/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-56/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:03b9c2dad5451c2948d325d080ce2e80d02c9a71346df761cf483a9a87047971
+size 267832560

run-6/checkpoint-56/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2791ef0a32fc567e4912ae3115c8d1c488d67ac81656c48d78f8ae7101452727
+size 535727290

run-6/checkpoint-56/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c55e70547a976f4a79e02c6eba2f7e52fb42a748f35730d8cbdf4d340819dd29
+size 14308

run-6/checkpoint-56/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7185a8249b0d5c124fc96a5829cf631445dc527176cb5f6e59fe5c540977b37c
+size 1064