kbberendsen committed on Feb 27, 2024

Commit

d4f7847

verified ·

1 Parent(s): d05ba30

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-0/checkpoint-107/config.json +25 -0
run-0/checkpoint-107/model.safetensors +3 -0
run-0/checkpoint-107/optimizer.pt +3 -0
run-0/checkpoint-107/rng_state.pth +3 -0
run-0/checkpoint-107/scheduler.pt +3 -0
run-0/checkpoint-107/special_tokens_map.json +7 -0
run-0/checkpoint-107/tokenizer.json +0 -0
run-0/checkpoint-107/tokenizer_config.json +55 -0
run-0/checkpoint-107/trainer_state.json +35 -0
run-0/checkpoint-107/training_args.bin +3 -0
run-0/checkpoint-107/vocab.txt +0 -0
run-1/checkpoint-108/config.json +25 -0
run-1/checkpoint-108/model.safetensors +3 -0
run-1/checkpoint-108/optimizer.pt +3 -0
run-1/checkpoint-108/rng_state.pth +3 -0
run-1/checkpoint-108/scheduler.pt +3 -0
run-1/checkpoint-108/special_tokens_map.json +7 -0
run-1/checkpoint-108/tokenizer.json +0 -0
run-1/checkpoint-108/tokenizer_config.json +55 -0
run-1/checkpoint-108/trainer_state.json +44 -0
run-1/checkpoint-108/training_args.bin +3 -0
run-1/checkpoint-108/vocab.txt +0 -0
run-1/checkpoint-162/config.json +25 -0
run-1/checkpoint-162/model.safetensors +3 -0
run-1/checkpoint-162/optimizer.pt +3 -0
run-1/checkpoint-162/rng_state.pth +3 -0
run-1/checkpoint-162/scheduler.pt +3 -0
run-1/checkpoint-162/special_tokens_map.json +7 -0
run-1/checkpoint-162/tokenizer.json +0 -0
run-1/checkpoint-162/tokenizer_config.json +55 -0
run-1/checkpoint-162/trainer_state.json +53 -0
run-1/checkpoint-162/training_args.bin +3 -0
run-1/checkpoint-162/vocab.txt +0 -0
run-1/checkpoint-216/config.json +25 -0
run-1/checkpoint-216/model.safetensors +3 -0
run-1/checkpoint-216/optimizer.pt +3 -0
run-1/checkpoint-216/rng_state.pth +3 -0
run-1/checkpoint-216/scheduler.pt +3 -0
run-1/checkpoint-216/special_tokens_map.json +7 -0
run-1/checkpoint-216/tokenizer.json +0 -0
run-1/checkpoint-216/tokenizer_config.json +55 -0
run-1/checkpoint-216/trainer_state.json +62 -0
run-1/checkpoint-216/training_args.bin +3 -0
run-1/checkpoint-216/vocab.txt +0 -0
run-1/checkpoint-270/config.json +25 -0
run-1/checkpoint-270/model.safetensors +3 -0
run-1/checkpoint-270/optimizer.pt +3 -0
run-1/checkpoint-270/rng_state.pth +3 -0
run-1/checkpoint-270/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5e1c3da3a591a75b5098686af3e33bb6d5dbde8de64f9a250c5785b8b676e0e1
+oid sha256:f355ff596fc9a81f9d48fca17727279c1b8e426ea17d864e94ad0fad9e40bae7
 size 267832560

run-0/checkpoint-107/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-0/checkpoint-107/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:09ed21a9b7cf2a1849ecfe79885181e7767655ddeaa05e6abe4341e9b056dba8
+size 267832560

run-0/checkpoint-107/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b99e5b177f8e929c01316f911337489bd6f6c6aad00cd7e839311e305f3b84c
+size 535727290

run-0/checkpoint-107/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae60ce2da9ba95e755793c0257c4f16dc182d10c2ea798817ac92d796dbfa806
+size 14308

run-0/checkpoint-107/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:88927de3756c5716c3890de82ceb0288144c073606e412421fbf9e21f57cf796
+size 1064

run-0/checkpoint-107/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-107/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-107/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-107/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-0/checkpoint-107",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 107,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6291466355323792,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.955,
+      "eval_samples_per_second": 1092.188,
+      "eval_steps_per_second": 69.113,
+      "step": 107
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 107,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 3.448385897205627e-06,
+    "num_train_epochs": 1,
+    "per_device_train_batch_size": 8,
+    "seed": 31
+  }
+}

run-0/checkpoint-107/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:81bd41e7d6266d202b2106105d36818a4d95755e2e776c9fbfaffaf77da124ad
+size 4984

run-0/checkpoint-107/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-108/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-108/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb6055d3fc8ec4f98259c860039d249358d0ce55d76a356257f96bc1f7419990
+size 267832560

run-1/checkpoint-108/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:83fc4756e451ebc73cdfca26dc21b7c04e2f6d87846151f52ce08b4ea15d191f
+size 535727290

run-1/checkpoint-108/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3d2ce677d59bd42c4069fde1f4e20262cfffbc9034e60063a7cb86b37e99e902
+size 14244

run-1/checkpoint-108/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8dd6c246cf2378133e9a0612f058a3b88aefcccc84f7bae72b9c5e5ee21483e
+size 1064

run-1/checkpoint-108/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-108/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-108/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-108/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-54",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6076961159706116,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.914,
+      "eval_samples_per_second": 1141.177,
+      "eval_steps_per_second": 72.213,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5892916321754456,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.1202,
+      "eval_samples_per_second": 931.043,
+      "eval_steps_per_second": 58.915,
+      "step": 108
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 270,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 9.09529636397016e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 16,
+    "seed": 22
+  }
+}

run-1/checkpoint-108/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:29713d6be431df230f39d5c57e20e237737020640e0fc942f5f07ce3fac1960b
+size 4984

run-1/checkpoint-108/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-162/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-162/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce98dbf4dd6997fdb248433d847e33f25ae599bd82067d2d53c2065e98c1cb21
+size 267832560

run-1/checkpoint-162/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af6dff06fc37e7e8d0552936e2595c3ac98abbb71738dfa3ca573170028633b2
+size 535727290

run-1/checkpoint-162/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05cf25a8aac0197f9dd0fc73950ab5ebf0b0120b5a26a3fbb66223702c12946d
+size 14244

run-1/checkpoint-162/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c76a75841f906b92463c679ecefeed0663aafcde16398dffc514b15b668b1927
+size 1064

run-1/checkpoint-162/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-162/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-162/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-162/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.166651669293941,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-162",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 162,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6076961159706116,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.914,
+      "eval_samples_per_second": 1141.177,
+      "eval_steps_per_second": 72.213,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5892916321754456,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.1202,
+      "eval_samples_per_second": 931.043,
+      "eval_steps_per_second": 58.915,
+      "step": 108
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.5696114301681519,
+      "eval_matthews_correlation": 0.166651669293941,
+      "eval_runtime": 1.0426,
+      "eval_samples_per_second": 1000.412,
+      "eval_steps_per_second": 63.305,
+      "step": 162
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 270,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 9.09529636397016e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 16,
+    "seed": 22
+  }
+}

run-1/checkpoint-162/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:29713d6be431df230f39d5c57e20e237737020640e0fc942f5f07ce3fac1960b
+size 4984

run-1/checkpoint-162/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-216/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-216/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:98cea7607ccfa88208fcbd7b91cc2f37bcb8d1fc3032b0c4260a80c1dc4703c4
+size 267832560

run-1/checkpoint-216/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ed9f56e9b1873a6285bdbef325a16dc325ac5ebe9506ef78a037544fd833728
+size 535727290

run-1/checkpoint-216/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b99bd1a1dde66fbd9bfaac8ed2c34fb9bdde5bc7e9c66485be72a23c4b855e0
+size 14244

run-1/checkpoint-216/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b499f5dc423f5a42a59b3da27c9751587620e9743426630b9cf152fd59292d3f
+size 1064

run-1/checkpoint-216/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-216/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-216/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-216/trainer_state.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+  "best_metric": 0.2526248957927519,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-216",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 216,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6076961159706116,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.914,
+      "eval_samples_per_second": 1141.177,
+      "eval_steps_per_second": 72.213,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5892916321754456,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.1202,
+      "eval_samples_per_second": 931.043,
+      "eval_steps_per_second": 58.915,
+      "step": 108
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.5696114301681519,
+      "eval_matthews_correlation": 0.166651669293941,
+      "eval_runtime": 1.0426,
+      "eval_samples_per_second": 1000.412,
+      "eval_steps_per_second": 63.305,
+      "step": 162
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.560063898563385,
+      "eval_matthews_correlation": 0.2526248957927519,
+      "eval_runtime": 1.4859,
+      "eval_samples_per_second": 701.918,
+      "eval_steps_per_second": 44.417,
+      "step": 216
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 270,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 9.09529636397016e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 16,
+    "seed": 22
+  }
+}

run-1/checkpoint-216/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:29713d6be431df230f39d5c57e20e237737020640e0fc942f5f07ce3fac1960b
+size 4984

run-1/checkpoint-216/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-270/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-270/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:643ee05081060a7035cff7c67706cd1d4d9e8e96bb138364f28d5af1ee3262bd
+size 267832560

run-1/checkpoint-270/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc6c9fa382d301bc30025d4feb4bd1ee745bda42dc36d2321ef304e8c47c2aed
+size 535727290

run-1/checkpoint-270/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c19d11d585344ba606d8a3f52d2542cc2301bcb4dd63a6336369906566d51e5c
+size 14244

run-1/checkpoint-270/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3a383de2f751c3be5860ae338eda4849f1505fae0a579c80bb4182ca31d3ecb5
+size 1064