Ketskapow committed on Feb 27, 2024

Commit

8eac25f

verified ·

1 Parent(s): 336efba

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-2/checkpoint-108/config.json +25 -0
run-2/checkpoint-108/model.safetensors +3 -0
run-2/checkpoint-108/optimizer.pt +3 -0
run-2/checkpoint-108/rng_state.pth +3 -0
run-2/checkpoint-108/scheduler.pt +3 -0
run-2/checkpoint-108/special_tokens_map.json +7 -0
run-2/checkpoint-108/tokenizer.json +0 -0
run-2/checkpoint-108/tokenizer_config.json +55 -0
run-2/checkpoint-108/trainer_state.json +62 -0
run-2/checkpoint-108/training_args.bin +3 -0
run-2/checkpoint-108/vocab.txt +0 -0
run-2/checkpoint-135/config.json +25 -0
run-2/checkpoint-135/model.safetensors +3 -0
run-2/checkpoint-135/optimizer.pt +3 -0
run-2/checkpoint-135/rng_state.pth +3 -0
run-2/checkpoint-135/scheduler.pt +3 -0
run-2/checkpoint-135/special_tokens_map.json +7 -0
run-2/checkpoint-135/tokenizer.json +0 -0
run-2/checkpoint-135/tokenizer_config.json +55 -0
run-2/checkpoint-135/trainer_state.json +71 -0
run-2/checkpoint-135/training_args.bin +3 -0
run-2/checkpoint-135/vocab.txt +0 -0
run-2/checkpoint-54/config.json +25 -0
run-2/checkpoint-54/model.safetensors +3 -0
run-2/checkpoint-54/optimizer.pt +3 -0
run-2/checkpoint-54/rng_state.pth +3 -0
run-2/checkpoint-54/scheduler.pt +3 -0
run-2/checkpoint-54/special_tokens_map.json +7 -0
run-2/checkpoint-54/tokenizer.json +0 -0
run-2/checkpoint-54/tokenizer_config.json +55 -0
run-2/checkpoint-54/trainer_state.json +44 -0
run-2/checkpoint-54/training_args.bin +3 -0
run-2/checkpoint-54/vocab.txt +0 -0
run-2/checkpoint-81/config.json +25 -0
run-2/checkpoint-81/model.safetensors +3 -0
run-2/checkpoint-81/optimizer.pt +3 -0
run-2/checkpoint-81/rng_state.pth +3 -0
run-2/checkpoint-81/scheduler.pt +3 -0
run-2/checkpoint-81/special_tokens_map.json +7 -0
run-2/checkpoint-81/tokenizer.json +0 -0
run-2/checkpoint-81/tokenizer_config.json +55 -0
run-2/checkpoint-81/trainer_state.json +53 -0
run-2/checkpoint-81/training_args.bin +3 -0
run-2/checkpoint-81/vocab.txt +0 -0
run-3/checkpoint-107/config.json +25 -0
run-3/checkpoint-107/model.safetensors +3 -0
run-3/checkpoint-107/optimizer.pt +3 -0
run-3/checkpoint-107/rng_state.pth +3 -0
run-3/checkpoint-107/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b8deee472ce6e3e49cec781d8bfc5a81c5baf1bf79e35c5e0bfd13bd04d5f4d0
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:dd33315e20753a48156c4b5ca9911a7e161b40165de4ae06f51de6047651f4e6
 size 267832560

run-2/checkpoint-108/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-2/checkpoint-108/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f4dc19ae0c7b7a9d845486a3db052db20c16d119437bb9ea55c549c82ba4f2f7
+size 267832560

run-2/checkpoint-108/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1be5525e05e3985e4294451e98e76c473c04a3b9562cce2f07ab7293022ba5cf
+size 535727290

run-2/checkpoint-108/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8720893faeb5910b9cadcb19362ea1b6e3bbcf3f97d4e196300f0179cc02b3e4
+size 14244

run-2/checkpoint-108/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e7723503fac1c2b099eb41e2a70cac4d83a43f1e9cccc324945284f8905fefa
+size 1064

run-2/checkpoint-108/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-108/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-108/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-108/trainer_state.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-27",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6264488101005554,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6569,
+      "eval_samples_per_second": 1587.713,
+      "eval_steps_per_second": 100.469,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6097051501274109,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7593,
+      "eval_samples_per_second": 1373.638,
+      "eval_steps_per_second": 86.922,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6055334210395813,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8173,
+      "eval_samples_per_second": 1276.145,
+      "eval_steps_per_second": 80.753,
+      "step": 81
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.6017194986343384,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.2717,
+      "eval_samples_per_second": 820.151,
+      "eval_steps_per_second": 51.898,
+      "step": 108
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.353880316087167e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 28
+  }
+}

run-2/checkpoint-108/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:059fd4cccb177cdca68b068259e862fe24d5b192bc059dcf9ddce2eba92ffc29
+size 4984

run-2/checkpoint-108/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-135/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-2/checkpoint-135/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a69d3b71d719020c27abe81b1c3d39cfe1c8c2817e889751cb69227a1b49ec93
+size 267832560

run-2/checkpoint-135/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c7ba735d4de8dda4c0372b605388c2acb45d2e95cad8716368d2a2a146464ac2
+size 535727290

run-2/checkpoint-135/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:23124014005741d882f55bac3d0ec9b746480d8336163f6a688402dcc2e2820a
+size 14244

run-2/checkpoint-135/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:135cfd3992e2536629303784c08fbf74ee8a3a670c8eda2a7cb16d72a7147c5c
+size 1064

run-2/checkpoint-135/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-135/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-135/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-135/trainer_state.json ADDED Viewed

	@@ -0,0 +1,71 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-27",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 135,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6264488101005554,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6569,
+      "eval_samples_per_second": 1587.713,
+      "eval_steps_per_second": 100.469,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6097051501274109,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7593,
+      "eval_samples_per_second": 1373.638,
+      "eval_steps_per_second": 86.922,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6055334210395813,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8173,
+      "eval_samples_per_second": 1276.145,
+      "eval_steps_per_second": 80.753,
+      "step": 81
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.6017194986343384,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.2717,
+      "eval_samples_per_second": 820.151,
+      "eval_steps_per_second": 51.898,
+      "step": 108
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 0.6001049280166626,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8391,
+      "eval_samples_per_second": 1242.978,
+      "eval_steps_per_second": 78.654,
+      "step": 135
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.353880316087167e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 28
+  }
+}

run-2/checkpoint-135/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:059fd4cccb177cdca68b068259e862fe24d5b192bc059dcf9ddce2eba92ffc29
+size 4984

run-2/checkpoint-135/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-54/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-2/checkpoint-54/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:358c1c21c443e853728f6b68f2f00534f184ff7ba6765e6be0c16fd88d71e75e
+size 267832560

run-2/checkpoint-54/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:63b557026924fed71ae2eaa2233670a352052eacc6eed3390b732c38b7e1e634
+size 535727290

run-2/checkpoint-54/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2348d7fff7c830edffb2a9f154ad55ae9aecd9f3ed73186a348881c124fe520a
+size 14244

run-2/checkpoint-54/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba90b776a03a8fe70bd88e29c71b2c94b8cb5a1034eb586c9a554628fcee1a08
+size 1064

run-2/checkpoint-54/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-54/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-54/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-54/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-27",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 54,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6264488101005554,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6569,
+      "eval_samples_per_second": 1587.713,
+      "eval_steps_per_second": 100.469,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6097051501274109,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7593,
+      "eval_samples_per_second": 1373.638,
+      "eval_steps_per_second": 86.922,
+      "step": 54
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.353880316087167e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 28
+  }
+}

run-2/checkpoint-54/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:059fd4cccb177cdca68b068259e862fe24d5b192bc059dcf9ddce2eba92ffc29
+size 4984

run-2/checkpoint-54/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-81/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-2/checkpoint-81/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d38223e026bd4f9a1c547c60dec6a4dde1cfddc0ad8861073a96333a8613471
+size 267832560

run-2/checkpoint-81/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e116826755d4c812b7c9b9f526f74c37704f3a0deda24fb2661e919ac5f6feba
+size 535727290

run-2/checkpoint-81/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b3d8103bea79fb312a24d01bb80ccb792bf9b8fa683bd27356dda467a2ade7b9
+size 14244

run-2/checkpoint-81/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cdcff0c87bcdd09dcccada1dbf73b48f49ada1817cb5c4a8890fe4e09df3e617
+size 1064

run-2/checkpoint-81/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-81/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-2/checkpoint-81/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-2/checkpoint-81/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-27",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 81,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6264488101005554,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6569,
+      "eval_samples_per_second": 1587.713,
+      "eval_steps_per_second": 100.469,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6097051501274109,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7593,
+      "eval_samples_per_second": 1373.638,
+      "eval_steps_per_second": 86.922,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6055334210395813,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8173,
+      "eval_samples_per_second": 1276.145,
+      "eval_steps_per_second": 80.753,
+      "step": 81
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.353880316087167e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 28
+  }
+}

run-2/checkpoint-81/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:059fd4cccb177cdca68b068259e862fe24d5b192bc059dcf9ddce2eba92ffc29
+size 4984

run-2/checkpoint-81/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-107/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-3/checkpoint-107/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dd33315e20753a48156c4b5ca9911a7e161b40165de4ae06f51de6047651f4e6
+size 267832560

run-3/checkpoint-107/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d132dc2c42c54d336bb4d3997f7e4fa36ed407a304a4996015680a2c461d24ee
+size 535727290

run-3/checkpoint-107/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0549744415698587554a12729889f2e2aff830dbfad0e8334e915f483edb4408
+size 14308

run-3/checkpoint-107/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0b3275e2f9e76fffdedec55e18f47a3699ef5ad69a11670e311851e1f9e3246
+size 1064