Giuggiola01 committed on Feb 27, 2024

Commit

4a2065d

verified ·

1 Parent(s): db8fdc9

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-8/checkpoint-27/config.json +25 -0
run-8/checkpoint-27/model.safetensors +3 -0
run-8/checkpoint-27/optimizer.pt +3 -0
run-8/checkpoint-27/rng_state.pth +3 -0
run-8/checkpoint-27/scheduler.pt +3 -0
run-8/checkpoint-27/special_tokens_map.json +7 -0
run-8/checkpoint-27/tokenizer.json +0 -0
run-8/checkpoint-27/tokenizer_config.json +55 -0
run-8/checkpoint-27/trainer_state.json +35 -0
run-8/checkpoint-27/training_args.bin +3 -0
run-8/checkpoint-27/vocab.txt +0 -0
run-8/checkpoint-54/config.json +25 -0
run-8/checkpoint-54/model.safetensors +3 -0
run-8/checkpoint-54/optimizer.pt +3 -0
run-8/checkpoint-54/rng_state.pth +3 -0
run-8/checkpoint-54/scheduler.pt +3 -0
run-8/checkpoint-54/special_tokens_map.json +7 -0
run-8/checkpoint-54/tokenizer.json +0 -0
run-8/checkpoint-54/tokenizer_config.json +55 -0
run-8/checkpoint-54/trainer_state.json +44 -0
run-8/checkpoint-54/training_args.bin +3 -0
run-8/checkpoint-54/vocab.txt +0 -0
run-8/checkpoint-81/config.json +25 -0
run-8/checkpoint-81/model.safetensors +3 -0
run-8/checkpoint-81/optimizer.pt +3 -0
run-8/checkpoint-81/rng_state.pth +3 -0
run-8/checkpoint-81/scheduler.pt +3 -0
run-8/checkpoint-81/special_tokens_map.json +7 -0
run-8/checkpoint-81/tokenizer.json +0 -0
run-8/checkpoint-81/tokenizer_config.json +55 -0
run-8/checkpoint-81/trainer_state.json +53 -0
run-8/checkpoint-81/training_args.bin +3 -0
run-8/checkpoint-81/vocab.txt +0 -0
run-9/checkpoint-107/config.json +25 -0
run-9/checkpoint-107/model.safetensors +3 -0
run-9/checkpoint-107/optimizer.pt +3 -0
run-9/checkpoint-107/rng_state.pth +3 -0
run-9/checkpoint-107/scheduler.pt +3 -0
run-9/checkpoint-107/special_tokens_map.json +7 -0
run-9/checkpoint-107/tokenizer.json +0 -0
run-9/checkpoint-107/tokenizer_config.json +55 -0
run-9/checkpoint-107/trainer_state.json +35 -0
run-9/checkpoint-107/training_args.bin +3 -0
run-9/checkpoint-107/vocab.txt +0 -0
run-9/checkpoint-214/config.json +25 -0
run-9/checkpoint-214/model.safetensors +3 -0
run-9/checkpoint-214/optimizer.pt +3 -0
run-9/checkpoint-214/rng_state.pth +3 -0
run-9/checkpoint-214/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2276b502049a0d228d4b06fde1aabe8cf0ae06ea964fe4de57d2d59f015fafdb
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:381cb647ef8dadaf274186a4b1150150019bf4448b65ce08a309ed951bec1b86
 size 267832560

run-8/checkpoint-27/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-27/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2276b502049a0d228d4b06fde1aabe8cf0ae06ea964fe4de57d2d59f015fafdb
+size 267832560

run-8/checkpoint-27/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d682dcbde0d58fe1000061e1d347c0c95070ac02e85dbf00893be5b822cc43e
+size 535727290

run-8/checkpoint-27/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b8e486b82d9e5a71534855b4989950ca0b17177948b4eda3745bac0c1777272
+size 14308

run-8/checkpoint-27/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:76a30ab42475947d07712f216f8244174741df1c6d9895638f8082c69588f4b1
+size 1064

run-8/checkpoint-27/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-27/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-27/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-27/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-8/checkpoint-27",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 27,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.622395932674408,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6723,
+      "eval_samples_per_second": 1551.349,
+      "eval_steps_per_second": 98.168,
+      "step": 27
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 108,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.716893541073549e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 32,
+    "seed": 20
+  }
+}

run-8/checkpoint-27/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45fd68445069e30b290c5af6065d8fd22e468e5e8945b0eaa85f15558fe70016
+size 4984

run-8/checkpoint-27/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-54/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-54/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8dbfb812157b3e82849329b6fe940efd4d3b692ee7f489ca50c2438d48871765
+size 267832560

run-8/checkpoint-54/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4329447ec8ad94062a6bcacc236764ed478e7d24bee5055c164d2a7cb9ea264e
+size 535727290

run-8/checkpoint-54/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:85b36d552082927e50869fa7eba654290e96868e4bfadf94a894f0fffdbaf411
+size 14308

run-8/checkpoint-54/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5734ea36426dae22fa3b299d1323cc9fec018ba7f4e4fd3f0eb194de01d3845
+size 1064

run-8/checkpoint-54/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-54/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-54/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-54/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-8/checkpoint-27",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 54,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.622395932674408,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6723,
+      "eval_samples_per_second": 1551.349,
+      "eval_steps_per_second": 98.168,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6130136251449585,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7457,
+      "eval_samples_per_second": 1398.708,
+      "eval_steps_per_second": 88.509,
+      "step": 54
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 108,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.716893541073549e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 32,
+    "seed": 20
+  }
+}

run-8/checkpoint-54/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45fd68445069e30b290c5af6065d8fd22e468e5e8945b0eaa85f15558fe70016
+size 4984

run-8/checkpoint-54/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-81/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-81/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d0337953a2c6d433b6b0be35fc0d4b045ec0803352e0226a2b397d0869702bf
+size 267832560

run-8/checkpoint-81/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:420de3f76f0daa50d6f250ffb521cebcf35c8d1bbe6dce3dfc8c29ffc9a22a8b
+size 535727290

run-8/checkpoint-81/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b6a2bc696ed7a65c1ad830cca06e9af3f74135015a23a231df5a8e1e34e694b
+size 14308

run-8/checkpoint-81/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af45754e223f2814dfa355d0ab2f37e6ca778c870ee9fe6c357a1adefebfd31c
+size 1064

run-8/checkpoint-81/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-81/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-81/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-81/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-8/checkpoint-27",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 81,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.622395932674408,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.6723,
+      "eval_samples_per_second": 1551.349,
+      "eval_steps_per_second": 98.168,
+      "step": 27
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.6130136251449585,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7457,
+      "eval_samples_per_second": 1398.708,
+      "eval_steps_per_second": 88.509,
+      "step": 54
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6108205914497375,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7728,
+      "eval_samples_per_second": 1349.582,
+      "eval_steps_per_second": 85.4,
+      "step": 81
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 108,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.716893541073549e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 32,
+    "seed": 20
+  }
+}

run-8/checkpoint-81/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45fd68445069e30b290c5af6065d8fd22e468e5e8945b0eaa85f15558fe70016
+size 4984

run-8/checkpoint-81/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-107/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-9/checkpoint-107/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0559a41e986081deae4f5581fda6ae1e817455c538eac8d7f83d5dc9086808e6
+size 267832560

run-9/checkpoint-107/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f4b57cd3dcddde54a449033b2db40f430352a9372b626cdf96ed7e14c3a22005
+size 535727290

run-9/checkpoint-107/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bfb94873fa199915815b7d83a6afcf4acb49af3d50a6d9f72d37a4953a5d280a
+size 14244

run-9/checkpoint-107/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1e589f46d38b59dc7ed14e0ec7514f89e668eee9c1f16a0b9518ba3be275e54
+size 1064

run-9/checkpoint-107/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-9/checkpoint-107/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-107/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-9/checkpoint-107/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-9/checkpoint-107",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 107,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6132326722145081,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7729,
+      "eval_samples_per_second": 1349.484,
+      "eval_steps_per_second": 85.394,
+      "step": 107
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 535,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.449575308916878e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 8,
+    "seed": 15
+  }
+}

run-9/checkpoint-107/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aed8e32d7e9953112fac8fdf2d7d0c0dc0f2976a4718254130f97899a224be9e
+size 4984

run-9/checkpoint-107/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-9/checkpoint-214/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-9/checkpoint-214/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aecdb0d1282dfb4bd507854fddd894e09f286607f04a946efa7d0a389a672c96
+size 267832560

run-9/checkpoint-214/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d456e847532bded590fe09a6c9f53df26cd825e624f24cb7e5f02eb9302dc1b
+size 535727290

run-9/checkpoint-214/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e260ec975c5f37197eacb4243085613838921f0d66370e91a2969f7119e30755
+size 14244

run-9/checkpoint-214/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c57eee128ceffe9df8e8f3ec04ba9de497b87342b4de370abdbe669cecdc9a9a
+size 1064