roselin624 committed on Feb 27, 2024

Commit

cc4ebf5

verified ·

1 Parent(s): 0cce2e2

Training in progress, epoch 1

Browse files

Files changed (47) hide show

model.safetensors +1 -1
run-6/checkpoint-428/config.json +25 -0
run-6/checkpoint-428/model.safetensors +3 -0
run-6/checkpoint-428/optimizer.pt +3 -0
run-6/checkpoint-428/rng_state.pth +3 -0
run-6/checkpoint-428/scheduler.pt +3 -0
run-6/checkpoint-428/special_tokens_map.json +7 -0
run-6/checkpoint-428/tokenizer.json +0 -0
run-6/checkpoint-428/tokenizer_config.json +55 -0
run-6/checkpoint-428/trainer_state.json +44 -0
run-6/checkpoint-428/training_args.bin +3 -0
run-6/checkpoint-428/vocab.txt +0 -0
run-6/checkpoint-642/config.json +25 -0
run-6/checkpoint-642/model.safetensors +3 -0
run-6/checkpoint-642/optimizer.pt +3 -0
run-6/checkpoint-642/rng_state.pth +3 -0
run-6/checkpoint-642/scheduler.pt +3 -0
run-6/checkpoint-642/special_tokens_map.json +7 -0
run-6/checkpoint-642/tokenizer.json +0 -0
run-6/checkpoint-642/tokenizer_config.json +55 -0
run-6/checkpoint-642/trainer_state.json +60 -0
run-6/checkpoint-642/training_args.bin +3 -0
run-6/checkpoint-642/vocab.txt +0 -0
run-6/checkpoint-856/config.json +25 -0
run-6/checkpoint-856/model.safetensors +3 -0
run-6/checkpoint-856/optimizer.pt +3 -0
run-6/checkpoint-856/rng_state.pth +3 -0
run-6/checkpoint-856/scheduler.pt +3 -0
run-6/checkpoint-856/special_tokens_map.json +7 -0
run-6/checkpoint-856/tokenizer.json +0 -0
run-6/checkpoint-856/tokenizer_config.json +55 -0
run-6/checkpoint-856/trainer_state.json +69 -0
run-6/checkpoint-856/training_args.bin +3 -0
run-6/checkpoint-856/vocab.txt +0 -0
run-7/checkpoint-54/config.json +25 -0
run-7/checkpoint-54/model.safetensors +3 -0
run-7/checkpoint-54/optimizer.pt +3 -0
run-7/checkpoint-54/rng_state.pth +3 -0
run-7/checkpoint-54/scheduler.pt +3 -0
run-7/checkpoint-54/special_tokens_map.json +7 -0
run-7/checkpoint-54/tokenizer.json +0 -0
run-7/checkpoint-54/tokenizer_config.json +55 -0
run-7/checkpoint-54/trainer_state.json +35 -0
run-7/checkpoint-54/training_args.bin +3 -0
run-7/checkpoint-54/vocab.txt +0 -0
runs/Feb27_13-15-48_39d530476097/events.out.tfevents.1709040817.39d530476097.262.9 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5f46306980485a24e1bcbecc2fa6ac02eb17d5c03c133a35d228f6e679525890
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:b75ef795694a37c59eabe5580c8f71587d7bdb179153ffc025570cec3117e5a9
 size 267832560

run-6/checkpoint-428/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-428/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1fda3000c0f0c4dbad0e89d91cbcddbdd599440608bd60aac0746f91a548ceb0
+size 267832560

run-6/checkpoint-428/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c30ef724e816348d7cc7c86215bc301505819124e7d8c560ccfb8f9cf96b193a
+size 535727290

run-6/checkpoint-428/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a278725aaf4e54f71a409ba78aeff1b2947efa64196ea5116a194139c68354b3
+size 14244

run-6/checkpoint-428/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f212f273a473faf9d1b58bc285d36fc70c95a9ff961ccae9af7d5e4ee4b0d466
+size 1064

run-6/checkpoint-428/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-428/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-428/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-428/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.34961118667417307,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-428",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 428,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5753337144851685,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8051,
+      "eval_samples_per_second": 1295.46,
+      "eval_steps_per_second": 81.975,
+      "step": 214
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.9604573845863342,
+      "eval_matthews_correlation": 0.34961118667417307,
+      "eval_runtime": 0.8196,
+      "eval_samples_per_second": 1272.52,
+      "eval_steps_per_second": 80.524,
+      "step": 428
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 856,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 4,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.9787103114124418e-05,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 4,
+    "seed": 3
+  }
+}

run-6/checkpoint-428/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a9504c5644b56cf93b547ad904a324fb2bc6e2035d6ddaf8db9fbd75b342bb81
+size 4984

run-6/checkpoint-428/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-642/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-642/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ebe3a8560c557b7cd6db3db363a73529f88b5704114d77f25224337e9a2027b1
+size 267832560

run-6/checkpoint-642/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d6fa6cfb42201b4487b392a7280dd57a6a0b414e042f22e2d9f3dca6daac7ccc
+size 535727290

run-6/checkpoint-642/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:880cbbd4ee9a37d0a2481d7c7e3ddb60bef262dceefa725c0a4001919a2f05b9
+size 14244

run-6/checkpoint-642/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3610d5fe36268bf38cd44575c650841bd8d9887c5050d6c34fa368c9224ff547
+size 1064

run-6/checkpoint-642/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-642/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-642/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-642/trainer_state.json ADDED Viewed

	@@ -0,0 +1,60 @@

+{
+  "best_metric": 0.34961118667417307,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-428",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 642,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5753337144851685,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8051,
+      "eval_samples_per_second": 1295.46,
+      "eval_steps_per_second": 81.975,
+      "step": 214
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.9604573845863342,
+      "eval_matthews_correlation": 0.34961118667417307,
+      "eval_runtime": 0.8196,
+      "eval_samples_per_second": 1272.52,
+      "eval_steps_per_second": 80.524,
+      "step": 428
+    },
+    {
+      "epoch": 2.34,
+      "grad_norm": 0.07748567312955856,
+      "learning_rate": 1.2388094285780715e-05,
+      "loss": 0.4545,
+      "step": 500
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 1.357472538948059,
+      "eval_matthews_correlation": 0.3460476883865242,
+      "eval_runtime": 0.7909,
+      "eval_samples_per_second": 1318.692,
+      "eval_steps_per_second": 83.446,
+      "step": 642
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 856,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 8290337607684.0,
+  "train_batch_size": 4,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.9787103114124418e-05,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 4,
+    "seed": 3
+  }
+}

run-6/checkpoint-642/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a9504c5644b56cf93b547ad904a324fb2bc6e2035d6ddaf8db9fbd75b342bb81
+size 4984

run-6/checkpoint-642/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-856/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-856/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f99aedd7b02c7a465bbb94f53f587beb82fefd6de9800054b9beaf1b2e736355
+size 267832560

run-6/checkpoint-856/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2e85dfff803b336a6739033b7c1afaa836e05aa5cbf6588e39e534a0298a1f1
+size 535727290

run-6/checkpoint-856/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8557d838cf1cf3c6170446e3e2e33fdc4a0ba1e9361c7c2511e366cb4cdd194e
+size 14244

run-6/checkpoint-856/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be7d2c748e355c5aa26815a15844d7fae22f018f780cc0b3005e077de5e5f448
+size 1064

run-6/checkpoint-856/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-856/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-856/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-856/trainer_state.json ADDED Viewed

	@@ -0,0 +1,69 @@

+{
+  "best_metric": 0.34961118667417307,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-428",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 856,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5753337144851685,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8051,
+      "eval_samples_per_second": 1295.46,
+      "eval_steps_per_second": 81.975,
+      "step": 214
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.9604573845863342,
+      "eval_matthews_correlation": 0.34961118667417307,
+      "eval_runtime": 0.8196,
+      "eval_samples_per_second": 1272.52,
+      "eval_steps_per_second": 80.524,
+      "step": 428
+    },
+    {
+      "epoch": 2.34,
+      "grad_norm": 0.07748567312955856,
+      "learning_rate": 1.2388094285780715e-05,
+      "loss": 0.4545,
+      "step": 500
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 1.357472538948059,
+      "eval_matthews_correlation": 0.3460476883865242,
+      "eval_runtime": 0.7909,
+      "eval_samples_per_second": 1318.692,
+      "eval_steps_per_second": 83.446,
+      "step": 642
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 1.4549368619918823,
+      "eval_matthews_correlation": 0.3379901852286027,
+      "eval_runtime": 0.7695,
+      "eval_samples_per_second": 1355.398,
+      "eval_steps_per_second": 85.768,
+      "step": 856
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 856,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 8290337607684.0,
+  "train_batch_size": 4,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.9787103114124418e-05,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 4,
+    "seed": 3
+  }
+}

run-6/checkpoint-856/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a9504c5644b56cf93b547ad904a324fb2bc6e2035d6ddaf8db9fbd75b342bb81
+size 4984

run-6/checkpoint-856/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-7/checkpoint-54/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-7/checkpoint-54/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b75ef795694a37c59eabe5580c8f71587d7bdb179153ffc025570cec3117e5a9
+size 267832560

run-7/checkpoint-54/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7e91f786af04c468c0fc1bc05ebd5acb9537a7c3469ccc1f961388744b3d251
+size 535727290

run-7/checkpoint-54/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba6b6d8d1d9bdee7bf391f048bf0d8303b659b05bcfce0760fc9b4c4fc32d57a
+size 14308

run-7/checkpoint-54/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e8553307b043d8c2b238f4837561e55aea68c58c8310f01271c94cbef2b416bf
+size 1064

run-7/checkpoint-54/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-7/checkpoint-54/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-7/checkpoint-54/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-7/checkpoint-54/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-7/checkpoint-54",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 54,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.586409866809845,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7287,
+      "eval_samples_per_second": 1431.276,
+      "eval_steps_per_second": 90.57,
+      "step": 54
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 162,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.7959735372448385e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 16,
+    "seed": 20
+  }
+}

run-7/checkpoint-54/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:efd55c91aeb42289c4cefe7204fc1209bf65261be738db6a48600ffc171c38ba
+size 4984

run-7/checkpoint-54/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Feb27_13-15-48_39d530476097/events.out.tfevents.1709040817.39d530476097.262.9 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c37e76076710e0d8808117853b088f2560bcea2a5882cbc315f5d29c769d246c
+size 5890

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9504c5644b56cf93b547ad904a324fb2bc6e2035d6ddaf8db9fbd75b342bb81
 size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:efd55c91aeb42289c4cefe7204fc1209bf65261be738db6a48600ffc171c38ba
 size 4984