karths commited on
Commit
cc2f852
·
verified ·
1 Parent(s): 76eff90

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ reduced_main_data.csv filter=lfs diff=lfs merge=lfs -text
37
+ test_data_for_future_evaluation.csv filter=lfs diff=lfs merge=lfs -text
38
+ test_top_repo_data.csv filter=lfs diff=lfs merge=lfs -text
39
+ top_repo_data.csv filter=lfs diff=lfs merge=lfs -text
.ipynb_checkpoints/metrics-checkpoint.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"precision": 0.9784045835169678, "recall": 0.9854153455928979, "acc": 0.9821283762709749, "mcc": 0.9642753423345738, "f1": 0.9818974504786276, "auc": 0.9972255251769351}
checkpoint-10020/config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilroberta-base",
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 3072,
15
+ "layer_norm_eps": 1e-05,
16
+ "max_position_embeddings": 514,
17
+ "model_type": "roberta",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 6,
20
+ "pad_token_id": 1,
21
+ "position_embedding_type": "absolute",
22
+ "problem_type": "single_label_classification",
23
+ "torch_dtype": "float32",
24
+ "transformers_version": "4.35.0",
25
+ "type_vocab_size": 1,
26
+ "use_cache": true,
27
+ "vocab_size": 50265
28
+ }
checkpoint-10020/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99d90de7783c499123fe65e335d2cde00dd1a30a1100aef423f0e83cfe1db8a6
3
+ size 328492280
checkpoint-10020/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92cf7d2a0570ddaf4ed1fce57e1b163a5f627b2bdb671321c8cc81aa0da9eb72
3
+ size 657047610
checkpoint-10020/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c132fbab01ba44ae5a4600e89c22e5e82ed9781d053ce7ec542ea0107af78e8a
3
+ size 14244
checkpoint-10020/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71ae05b0103f90146ce39046375ae878319f4c7d09227e8bc0c984a5fcb5bda2
3
+ size 1064
checkpoint-10020/trainer_state.json ADDED
@@ -0,0 +1,139 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 5.0,
5
+ "eval_steps": 500,
6
+ "global_step": 10020,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.25,
13
+ "learning_rate": 4.9800000000000004e-05,
14
+ "loss": 0.0373,
15
+ "step": 500
16
+ },
17
+ {
18
+ "epoch": 0.5,
19
+ "learning_rate": 4.9663165247662615e-05,
20
+ "loss": 0.0614,
21
+ "step": 1000
22
+ },
23
+ {
24
+ "epoch": 0.75,
25
+ "learning_rate": 4.865640637350898e-05,
26
+ "loss": 0.0588,
27
+ "step": 1500
28
+ },
29
+ {
30
+ "epoch": 1.0,
31
+ "learning_rate": 4.700706468751901e-05,
32
+ "loss": 0.0661,
33
+ "step": 2000
34
+ },
35
+ {
36
+ "epoch": 1.25,
37
+ "learning_rate": 4.475994152602118e-05,
38
+ "loss": 0.0515,
39
+ "step": 2500
40
+ },
41
+ {
42
+ "epoch": 1.5,
43
+ "learning_rate": 4.197607586073667e-05,
44
+ "loss": 0.0518,
45
+ "step": 3000
46
+ },
47
+ {
48
+ "epoch": 1.75,
49
+ "learning_rate": 3.8731086287268264e-05,
50
+ "loss": 0.052,
51
+ "step": 3500
52
+ },
53
+ {
54
+ "epoch": 2.0,
55
+ "learning_rate": 3.511311698489561e-05,
56
+ "loss": 0.0506,
57
+ "step": 4000
58
+ },
59
+ {
60
+ "epoch": 2.25,
61
+ "learning_rate": 3.1228433624560175e-05,
62
+ "loss": 0.0383,
63
+ "step": 4500
64
+ },
65
+ {
66
+ "epoch": 2.5,
67
+ "learning_rate": 2.7175240839918063e-05,
68
+ "loss": 0.0409,
69
+ "step": 5000
70
+ },
71
+ {
72
+ "epoch": 2.74,
73
+ "learning_rate": 2.3054972130358894e-05,
74
+ "loss": 0.0372,
75
+ "step": 5500
76
+ },
77
+ {
78
+ "epoch": 2.99,
79
+ "learning_rate": 1.8987536529000545e-05,
80
+ "loss": 0.0349,
81
+ "step": 6000
82
+ },
83
+ {
84
+ "epoch": 3.24,
85
+ "learning_rate": 1.5083418450272521e-05,
86
+ "loss": 0.0246,
87
+ "step": 6500
88
+ },
89
+ {
90
+ "epoch": 3.49,
91
+ "learning_rate": 1.1455599648308674e-05,
92
+ "loss": 0.0232,
93
+ "step": 7000
94
+ },
95
+ {
96
+ "epoch": 3.74,
97
+ "learning_rate": 8.188115868146839e-06,
98
+ "loss": 0.0255,
99
+ "step": 7500
100
+ },
101
+ {
102
+ "epoch": 3.99,
103
+ "learning_rate": 5.377296029546741e-06,
104
+ "loss": 0.0236,
105
+ "step": 8000
106
+ },
107
+ {
108
+ "epoch": 4.24,
109
+ "learning_rate": 3.1034708332441433e-06,
110
+ "loss": 0.0154,
111
+ "step": 8500
112
+ },
113
+ {
114
+ "epoch": 4.49,
115
+ "learning_rate": 1.4193117617159691e-06,
116
+ "loss": 0.0195,
117
+ "step": 9000
118
+ },
119
+ {
120
+ "epoch": 4.74,
121
+ "learning_rate": 3.756787580085019e-07,
122
+ "loss": 0.0224,
123
+ "step": 9500
124
+ },
125
+ {
126
+ "epoch": 4.99,
127
+ "learning_rate": 9.201950512210955e-10,
128
+ "loss": 0.0249,
129
+ "step": 10000
130
+ }
131
+ ],
132
+ "logging_steps": 500,
133
+ "max_steps": 10020,
134
+ "num_train_epochs": 5,
135
+ "save_steps": 500,
136
+ "total_flos": 8.494405705116672e+16,
137
+ "trial_name": null,
138
+ "trial_params": null
139
+ }
checkpoint-10020/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34f5690b2a5603554c13f29c439ae2d9aa25bbf66bfb42a129aa8aa35ad4b2c1
3
+ size 4664
classification_report.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"0": {"precision": 0.9945378666993986, "recall": 0.9946599558065308, "f1-score": 0.994598907506291, "support": 16292}, "1": {"precision": 0.994482496194825, "recall": 0.9943563728598604, "f1-score": 0.9944194305282515, "support": 15770}, "accuracy": 0.9945106356434409, "macro avg": {"precision": 0.9945101814471118, "recall": 0.9945081643331957, "f1-score": 0.9945091690172713, "support": 32062}, "weighted avg": {"precision": 0.9945106321894764, "recall": 0.9945106356434409, "f1-score": 0.9945106300456309, "support": 32062}}
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilroberta-base",
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 3072,
15
+ "layer_norm_eps": 1e-05,
16
+ "max_position_embeddings": 514,
17
+ "model_type": "roberta",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 6,
20
+ "pad_token_id": 1,
21
+ "position_embedding_type": "absolute",
22
+ "problem_type": "single_label_classification",
23
+ "torch_dtype": "float32",
24
+ "transformers_version": "4.35.0",
25
+ "type_vocab_size": 1,
26
+ "use_cache": true,
27
+ "vocab_size": 50265
28
+ }
confusion_matrix.png ADDED
detailed_confusion_matrix.png ADDED
fold_results.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "0": {
3
+ "eval_loss": 0.40148600935935974,
4
+ "eval_precision": 0.8656669790690409,
5
+ "eval_recall": 0.8785111914273033,
6
+ "eval_acc": 0.8731871627732901,
7
+ "eval_mcc": 0.746447037107958,
8
+ "eval_f1": 0.8720417925478348,
9
+ "eval_auc": 0.9394272614942787,
10
+ "eval_runtime": 90.2981,
11
+ "eval_samples_per_second": 355.079,
12
+ "eval_steps_per_second": 5.548,
13
+ "epoch": 5.0
14
+ },
15
+ "1": {
16
+ "eval_loss": 0.2502449154853821,
17
+ "eval_precision": 0.9276957718288716,
18
+ "eval_recall": 0.9405199746353836,
19
+ "eval_acc": 0.9346890399850291,
20
+ "eval_mcc": 0.8694527772027904,
21
+ "eval_f1": 0.934063857925562,
22
+ "eval_auc": 0.9791706185357555,
23
+ "eval_runtime": 92.8544,
24
+ "eval_samples_per_second": 345.293,
25
+ "eval_steps_per_second": 5.396,
26
+ "epoch": 5.0
27
+ },
28
+ "2": {
29
+ "eval_loss": 0.06282494217157364,
30
+ "eval_precision": 0.9808663803990907,
31
+ "eval_recall": 0.9849714648065948,
32
+ "eval_acc": 0.9831576320878298,
33
+ "eval_mcc": 0.9663167846706998,
34
+ "eval_f1": 0.9829146364614314,
35
+ "eval_auc": 0.9976812207025214,
36
+ "eval_runtime": 93.3536,
37
+ "eval_samples_per_second": 343.447,
38
+ "eval_steps_per_second": 5.367,
39
+ "epoch": 5.0
40
+ },
41
+ "3": {
42
+ "eval_loss": 0.031204670667648315,
43
+ "eval_precision": 0.9902593295382669,
44
+ "eval_recall": 0.9927710843373494,
45
+ "eval_acc": 0.9916411951843304,
46
+ "eval_mcc": 0.9832816995905711,
47
+ "eval_f1": 0.9915136162127929,
48
+ "eval_auc": 0.9993127931888565,
49
+ "eval_runtime": 93.9085,
50
+ "eval_samples_per_second": 341.418,
51
+ "eval_steps_per_second": 5.335,
52
+ "epoch": 5.0
53
+ },
54
+ "4": {
55
+ "eval_loss": 0.021965384483337402,
56
+ "eval_precision": 0.994482496194825,
57
+ "eval_recall": 0.9943563728598604,
58
+ "eval_acc": 0.9945106356434409,
59
+ "eval_mcc": 0.9890183457782504,
60
+ "eval_f1": 0.9944194305282515,
61
+ "eval_auc": 0.9996556930812918,
62
+ "eval_runtime": 97.5799,
63
+ "eval_samples_per_second": 328.572,
64
+ "eval_steps_per_second": 5.134,
65
+ "epoch": 5.0
66
+ }
67
+ }
metrics.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"precision": 0.994482496194825, "recall": 0.9943563728598604, "acc": 0.9945106356434409, "mcc": 0.9890183457782504, "f1": 0.9944194305282515, "auc": 0.9996556930812918}
metrics_all_fold.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "precision": [
3
+ 0.8656669790690409,
4
+ 0.9276957718288716,
5
+ 0.9808663803990907,
6
+ 0.9902593295382669,
7
+ 0.994482496194825
8
+ ],
9
+ "recall": [
10
+ 0.8785111914273033,
11
+ 0.9405199746353836,
12
+ 0.9849714648065948,
13
+ 0.9927710843373494,
14
+ 0.9943563728598604
15
+ ],
16
+ "f1": [
17
+ 0.8720417925478348,
18
+ 0.934063857925562,
19
+ 0.9829146364614314,
20
+ 0.9915136162127929,
21
+ 0.9944194305282515
22
+ ],
23
+ "auc": [
24
+ 0.9394272614942787,
25
+ 0.9791706185357555,
26
+ 0.9976812207025214,
27
+ 0.9993127931888565,
28
+ 0.9996556930812918
29
+ ],
30
+ "acc": [
31
+ 0.8731871627732901,
32
+ 0.9346890399850291,
33
+ 0.9831576320878298,
34
+ 0.9916411951843304,
35
+ 0.9945106356434409
36
+ ],
37
+ "mcc": [
38
+ 0.746447037107958,
39
+ 0.8694527772027904,
40
+ 0.9663167846706998,
41
+ 0.9832816995905711,
42
+ 0.9890183457782504
43
+ ]
44
+ }
metrics_ci_bounds.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "precision": {
3
+ "ci_lower": 0.8833738830452595,
4
+ "ci_upper": 1.0202144997667784
5
+ },
6
+ "recall": {
7
+ "ci_lower": 0.8965100687138844,
8
+ "ci_upper": 1.0199419665127125
9
+ },
10
+ "f1": {
11
+ "ci_lower": 0.8899164899500339,
12
+ "ci_upper": 1.0200648435203152
13
+ },
14
+ "auc": {
15
+ "ci_lower": 0.9509560876310184,
16
+ "ci_upper": 1.0151429471700633
17
+ },
18
+ "acc": {
19
+ "ci_lower": 0.8909140788106023,
20
+ "ci_upper": 1.019960187458966
21
+ },
22
+ "mcc": {
23
+ "ci_lower": 0.7819027817722539,
24
+ "ci_upper": 1.0399038759678538
25
+ }
26
+ }
metrics_mean.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "precision": 0.951794191406019,
3
+ "recall": 0.9582260176132984,
4
+ "f1": 0.9549906667351745,
5
+ "auc": 0.9830495174005408,
6
+ "acc": 0.9554371331347842,
7
+ "mcc": 0.9109033288700539
8
+ }
metrics_std.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "precision": 0.05510372247221357,
3
+ "recall": 0.04970422673822744,
4
+ "f1": 0.0524088456130476,
5
+ "auc": 0.02584711308047101,
6
+ "acc": 0.05196498764361626,
7
+ "mcc": 0.10389328134214777
8
+ }
metrics_visualisation.png ADDED
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99d90de7783c499123fe65e335d2cde00dd1a30a1100aef423f0e83cfe1db8a6
3
+ size 328492280
precision_recall_curve.png ADDED
reduced_main_data.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd150f0b5bda48f425f8e1b9f4696b7ea437ff7ecda7e84d25dd31c55c0880f0
3
+ size 849480006
roc_curve.png ADDED
test_data_for_future_evaluation.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:733dfa5955db9e10d260c78dfecbfb7fafc9b6a8d37eeefdf724910a8cb5f224
3
+ size 157560896
test_top_repo_data.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fe77360c0dd488094d463febe66cedd8a64e4d29c9124ab100df829aed41804
3
+ size 50939436
top_repo_data.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:295d7828a30a1ba76e323db3766d15240b86799484e5d4b2f82cd9f1bd394b2c
3
+ size 40098789
tracker_carbon_statistics.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cloud_provider": "",
3
+ "cloud_region": "",
4
+ "codecarbon_version": "2.3.4",
5
+ "country_iso_code": "NOR",
6
+ "country_name": "Norway",
7
+ "cpu_count": 64,
8
+ "cpu_energy": 0.34489881885688994,
9
+ "cpu_model": "AMD EPYC 7282 16-Core Processor",
10
+ "cpu_power": 7.064653799305303,
11
+ "duration": 26893.03911614418,
12
+ "emissions": 0.30508717075751984,
13
+ "emissions_rate": 1.134446610663548e-05,
14
+ "energy_consumed": 11.073944492105984,
15
+ "gpu_count": 8,
16
+ "gpu_energy": 10.0258240095417,
17
+ "gpu_model": "8 x NVIDIA GeForce RTX 2080 Ti",
18
+ "gpu_power": 1448.943161731065,
19
+ "latitude": 59.955,
20
+ "longitude": 10.859,
21
+ "on_cloud": "N",
22
+ "os": "Linux-4.18.0-513.9.1.el8_9.x86_64-x86_64-with-glibc2.28",
23
+ "project_name": "codecarbon",
24
+ "pue": 1.0,
25
+ "python_version": "3.10.8",
26
+ "ram_energy": 0.7032216637073923,
27
+ "ram_power": 94.2059955596924,
28
+ "ram_total_size": 251.2159881591797,
29
+ "region": "oslo county",
30
+ "run_id": "11e5a3b1-897b-4727-953f-800b88c69faa",
31
+ "timestamp": "2024-03-06T21:15:39",
32
+ "tracking_mode": "machine"
33
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34f5690b2a5603554c13f29c439ae2d9aa25bbf66bfb42a129aa8aa35ad4b2c1
3
+ size 4664