[FashionMNIST] 20250825-011246 | best_acc=0.9221
Browse files
- .gitattributes +11 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/README.md +10 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/config.json +41 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/history.csv +11 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/history.json +110 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/manifest.json +43 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/accuracy.png +0 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/best_confusion_fashionmnist_epoch_9.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/best_confusion_mnist_epoch_10.png +0 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_1.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_10.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_2.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_3.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_4.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_5.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_6.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_7.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_8.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_9.png +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/lambda.png +0 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/loss_components.png +0 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/tensorboard/events.out.tfevents.1756083900.5def8ea04e29.2559.1 +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/tensorboard_events.zip +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/weights/constellation_FashionMNIST.safetensors +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/weights/diagnostic_head_FashionMNIST.safetensors +3 -0
- sweep/FashionMNIST/20250825-011246_FashionMNIST/weights/encoder_FashionMNIST.safetensors +3 -0
.gitattributes
CHANGED
@@ -537,3 +537,14 @@ sweep/TissueMNIST/20250817-150543_TissueMNIST/plots/confusion_epoch_6.png filter
|
|
537 |
sweep/TissueMNIST/20250817-150543_TissueMNIST/plots/confusion_epoch_7.png filter=lfs diff=lfs merge=lfs -text
|
538 |
sweep/TissueMNIST/20250817-150543_TissueMNIST/plots/confusion_epoch_8.png filter=lfs diff=lfs merge=lfs -text
|
539 |
sweep/TissueMNIST/20250817-150543_TissueMNIST/plots/confusion_epoch_9.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
537 |
sweep/TissueMNIST/20250817-150543_TissueMNIST/plots/confusion_epoch_7.png filter=lfs diff=lfs merge=lfs -text
|
538 |
sweep/TissueMNIST/20250817-150543_TissueMNIST/plots/confusion_epoch_8.png filter=lfs diff=lfs merge=lfs -text
|
539 |
sweep/TissueMNIST/20250817-150543_TissueMNIST/plots/confusion_epoch_9.png filter=lfs diff=lfs merge=lfs -text
|
540 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/best_confusion_fashionmnist_epoch_9.png filter=lfs diff=lfs merge=lfs -text
|
541 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_1.png filter=lfs diff=lfs merge=lfs -text
|
542 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_10.png filter=lfs diff=lfs merge=lfs -text
|
543 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_2.png filter=lfs diff=lfs merge=lfs -text
|
544 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_3.png filter=lfs diff=lfs merge=lfs -text
|
545 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_4.png filter=lfs diff=lfs merge=lfs -text
|
546 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_5.png filter=lfs diff=lfs merge=lfs -text
|
547 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_6.png filter=lfs diff=lfs merge=lfs -text
|
548 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_7.png filter=lfs diff=lfs merge=lfs -text
|
549 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_8.png filter=lfs diff=lfs merge=lfs -text
|
550 |
+
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_9.png filter=lfs diff=lfs merge=lfs -text
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/README.md
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Pentachora Adaptive Encoded — 20250825-011246
|
2 |
+
|
3 |
+
**Dataset:** FashionMNIST
|
4 |
+
|
5 |
+
**Contents**
|
6 |
+
- `weights/*.safetensors` — encoder, constellation, diagnostic head
|
7 |
+
- `config.json` (hyperparameters), `manifest.json` (class names, environment, parameter counts, best result)
|
8 |
+
- `history.json` / `history.csv` — per-epoch loss, accuracy, loss components, and λ
|
9 |
+
- `tensorboard/` (and `tensorboard_events.zip`)
|
10 |
+
- `plots/` — accuracy, loss components, λ, and per-epoch confusion matrices
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"augment": false,
|
3 |
+
"base_dim": 56,
|
4 |
+
"batch_size": 1024,
|
5 |
+
"channels": 24,
|
6 |
+
"dataset": "all",
|
7 |
+
"deterministic": true,
|
8 |
+
"deterministic_cublas": false,
|
9 |
+
"epochs": 10,
|
10 |
+
"hf_dataset_dir_template": "{dataset}",
|
11 |
+
"hf_preserve_case": true,
|
12 |
+
"hf_repo_id": "AbstractPhil/pentachora-multi-channel-frequency-encoded",
|
13 |
+
"hf_run_dir_template": "{ts}_{dataset}",
|
14 |
+
"hf_subdir_root": "sweep",
|
15 |
+
"hf_weight_suffix_dataset": true,
|
16 |
+
"img_channels": "auto",
|
17 |
+
"img_size": 28,
|
18 |
+
"input_channels": 1,
|
19 |
+
"input_dim": 784,
|
20 |
+
"lambda_separation": 0.391,
|
21 |
+
"loss_weight_scalar": 0.1,
|
22 |
+
"lr": 0.001,
|
23 |
+
"normalize": true,
|
24 |
+
"note": "",
|
25 |
+
"num_classes": 10,
|
26 |
+
"num_heads": 2,
|
27 |
+
"num_pentachoron_pairs": 2,
|
28 |
+
"per_dataset_norm": true,
|
29 |
+
"proj_dim": null,
|
30 |
+
"seed": 420,
|
31 |
+
"seed_per_dataset": false,
|
32 |
+
"strict_determinism": false,
|
33 |
+
"sweep_all": true,
|
34 |
+
"temp": 0.7,
|
35 |
+
"w_ce": 1.0,
|
36 |
+
"w_diag": 0.1,
|
37 |
+
"w_dual": 1.0,
|
38 |
+
"w_reg": 0.1,
|
39 |
+
"w_rose": 1.0,
|
40 |
+
"weight_decay": 1e-05
|
41 |
+
}
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/history.csv
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,train_loss,train_acc,test_acc,ce,dual,rose,diag,reg,lambda
|
2 |
+
1,4.662385488891601,0.59835,0.7719,1.9785473901748658,1.8497433572133382,0.5892192542552948,0.07983070080081622,2.3689250661214194,0.5043014883995056
|
3 |
+
2,3.7564958925882976,0.8505166666666667,0.8896,1.565934888712565,1.4954850419362387,0.40166557857195534,0.0238164808511734,2.910287418238322,0.5069479942321777
|
4 |
+
3,3.325700936381022,0.8887,0.8979,1.2466032598495485,1.4120547097524008,0.3714123874505361,0.020961436926325162,2.93534427541097,0.5084181427955627
|
5 |
+
4,2.9968503290812176,0.90355,0.9012,0.9974395618756612,1.3524139944076539,0.3489980826218923,0.01853677656153838,2.9614501026153564,0.5098332762718201
|
6 |
+
5,2.7574253098805745,0.9175333333333333,0.9121,0.8169807472229004,1.30816054242452,0.33249259441693624,0.016885942601164182,2.981028149795532,0.510604977607727
|
7 |
+
6,2.591482035191854,0.9277166666666666,0.9108,0.6980444258054097,1.2731985834757487,0.31907119736671447,0.015362284584840138,2.9963161769866944,0.5103619694709778
|
8 |
+
7,2.485234659957886,0.9347166666666666,0.9155,0.623532309659322,1.2497626927693686,0.3098507282098134,0.01439392692397038,3.0064952751159666,0.5105664134025574
|
9 |
+
8,2.407597166442871,0.9402333333333334,0.9186,0.5720466683387756,1.2312851296742757,0.3016748560587565,0.013311736539502938,3.01259345703125,0.510155439376831
|
10 |
+
9,2.3616587618509928,0.94515,0.9221,0.5468409752209982,1.2169182946523032,0.2950767196337382,0.012588130690157413,3.01563954111735,0.5101481676101685
|
11 |
+
10,2.331696878941854,0.9490333333333333,0.922,0.5308913292249043,1.2070914285024008,0.290820267645518,0.011975013341506323,3.016963645807902,0.5100754499435425
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/history.json
ADDED
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ce": [
|
3 |
+
1.9785473901748658,
|
4 |
+
1.565934888712565,
|
5 |
+
1.2466032598495485,
|
6 |
+
0.9974395618756612,
|
7 |
+
0.8169807472229004,
|
8 |
+
0.6980444258054097,
|
9 |
+
0.623532309659322,
|
10 |
+
0.5720466683387756,
|
11 |
+
0.5468409752209982,
|
12 |
+
0.5308913292249043
|
13 |
+
],
|
14 |
+
"diag": [
|
15 |
+
0.07983070080081622,
|
16 |
+
0.0238164808511734,
|
17 |
+
0.020961436926325162,
|
18 |
+
0.01853677656153838,
|
19 |
+
0.016885942601164182,
|
20 |
+
0.015362284584840138,
|
21 |
+
0.01439392692397038,
|
22 |
+
0.013311736539502938,
|
23 |
+
0.012588130690157413,
|
24 |
+
0.011975013341506323
|
25 |
+
],
|
26 |
+
"dual": [
|
27 |
+
1.8497433572133382,
|
28 |
+
1.4954850419362387,
|
29 |
+
1.4120547097524008,
|
30 |
+
1.3524139944076539,
|
31 |
+
1.30816054242452,
|
32 |
+
1.2731985834757487,
|
33 |
+
1.2497626927693686,
|
34 |
+
1.2312851296742757,
|
35 |
+
1.2169182946523032,
|
36 |
+
1.2070914285024008
|
37 |
+
],
|
38 |
+
"lambda": [
|
39 |
+
0.5043014883995056,
|
40 |
+
0.5069479942321777,
|
41 |
+
0.5084181427955627,
|
42 |
+
0.5098332762718201,
|
43 |
+
0.510604977607727,
|
44 |
+
0.5103619694709778,
|
45 |
+
0.5105664134025574,
|
46 |
+
0.510155439376831,
|
47 |
+
0.5101481676101685,
|
48 |
+
0.5100754499435425
|
49 |
+
],
|
50 |
+
"reg": [
|
51 |
+
2.3689250661214194,
|
52 |
+
2.910287418238322,
|
53 |
+
2.93534427541097,
|
54 |
+
2.9614501026153564,
|
55 |
+
2.981028149795532,
|
56 |
+
2.9963161769866944,
|
57 |
+
3.0064952751159666,
|
58 |
+
3.01259345703125,
|
59 |
+
3.01563954111735,
|
60 |
+
3.016963645807902
|
61 |
+
],
|
62 |
+
"rose": [
|
63 |
+
0.5892192542552948,
|
64 |
+
0.40166557857195534,
|
65 |
+
0.3714123874505361,
|
66 |
+
0.3489980826218923,
|
67 |
+
0.33249259441693624,
|
68 |
+
0.31907119736671447,
|
69 |
+
0.3098507282098134,
|
70 |
+
0.3016748560587565,
|
71 |
+
0.2950767196337382,
|
72 |
+
0.290820267645518
|
73 |
+
],
|
74 |
+
"test_acc": [
|
75 |
+
0.7719,
|
76 |
+
0.8896,
|
77 |
+
0.8979,
|
78 |
+
0.9012,
|
79 |
+
0.9121,
|
80 |
+
0.9108,
|
81 |
+
0.9155,
|
82 |
+
0.9186,
|
83 |
+
0.9221,
|
84 |
+
0.922
|
85 |
+
],
|
86 |
+
"train_acc": [
|
87 |
+
0.59835,
|
88 |
+
0.8505166666666667,
|
89 |
+
0.8887,
|
90 |
+
0.90355,
|
91 |
+
0.9175333333333333,
|
92 |
+
0.9277166666666666,
|
93 |
+
0.9347166666666666,
|
94 |
+
0.9402333333333334,
|
95 |
+
0.94515,
|
96 |
+
0.9490333333333333
|
97 |
+
],
|
98 |
+
"train_loss": [
|
99 |
+
4.662385488891601,
|
100 |
+
3.7564958925882976,
|
101 |
+
3.325700936381022,
|
102 |
+
2.9968503290812176,
|
103 |
+
2.7574253098805745,
|
104 |
+
2.591482035191854,
|
105 |
+
2.485234659957886,
|
106 |
+
2.407597166442871,
|
107 |
+
2.3616587618509928,
|
108 |
+
2.331696878941854
|
109 |
+
]
|
110 |
+
}
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/manifest.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"class_names": [
|
3 |
+
"fashion-T-shirt/top",
|
4 |
+
"fashion-Trouser",
|
5 |
+
"fashion-Pullover",
|
6 |
+
"fashion-Dress",
|
7 |
+
"fashion-Coat",
|
8 |
+
"fashion-Sandal",
|
9 |
+
"fashion-Shirt",
|
10 |
+
"fashion-Sneaker",
|
11 |
+
"fashion-Bag",
|
12 |
+
"fashion-Ankle boot"
|
13 |
+
],
|
14 |
+
"dataset_name": "FashionMNIST",
|
15 |
+
"environment": {
|
16 |
+
"cpu_count": 96,
|
17 |
+
"cuda_available": false,
|
18 |
+
"cuda_device": null,
|
19 |
+
"memory_gb": 334.56,
|
20 |
+
"platform": "Linux-6.1.123+-x86_64-with-glibc2.35",
|
21 |
+
"python": "3.12.11 (main, Jun 4 2025, 08:56:18) [GCC 11.4.0]",
|
22 |
+
"torch": "2.8.0+cpu"
|
23 |
+
},
|
24 |
+
"models": {
|
25 |
+
"constellation": {
|
26 |
+
"params": 16777
|
27 |
+
},
|
28 |
+
"diagnostic_head": {
|
29 |
+
"params": 7681
|
30 |
+
},
|
31 |
+
"encoder": {
|
32 |
+
"params": 429897
|
33 |
+
}
|
34 |
+
},
|
35 |
+
"num_classes": 10,
|
36 |
+
"repo_id": "AbstractPhil/pentachora-multi-channel-frequency-encoded",
|
37 |
+
"results": {
|
38 |
+
"best_epoch": 9,
|
39 |
+
"best_test_accuracy": 0.9221
|
40 |
+
},
|
41 |
+
"subdirectory": "sweep/FashionMNIST/20250825-011246_FashionMNIST",
|
42 |
+
"timestamp": "20250825-011246"
|
43 |
+
}
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/accuracy.png
ADDED
![]() |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/best_confusion_fashionmnist_epoch_9.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/best_confusion_mnist_epoch_10.png
ADDED
![]() |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_1.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_10.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_2.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_3.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_4.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_5.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_6.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_7.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_8.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_9.png
ADDED
![]() |
Git LFS Details
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/lambda.png
ADDED
![]() |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/loss_components.png
ADDED
![]() |
sweep/FashionMNIST/20250825-011246_FashionMNIST/tensorboard/events.out.tfevents.1756083900.5def8ea04e29.2559.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fd6faf467774ed4d3b689dc43ee91de01e5ff23f15b1975e052896f19d3e795
|
3 |
+
size 170008
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/tensorboard_events.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:445647278657ac4d4fe99c9221dceed2150317fb4cca08bc3dab53e5f1ce0ec7
|
3 |
+
size 55461
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/weights/constellation_FashionMNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d915aa009a776e5351b8632a6bf59d7e5553aeff0f46062bd6108757479ff4e2
|
3 |
+
size 70076
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/weights/diagnostic_head_FashionMNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60cd1ec4a13efdf93532f7adda2523fbba91d35d2c963c37fa8b4dfbd75968bc
|
3 |
+
size 31172
|
sweep/FashionMNIST/20250825-011246_FashionMNIST/weights/encoder_FashionMNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e388087284bc59eb66f6f435760f84e2187b2f03054996f24bc3c05e3e8b0c72
|
3 |
+
size 1731664
|