[MNIST] 20250825-010451 | best_acc=0.9923
Browse files
- sweep/MNIST/20250825-010451_MNIST/README.md +10 -0
- sweep/MNIST/20250825-010451_MNIST/config.json +41 -0
- sweep/MNIST/20250825-010451_MNIST/history.csv +11 -0
- sweep/MNIST/20250825-010451_MNIST/history.json +110 -0
- sweep/MNIST/20250825-010451_MNIST/manifest.json +43 -0
- sweep/MNIST/20250825-010451_MNIST/plots/accuracy.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/best_confusion_mnist_epoch_10.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_1.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_10.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_2.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_3.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_4.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_5.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_6.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_7.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_8.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_9.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/lambda.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/plots/loss_components.png +0 -0
- sweep/MNIST/20250825-010451_MNIST/tensorboard/events.out.tfevents.1756083458.5def8ea04e29.2559.0 +3 -0
- sweep/MNIST/20250825-010451_MNIST/tensorboard_events.zip +3 -0
- sweep/MNIST/20250825-010451_MNIST/weights/constellation_MNIST.safetensors +3 -0
- sweep/MNIST/20250825-010451_MNIST/weights/diagnostic_head_MNIST.safetensors +3 -0
- sweep/MNIST/20250825-010451_MNIST/weights/encoder_MNIST.safetensors +3 -0
sweep/MNIST/20250825-010451_MNIST/README.md
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Pentachora Adaptive Encoded — 20250825-010451
|
2 |
+
|
3 |
+
**Dataset:** MNIST
|
4 |
+
|
5 |
+
**Contents**
|
6 |
+
- `weights/*.safetensors` — encoder, constellation, diagnostic head
|
7 |
+
- `config.json`, `manifest.json`
|
8 |
+
- `history.json` / `history.csv`
|
9 |
+
- `tensorboard/` (and `tensorboard_events.zip`)
|
10 |
+
- `plots/` — accuracy, loss components, λ (lambda), and per-epoch confusion matrices (plus the best-epoch confusion matrix)
|
sweep/MNIST/20250825-010451_MNIST/config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"augment": false,
|
3 |
+
"base_dim": 56,
|
4 |
+
"batch_size": 1024,
|
5 |
+
"channels": 24,
|
6 |
+
"dataset": "all",
|
7 |
+
"deterministic": true,
|
8 |
+
"deterministic_cublas": false,
|
9 |
+
"epochs": 10,
|
10 |
+
"hf_dataset_dir_template": "{dataset}",
|
11 |
+
"hf_preserve_case": true,
|
12 |
+
"hf_repo_id": "AbstractPhil/pentachora-multi-channel-frequency-encoded",
|
13 |
+
"hf_run_dir_template": "{ts}_{dataset}",
|
14 |
+
"hf_subdir_root": "sweep",
|
15 |
+
"hf_weight_suffix_dataset": true,
|
16 |
+
"img_channels": "auto",
|
17 |
+
"img_size": 28,
|
18 |
+
"input_channels": 1,
|
19 |
+
"input_dim": 784,
|
20 |
+
"lambda_separation": 0.391,
|
21 |
+
"loss_weight_scalar": 0.1,
|
22 |
+
"lr": 0.001,
|
23 |
+
"normalize": true,
|
24 |
+
"note": "",
|
25 |
+
"num_classes": 10,
|
26 |
+
"num_heads": 2,
|
27 |
+
"num_pentachoron_pairs": 2,
|
28 |
+
"per_dataset_norm": true,
|
29 |
+
"proj_dim": null,
|
30 |
+
"seed": 420,
|
31 |
+
"seed_per_dataset": false,
|
32 |
+
"strict_determinism": false,
|
33 |
+
"sweep_all": true,
|
34 |
+
"temp": 0.7,
|
35 |
+
"w_ce": 1.0,
|
36 |
+
"w_diag": 0.1,
|
37 |
+
"w_dual": 1.0,
|
38 |
+
"w_reg": 0.1,
|
39 |
+
"w_rose": 1.0,
|
40 |
+
"weight_decay": 1e-05
|
41 |
+
}
|
sweep/MNIST/20250825-010451_MNIST/history.csv
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,train_loss,train_acc,test_acc,ce,dual,rose,diag,reg,lambda
|
2 |
+
1,4.099099999491374,0.6092333333333333,0.7777,1.9353452950159709,1.4966692358652751,0.4187841921965281,0.03863755012104909,2.444374981943766,0.5082515478134155
|
3 |
+
2,3.265971806716919,0.9124,0.9828,1.4902187630971273,1.2094666115442911,0.27087780187924704,0.005726768050591151,2.9483592999776205,0.512462854385376
|
4 |
+
3,2.849476100794474,0.93975,0.9847,1.1438547242482504,1.1562489971796672,0.252196351591746,0.003246040508151054,2.9685141609191894,0.5146151781082153
|
5 |
+
4,2.547648438390096,0.9487833333333333,0.9884,0.8786565330505371,1.1265866938273112,0.24325079276561737,0.0024775896539290746,2.9890664339701334,0.5165699124336243
|
6 |
+
5,2.3415075052897136,0.9540333333333333,0.9887,0.698838595867157,1.105206903966268,0.23671859684785207,0.00181801314180096,3.005616041437785,0.5179175734519958
|
7 |
+
6,2.207916549046834,0.9670333333333333,0.9896,0.5828056198120117,1.0909406508127848,0.232258070174853,0.0013581937593407929,3.0177637739817302,0.518687903881073
|
8 |
+
7,2.127361617279053,0.9721833333333333,0.9903,0.5126966991265615,1.0822702507019042,0.2296740666071574,0.0011153380973575016,3.0260904886881512,0.5189071893692017
|
9 |
+
8,2.0816173538208007,0.9734,0.9915,0.4750055922985077,1.0759552146911622,0.2275281824350357,0.0008281340084969998,3.0304555992126465,0.5187594294548035
|
10 |
+
9,2.0542886912027996,0.9760333333333333,0.9916,0.4520849461714427,1.072440995089213,0.2264139123916626,0.0006916848283261061,3.032796762339274,0.5186092853546143
|
11 |
+
10,2.0445816794077554,0.9774333333333334,0.9923,0.4443954314549764,1.0708532263437907,0.22589081300099692,0.0006348217722183714,3.033787278874715,0.5185865163803101
|
sweep/MNIST/20250825-010451_MNIST/history.json
ADDED
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ce": [
|
3 |
+
1.9353452950159709,
|
4 |
+
1.4902187630971273,
|
5 |
+
1.1438547242482504,
|
6 |
+
0.8786565330505371,
|
7 |
+
0.698838595867157,
|
8 |
+
0.5828056198120117,
|
9 |
+
0.5126966991265615,
|
10 |
+
0.4750055922985077,
|
11 |
+
0.4520849461714427,
|
12 |
+
0.4443954314549764
|
13 |
+
],
|
14 |
+
"diag": [
|
15 |
+
0.03863755012104909,
|
16 |
+
0.005726768050591151,
|
17 |
+
0.003246040508151054,
|
18 |
+
0.0024775896539290746,
|
19 |
+
0.00181801314180096,
|
20 |
+
0.0013581937593407929,
|
21 |
+
0.0011153380973575016,
|
22 |
+
0.0008281340084969998,
|
23 |
+
0.0006916848283261061,
|
24 |
+
0.0006348217722183714
|
25 |
+
],
|
26 |
+
"dual": [
|
27 |
+
1.4966692358652751,
|
28 |
+
1.2094666115442911,
|
29 |
+
1.1562489971796672,
|
30 |
+
1.1265866938273112,
|
31 |
+
1.105206903966268,
|
32 |
+
1.0909406508127848,
|
33 |
+
1.0822702507019042,
|
34 |
+
1.0759552146911622,
|
35 |
+
1.072440995089213,
|
36 |
+
1.0708532263437907
|
37 |
+
],
|
38 |
+
"lambda": [
|
39 |
+
0.5082515478134155,
|
40 |
+
0.512462854385376,
|
41 |
+
0.5146151781082153,
|
42 |
+
0.5165699124336243,
|
43 |
+
0.5179175734519958,
|
44 |
+
0.518687903881073,
|
45 |
+
0.5189071893692017,
|
46 |
+
0.5187594294548035,
|
47 |
+
0.5186092853546143,
|
48 |
+
0.5185865163803101
|
49 |
+
],
|
50 |
+
"reg": [
|
51 |
+
2.444374981943766,
|
52 |
+
2.9483592999776205,
|
53 |
+
2.9685141609191894,
|
54 |
+
2.9890664339701334,
|
55 |
+
3.005616041437785,
|
56 |
+
3.0177637739817302,
|
57 |
+
3.0260904886881512,
|
58 |
+
3.0304555992126465,
|
59 |
+
3.032796762339274,
|
60 |
+
3.033787278874715
|
61 |
+
],
|
62 |
+
"rose": [
|
63 |
+
0.4187841921965281,
|
64 |
+
0.27087780187924704,
|
65 |
+
0.252196351591746,
|
66 |
+
0.24325079276561737,
|
67 |
+
0.23671859684785207,
|
68 |
+
0.232258070174853,
|
69 |
+
0.2296740666071574,
|
70 |
+
0.2275281824350357,
|
71 |
+
0.2264139123916626,
|
72 |
+
0.22589081300099692
|
73 |
+
],
|
74 |
+
"test_acc": [
|
75 |
+
0.7777,
|
76 |
+
0.9828,
|
77 |
+
0.9847,
|
78 |
+
0.9884,
|
79 |
+
0.9887,
|
80 |
+
0.9896,
|
81 |
+
0.9903,
|
82 |
+
0.9915,
|
83 |
+
0.9916,
|
84 |
+
0.9923
|
85 |
+
],
|
86 |
+
"train_acc": [
|
87 |
+
0.6092333333333333,
|
88 |
+
0.9124,
|
89 |
+
0.93975,
|
90 |
+
0.9487833333333333,
|
91 |
+
0.9540333333333333,
|
92 |
+
0.9670333333333333,
|
93 |
+
0.9721833333333333,
|
94 |
+
0.9734,
|
95 |
+
0.9760333333333333,
|
96 |
+
0.9774333333333334
|
97 |
+
],
|
98 |
+
"train_loss": [
|
99 |
+
4.099099999491374,
|
100 |
+
3.265971806716919,
|
101 |
+
2.849476100794474,
|
102 |
+
2.547648438390096,
|
103 |
+
2.3415075052897136,
|
104 |
+
2.207916549046834,
|
105 |
+
2.127361617279053,
|
106 |
+
2.0816173538208007,
|
107 |
+
2.0542886912027996,
|
108 |
+
2.0445816794077554
|
109 |
+
]
|
110 |
+
}
|
sweep/MNIST/20250825-010451_MNIST/manifest.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"class_names": [
|
3 |
+
"digit-0",
|
4 |
+
"digit-1",
|
5 |
+
"digit-2",
|
6 |
+
"digit-3",
|
7 |
+
"digit-4",
|
8 |
+
"digit-5",
|
9 |
+
"digit-6",
|
10 |
+
"digit-7",
|
11 |
+
"digit-8",
|
12 |
+
"digit-9"
|
13 |
+
],
|
14 |
+
"dataset_name": "MNIST",
|
15 |
+
"environment": {
|
16 |
+
"cpu_count": 96,
|
17 |
+
"cuda_available": false,
|
18 |
+
"cuda_device": null,
|
19 |
+
"memory_gb": 334.56,
|
20 |
+
"platform": "Linux-6.1.123+-x86_64-with-glibc2.35",
|
21 |
+
"python": "3.12.11 (main, Jun 4 2025, 08:56:18) [GCC 11.4.0]",
|
22 |
+
"torch": "2.8.0+cpu"
|
23 |
+
},
|
24 |
+
"models": {
|
25 |
+
"constellation": {
|
26 |
+
"params": 16777
|
27 |
+
},
|
28 |
+
"diagnostic_head": {
|
29 |
+
"params": 7681
|
30 |
+
},
|
31 |
+
"encoder": {
|
32 |
+
"params": 429897
|
33 |
+
}
|
34 |
+
},
|
35 |
+
"num_classes": 10,
|
36 |
+
"repo_id": "AbstractPhil/pentachora-multi-channel-frequency-encoded",
|
37 |
+
"results": {
|
38 |
+
"best_epoch": 10,
|
39 |
+
"best_test_accuracy": 0.9923
|
40 |
+
},
|
41 |
+
"subdirectory": "sweep/MNIST/20250825-010451_MNIST",
|
42 |
+
"timestamp": "20250825-010451"
|
43 |
+
}
|
sweep/MNIST/20250825-010451_MNIST/plots/accuracy.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/best_confusion_mnist_epoch_10.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_1.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_10.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_2.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_3.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_4.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_5.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_6.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_7.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_8.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/confusion_epoch_9.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/lambda.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/plots/loss_components.png
ADDED
![]() |
sweep/MNIST/20250825-010451_MNIST/tensorboard/events.out.tfevents.1756083458.5def8ea04e29.2559.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af700f0010e522bbc819767e13d5b163f099544971299784a425639251ddaea8
|
3 |
+
size 170008
|
sweep/MNIST/20250825-010451_MNIST/tensorboard_events.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e2e4b5bdca7454676335f01163aec57a7e29d36fc71bb6fd78d13112dc74027
|
3 |
+
size 55533
|
sweep/MNIST/20250825-010451_MNIST/weights/constellation_MNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4aaa902b486dfa1c987da95737aa9290dc7ef3c11691abd9b3f0da4d944be3e
|
3 |
+
size 70076
|
sweep/MNIST/20250825-010451_MNIST/weights/diagnostic_head_MNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca2f1fb9610597007716891ad323b31310c3c2ef152b0a2df8a4304330c4d49a
|
3 |
+
size 31172
|
sweep/MNIST/20250825-010451_MNIST/weights/encoder_MNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:972b6a9a5a2418417859df36ea14468e3cac961e0f3d9f0e0b14d75074564cca
|
3 |
+
size 1731664
|