[KMNIST] 20250825-012106 | best_acc=0.9489
Browse files- .gitattributes +1 -0
- sweep/KMNIST/20250825-012106_KMNIST/README.md +10 -0
- sweep/KMNIST/20250825-012106_KMNIST/config.json +41 -0
- sweep/KMNIST/20250825-012106_KMNIST/history.csv +11 -0
- sweep/KMNIST/20250825-012106_KMNIST/history.json +110 -0
- sweep/KMNIST/20250825-012106_KMNIST/manifest.json +43 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/accuracy.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/best_confusion_fashionmnist_epoch_9.png +3 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/best_confusion_kmnist_epoch_10.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/best_confusion_mnist_epoch_10.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_1.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_10.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_2.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_3.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_4.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_5.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_6.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_7.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_8.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_9.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/lambda.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/plots/loss_components.png +0 -0
- sweep/KMNIST/20250825-012106_KMNIST/tensorboard/events.out.tfevents.1756084397.5def8ea04e29.2559.2 +3 -0
- sweep/KMNIST/20250825-012106_KMNIST/tensorboard_events.zip +3 -0
- sweep/KMNIST/20250825-012106_KMNIST/weights/constellation_KMNIST.safetensors +3 -0
- sweep/KMNIST/20250825-012106_KMNIST/weights/diagnostic_head_KMNIST.safetensors +3 -0
- sweep/KMNIST/20250825-012106_KMNIST/weights/encoder_KMNIST.safetensors +3 -0
.gitattributes
CHANGED
@@ -548,3 +548,4 @@ sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_6.png filt
|
|
548 |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_7.png filter=lfs diff=lfs merge=lfs -text
|
549 |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_8.png filter=lfs diff=lfs merge=lfs -text
|
550 |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_9.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
548 |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_7.png filter=lfs diff=lfs merge=lfs -text
|
549 |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_8.png filter=lfs diff=lfs merge=lfs -text
|
550 |
sweep/FashionMNIST/20250825-011246_FashionMNIST/plots/confusion_epoch_9.png filter=lfs diff=lfs merge=lfs -text
|
551 |
+
sweep/KMNIST/20250825-012106_KMNIST/plots/best_confusion_fashionmnist_epoch_9.png filter=lfs diff=lfs merge=lfs -text
|
sweep/KMNIST/20250825-012106_KMNIST/README.md
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Pentachora Adaptive Encoded — 20250825-012106
|
2 |
+
|
3 |
+
**Dataset:** KMNIST
|
4 |
+
|
5 |
+
**Contents**
|
6 |
+
- `weights/*.safetensors` — encoder, constellation, diagnostic head
|
7 |
+
- `config.json`, `manifest.json`
|
8 |
+
- `history.json` / `history.csv`
|
9 |
+
- `tensorboard/` (and `tensorboard_events.zip`)
|
10 |
+
- `plots/` — accuracy, loss, λ, confusion
|
sweep/KMNIST/20250825-012106_KMNIST/config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"augment": false,
|
3 |
+
"base_dim": 56,
|
4 |
+
"batch_size": 1024,
|
5 |
+
"channels": 24,
|
6 |
+
"dataset": "all",
|
7 |
+
"deterministic": true,
|
8 |
+
"deterministic_cublas": false,
|
9 |
+
"epochs": 10,
|
10 |
+
"hf_dataset_dir_template": "{dataset}",
|
11 |
+
"hf_preserve_case": true,
|
12 |
+
"hf_repo_id": "AbstractPhil/pentachora-multi-channel-frequency-encoded",
|
13 |
+
"hf_run_dir_template": "{ts}_{dataset}",
|
14 |
+
"hf_subdir_root": "sweep",
|
15 |
+
"hf_weight_suffix_dataset": true,
|
16 |
+
"img_channels": "auto",
|
17 |
+
"img_size": 28,
|
18 |
+
"input_channels": 1,
|
19 |
+
"input_dim": 784,
|
20 |
+
"lambda_separation": 0.391,
|
21 |
+
"loss_weight_scalar": 0.1,
|
22 |
+
"lr": 0.001,
|
23 |
+
"normalize": true,
|
24 |
+
"note": "",
|
25 |
+
"num_classes": 10,
|
26 |
+
"num_heads": 2,
|
27 |
+
"num_pentachoron_pairs": 2,
|
28 |
+
"per_dataset_norm": true,
|
29 |
+
"proj_dim": null,
|
30 |
+
"seed": 420,
|
31 |
+
"seed_per_dataset": false,
|
32 |
+
"strict_determinism": false,
|
33 |
+
"sweep_all": true,
|
34 |
+
"temp": 0.7,
|
35 |
+
"w_ce": 1.0,
|
36 |
+
"w_diag": 0.1,
|
37 |
+
"w_dual": 1.0,
|
38 |
+
"w_reg": 0.1,
|
39 |
+
"w_rose": 1.0,
|
40 |
+
"weight_decay": 1e-05
|
41 |
+
}
|
sweep/KMNIST/20250825-012106_KMNIST/history.csv
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,train_loss,train_acc,test_acc,ce,dual,rose,diag,reg,lambda
|
2 |
+
1,4.48557572962443,0.5265166666666666,0.5602,1.9555096396128337,1.7448287576039632,0.5330904651641846,0.05771094880104065,2.463757032394409,0.5119326114654541
|
3 |
+
2,3.536102939987183,0.7662166666666667,0.8063,1.5454197209040323,1.364822986094157,0.3225712060133616,0.010663992638140917,3.022226466878255,0.5179829597473145
|
4 |
+
3,3.072022127532959,0.8785166666666666,0.9052,1.20693379611969,1.2747692097345988,0.2868388524691264,0.0060369723297655584,3.0287655672709146,0.5220382213592529
|
5 |
+
4,2.736741449737549,0.9232333333333334,0.9184,0.9466318797747294,1.2180658071517945,0.26746210424105327,0.004417671928058068,3.0413989435831708,0.524588942527771
|
6 |
+
5,2.5052449064890543,0.94165,0.9295,0.7657997594833374,1.1790255869547526,0.2550309862534205,0.0033509777244801323,3.0505347118377686,0.5263093709945679
|
7 |
+
6,2.3470733192443847,0.9666,0.9426,0.6433882504145304,1.1513723458607992,0.24600428889592488,0.002436440508812666,3.0606480485280354,0.5270016193389893
|
8 |
+
7,2.245156974029541,0.9777,0.9456,0.5646296345074971,1.1333092889149983,0.2402667633374532,0.0018552673658976952,3.067657651646932,0.5269185304641724
|
9 |
+
8,2.182974470901489,0.98115,0.9476,0.5174491348266601,1.1217439079284668,0.23643683848381042,0.0014199050638824702,3.072026076380412,0.5269790291786194
|
10 |
+
9,2.152672373199463,0.9812166666666666,0.947,0.49484223211606343,1.115748365910848,0.2345398904800415,0.0012661761294739942,3.0741526353200275,0.5268410444259644
|
11 |
+
10,2.1409359020233154,0.9815333333333334,0.9489,0.48612042428652447,1.1133787235260009,0.23381469444433847,0.0011963561533639827,3.0750242593129475,0.5268127918243408
|
sweep/KMNIST/20250825-012106_KMNIST/history.json
ADDED
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ce": [
|
3 |
+
1.9555096396128337,
|
4 |
+
1.5454197209040323,
|
5 |
+
1.20693379611969,
|
6 |
+
0.9466318797747294,
|
7 |
+
0.7657997594833374,
|
8 |
+
0.6433882504145304,
|
9 |
+
0.5646296345074971,
|
10 |
+
0.5174491348266601,
|
11 |
+
0.49484223211606343,
|
12 |
+
0.48612042428652447
|
13 |
+
],
|
14 |
+
"diag": [
|
15 |
+
0.05771094880104065,
|
16 |
+
0.010663992638140917,
|
17 |
+
0.0060369723297655584,
|
18 |
+
0.004417671928058068,
|
19 |
+
0.0033509777244801323,
|
20 |
+
0.002436440508812666,
|
21 |
+
0.0018552673658976952,
|
22 |
+
0.0014199050638824702,
|
23 |
+
0.0012661761294739942,
|
24 |
+
0.0011963561533639827
|
25 |
+
],
|
26 |
+
"dual": [
|
27 |
+
1.7448287576039632,
|
28 |
+
1.364822986094157,
|
29 |
+
1.2747692097345988,
|
30 |
+
1.2180658071517945,
|
31 |
+
1.1790255869547526,
|
32 |
+
1.1513723458607992,
|
33 |
+
1.1333092889149983,
|
34 |
+
1.1217439079284668,
|
35 |
+
1.115748365910848,
|
36 |
+
1.1133787235260009
|
37 |
+
],
|
38 |
+
"lambda": [
|
39 |
+
0.5119326114654541,
|
40 |
+
0.5179829597473145,
|
41 |
+
0.5220382213592529,
|
42 |
+
0.524588942527771,
|
43 |
+
0.5263093709945679,
|
44 |
+
0.5270016193389893,
|
45 |
+
0.5269185304641724,
|
46 |
+
0.5269790291786194,
|
47 |
+
0.5268410444259644,
|
48 |
+
0.5268127918243408
|
49 |
+
],
|
50 |
+
"reg": [
|
51 |
+
2.463757032394409,
|
52 |
+
3.022226466878255,
|
53 |
+
3.0287655672709146,
|
54 |
+
3.0413989435831708,
|
55 |
+
3.0505347118377686,
|
56 |
+
3.0606480485280354,
|
57 |
+
3.067657651646932,
|
58 |
+
3.072026076380412,
|
59 |
+
3.0741526353200275,
|
60 |
+
3.0750242593129475
|
61 |
+
],
|
62 |
+
"rose": [
|
63 |
+
0.5330904651641846,
|
64 |
+
0.3225712060133616,
|
65 |
+
0.2868388524691264,
|
66 |
+
0.26746210424105327,
|
67 |
+
0.2550309862534205,
|
68 |
+
0.24600428889592488,
|
69 |
+
0.2402667633374532,
|
70 |
+
0.23643683848381042,
|
71 |
+
0.2345398904800415,
|
72 |
+
0.23381469444433847
|
73 |
+
],
|
74 |
+
"test_acc": [
|
75 |
+
0.5602,
|
76 |
+
0.8063,
|
77 |
+
0.9052,
|
78 |
+
0.9184,
|
79 |
+
0.9295,
|
80 |
+
0.9426,
|
81 |
+
0.9456,
|
82 |
+
0.9476,
|
83 |
+
0.947,
|
84 |
+
0.9489
|
85 |
+
],
|
86 |
+
"train_acc": [
|
87 |
+
0.5265166666666666,
|
88 |
+
0.7662166666666667,
|
89 |
+
0.8785166666666666,
|
90 |
+
0.9232333333333334,
|
91 |
+
0.94165,
|
92 |
+
0.9666,
|
93 |
+
0.9777,
|
94 |
+
0.98115,
|
95 |
+
0.9812166666666666,
|
96 |
+
0.9815333333333334
|
97 |
+
],
|
98 |
+
"train_loss": [
|
99 |
+
4.48557572962443,
|
100 |
+
3.536102939987183,
|
101 |
+
3.072022127532959,
|
102 |
+
2.736741449737549,
|
103 |
+
2.5052449064890543,
|
104 |
+
2.3470733192443847,
|
105 |
+
2.245156974029541,
|
106 |
+
2.182974470901489,
|
107 |
+
2.152672373199463,
|
108 |
+
2.1409359020233154
|
109 |
+
]
|
110 |
+
}
|
sweep/KMNIST/20250825-012106_KMNIST/manifest.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"class_names": [
|
3 |
+
"kmnist-\u304a",
|
4 |
+
"kmnist-\u304d",
|
5 |
+
"kmnist-\u3059",
|
6 |
+
"kmnist-\u3064",
|
7 |
+
"kmnist-\u306a",
|
8 |
+
"kmnist-\u306f",
|
9 |
+
"kmnist-\u307e",
|
10 |
+
"kmnist-\u3084",
|
11 |
+
"kmnist-\u308c",
|
12 |
+
"kmnist-\u3092"
|
13 |
+
],
|
14 |
+
"dataset_name": "KMNIST",
|
15 |
+
"environment": {
|
16 |
+
"cpu_count": 96,
|
17 |
+
"cuda_available": false,
|
18 |
+
"cuda_device": null,
|
19 |
+
"memory_gb": 334.56,
|
20 |
+
"platform": "Linux-6.1.123+-x86_64-with-glibc2.35",
|
21 |
+
"python": "3.12.11 (main, Jun 4 2025, 08:56:18) [GCC 11.4.0]",
|
22 |
+
"torch": "2.8.0+cpu"
|
23 |
+
},
|
24 |
+
"models": {
|
25 |
+
"constellation": {
|
26 |
+
"params": 16777
|
27 |
+
},
|
28 |
+
"diagnostic_head": {
|
29 |
+
"params": 7681
|
30 |
+
},
|
31 |
+
"encoder": {
|
32 |
+
"params": 429897
|
33 |
+
}
|
34 |
+
},
|
35 |
+
"num_classes": 10,
|
36 |
+
"repo_id": "AbstractPhil/pentachora-multi-channel-frequency-encoded",
|
37 |
+
"results": {
|
38 |
+
"best_epoch": 10,
|
39 |
+
"best_test_accuracy": 0.9489
|
40 |
+
},
|
41 |
+
"subdirectory": "sweep/KMNIST/20250825-012106_KMNIST",
|
42 |
+
"timestamp": "20250825-012106"
|
43 |
+
}
|
sweep/KMNIST/20250825-012106_KMNIST/plots/accuracy.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/best_confusion_fashionmnist_epoch_9.png
ADDED
![]() |
Git LFS Details
|
sweep/KMNIST/20250825-012106_KMNIST/plots/best_confusion_kmnist_epoch_10.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/best_confusion_mnist_epoch_10.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_1.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_10.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_2.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_3.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_4.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_5.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_6.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_7.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_8.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/confusion_epoch_9.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/lambda.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/plots/loss_components.png
ADDED
![]() |
sweep/KMNIST/20250825-012106_KMNIST/tensorboard/events.out.tfevents.1756084397.5def8ea04e29.2559.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3513ca9fcc02e1ff9a05dd6b9cf00a86ec3fc07cc2828895bb547aa5095195c
|
3 |
+
size 170008
|
sweep/KMNIST/20250825-012106_KMNIST/tensorboard_events.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63c046e5563570ab1245cac20b46c134aa1643bb08978ad114819834248f91fa
|
3 |
+
size 55540
|
sweep/KMNIST/20250825-012106_KMNIST/weights/constellation_KMNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3fb3fd8d4e57260880fc05004229990b66a39ad886f2d9902c5cff62463a96
|
3 |
+
size 70076
|
sweep/KMNIST/20250825-012106_KMNIST/weights/diagnostic_head_KMNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da494e317c6f4bc200390e1efa8a54e3f4d2d4efbbe05be657c021dfb1abe3d1
|
3 |
+
size 31172
|
sweep/KMNIST/20250825-012106_KMNIST/weights/encoder_KMNIST.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a7479af9684ee9daba831b2745e3c5c064963e4472ce6fabcdd4c232f1673d9
|
3 |
+
size 1731664
|