Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
32 commits
Select commit Hold shift + click to select a range
57e8174
Premiere tentative implémentation EBM
ArdSionnach Apr 20, 2026
8aff401
Premier essai EBM
ArdSionnach Apr 21, 2026
d282fa6
Avant gros train
ArdSionnach Apr 21, 2026
791883f
added visible field
ArdSionnach Apr 21, 2026
85cb3c8
Update cli
ArdSionnach Apr 22, 2026
bad733f
notebooks and trainings
ArdSionnach Apr 23, 2026
74361bc
update var init
ArdSionnach Apr 23, 2026
3664a4c
alpha
ArdSionnach Apr 23, 2026
f24edd6
alpha v2
ArdSionnach Apr 23, 2026
7877abf
CEBM
ArdSionnach Apr 27, 2026
90251ed
BEBM_MLP_ReLU_vs_SiLU
ArdSionnach Apr 30, 2026
d1dde0d
update_h_gradient
ArdSionnach Apr 30, 2026
2677495
notebook comparaison
ArdSionnach Apr 30, 2026
2307ab3
h start a 0
ArdSionnach Apr 30, 2026
af905e2
Notebooks
ArdSionnach May 6, 2026
595fbde
init h
ArdSionnach May 6, 2026
0bc5cee
notebook
ArdSionnach May 6, 2026
c3621bb
sigmoid
ArdSionnach May 6, 2026
f9c1e8a
bug init h
ArdSionnach May 6, 2026
41875c0
revert silu
ArdSionnach May 6, 2026
314c94c
MLP no w2 + modular weights
ArdSionnach May 7, 2026
6d1d162
debug
ArdSionnach May 7, 2026
d2d6273
Sigmo no w2
ArdSionnach May 7, 2026
3be6369
option silu sigmo
ArdSionnach May 7, 2026
af70bf4
weight scale
ArdSionnach May 8, 2026
7079921
weight scale
ArdSionnach May 8, 2026
8eb0f7e
alpha init
ArdSionnach May 11, 2026
c450bf7
alpha again
ArdSionnach May 11, 2026
133ba16
nb
ArdSionnach May 11, 2026
ecf8977
weight scale init
ArdSionnach May 11, 2026
6cb833c
Restructure
ArdSionnach May 12, 2026
654ea3f
Merge pull request #1 from AidanLiotard/update_h_gradient
AidanLiotard May 14, 2026
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Binary file added .DS_Store
Binary file not shown.
555 changes: 555 additions & 0 deletions CEBM_MLP_training_diagnostics.ipynb
Copy link
Copy Markdown
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

ca degage

Large diffs are not rendered by default.

130 changes: 130 additions & 0 deletions long_runs_summary.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,130 @@
[
{
"label": "PCD SiLU NoW2",
"file": "pcd_trains/BEBM_SiLUNoW2_MNIST_DMALA1000_h500_init2e-3_lr1_1M.h5",
"n_saved": 149,
"last_update": 165958,
"keys": [
"activation_id",
"net.0.bias",
"net.0.weight",
"visible_field"
],
"vf_norm": 83033.9921875,
"vf_max": 11102.6220703125,
"vf_mean": -1595.8912353515625,
"w1_shape": "(500, 784)",
"w1_top1": 316697.84375,
"w1_top10": 35082.2109375,
"w1_top100": 3777.509765625,
"w1_rank1_share": 0.9939182996749878,
"w1_fro": 317665.21875,
"b1_mean": -186.12503051757812,
"b1_std": 4.241181373596191,
"b1_max": 199.09078979492188
},
{
"label": "PCD Sigmoid NoW2",
"file": "pcd_trains/BEBM_SigmoidNoW2_MNIST_DMALA1000_h500_init2e-3_lr1_1M.h5",
"n_saved": 149,
"last_update": 165958,
"keys": [
"activation_id",
"net.0.bias",
"net.0.weight",
"visible_field"
],
"vf_norm": 175.0694122314453,
"vf_max": 12.101303100585938,
"vf_mean": -4.691315174102783,
"w1_shape": "(500, 784)",
"w1_top1": 246.93637084960938,
"w1_top10": 119.21197509765625,
"w1_top100": 38.297794342041016,
"w1_rank1_share": 0.22283990681171417,
"w1_fro": 523.1046142578125,
"b1_mean": -3.8225128650665283,
"b1_std": 2.0763652324676514,
"b1_max": 6.312178134918213
},
{
"label": "PCD SiLU W2",
"file": "pcd_trains/BEBM_SiLUW2_MNIST_DMALA1000_h500_init2e-3_lr1e-1_1M.h5",
"n_saved": 134,
"last_update": 58884,
"keys": [
"net.0.bias",
"net.0.weight",
"net.2.bias",
"net.2.weight",
"visible_field"
],
"vf_norm": 162.9449462890625,
"vf_max": 9.335200309753418,
"vf_mean": -4.58335542678833,
"w1_shape": "(500, 784)",
"w1_top1": 38.34831237792969,
"w1_top10": 24.081403732299805,
"w1_top100": 11.07005500793457,
"w1_rank1_share": 0.08474628627300262,
"w1_fro": 131.73036193847656,
"w2_shape": "(1, 500)",
"w2_norm": 48.97020721435547,
"w2_max": 5.792479991912842,
"b1_mean": -0.2771584689617157,
"b1_std": 2.4273900985717773,
"b1_max": 23.419179916381836
},
{
"label": "PTT SiLU NoW2",
"file": "ptt_trains/BEBM_SiLUNoW2_MNIST_PTT_DMALA1000_h500_init2e-3_lr1_500k.h5",
"n_saved": 148,
"last_update": 65407,
"keys": [
"activation_id",
"net.0.bias",
"net.0.weight",
"visible_field"
],
"vf_norm": 237.40695190429688,
"vf_max": 18.76725196838379,
"vf_mean": -6.284590721130371,
"w1_shape": "(500, 784)",
"w1_top1": 292.43609619140625,
"w1_top10": 283.3573303222656,
"w1_top100": 239.63055419921875,
"w1_rank1_share": 0.010965309105813503,
"w1_fro": 2792.67578125,
"b1_mean": -0.03123946487903595,
"b1_std": 1.0010740756988525,
"b1_max": 3.9160094261169434
},
{
"label": "PTT SiLU W2",
"file": "ptt_trains/BEBM_SiLUW2_MNIST_PTT_DMALA1000_h500_init2e-3_lr1e-1_500k.h5",
"n_saved": 163,
"last_update": 33879,
"keys": [
"net.0.bias",
"net.0.weight",
"net.2.bias",
"net.2.weight",
"visible_field"
],
"vf_norm": 153.01023864746094,
"vf_max": 9.231229782104492,
"vf_mean": -4.340636730194092,
"w1_shape": "(500, 784)",
"w1_top1": 7.3609299659729,
"w1_top10": 4.708344459533691,
"w1_top100": 1.409213662147522,
"w1_rank1_share": 0.1199466660618782,
"w1_fro": 21.253896713256836,
"w2_shape": "(1, 500)",
"w2_norm": 35.71017837524414,
"w2_max": 10.47995662689209,
"b1_mean": 0.06310277432203293,
"b1_std": 0.463110089302063,
"b1_max": 7.387264728546143
}
]
997 changes: 997 additions & 0 deletions nb/BEBM_MLP/BEBM_MLP.ipynb
Copy link
Copy Markdown
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Retire le du dossier

Large diffs are not rendered by default.

Loading
Loading