rwightman HF staff committed on
Commit
67e3f61
·
verified ·
1 Parent(s): 12ff40b

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ datasets:
4
+ - timm/mini-imagenet
5
+ ---
6
+
7
+ # Comparisons of timm Optimizers w/ Caution
8
+
9
+ This repo contains summaries of several sets of experiments comparing a number of optimizers with and without caution enabled (see https://huggingface.co/papers/2411.16085).
10
+
11
+ All runs were trained from scratch on the `timm` 'mini-imagenet' dataset, a 100-class subset of ImageNet with the same image sizes as the originals.
12
+
13
+ So far I have results for `adamw` and `laprop`, with some `mars` runs on the way. You can find full results in sub-folders named after each optimizer.
14
+
15
+ # LaProp
16
+
17
+ # AdamW
18
+
19
+
adamw/adamw-lr_0002-checkpoint-203.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88e49c27b341259fa626e2a4e4e4f3a2b62a828b39e3875857c13af111a4b7dc
3
+ size 211387470
adamw/adamw-lr_0005-checkpoint-185.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94f5b15c9ea001595235ab0c50fec59e0ae5b1f82626cdb62a71b8c62b1d65ee
3
+ size 211387470
adamw/adamw-lr_001-checkpoint-199.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c76b35ea0ffee3b6c7958bcc645ab4941f7fe3b24aad71095621ddc108f74e80
3
+ size 211387470
adamw/adamw-lr_001-clip-checkpoint-195.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:118abb1714f851691b73ca52fe20015e14a035bbb4f1c694333be33080391aef
3
+ size 211387470
adamw/cadamw-lr_0002-checkpoint-189.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86c1363d080c254eb95d12a0df9c8d30eed81ea46866c3e5826ec82ccbfc9706
3
+ size 211336594
adamw/cadamw-lr_0005-checkpoint-199.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13aa98399271229bcba63637e2566bfce07704e99ab62d465262bad116507da9
3
+ size 211336594
adamw/cadamw-lr_001-checkpoint-184.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fad9e197ad7d73fde5544cf897dbd16c41c9daf58b5cae81bc90cca5041da3e
3
+ size 211336594
adamw/cadamw-lr_001-clip-checkpoint-203.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b22a9657e417d5dbdedb24f6f628f4f2817dd8d7e8cd5b7db3ce85acfaaa54c6
3
+ size 211336594
adamw/eval_loss_comparison.png ADDED
adamw/eval_top1_comparison.png ADDED
adamw/eval_top5_comparison.png ADDED
adamw/final_results_summary.csv ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ ,epoch,train_loss,eval_loss,eval_top1,eval_top5,lr
2
+ "cadamw, lr=1e-03",184.0,2.2688851356506348,1.0868136840820313,73.52000141601563,91.60000036621092,2.4471741852423235e-05
3
+ "cadamw, lr=5e-04",199.0,2.163278102874756,1.0976034646987916,73.3900005859375,91.31000137939454,7.70666566718009e-07
4
+ "cadamw, lr=1e-03, clip grads",203.0,2.1360626220703125,1.1043113907814026,73.33000158691407,91.41000042724608,6.168375916970616e-08
5
+ "adamw, lr=1e-03, clip grads",195.0,2.2746386528015137,1.142998440361023,72.11000151367188,90.47000052490236,4.988171141721176e-06
6
+ "adamw, lr=5e-04",185.0,2.3040246963500977,1.1535791856765747,71.50000120849609,90.4800001953125,1.1051746300417442e-05
7
+ "adamw, lr=1e-03",199.0,2.223684310913086,1.1657958560943604,71.22999993896484,90.30999958496092,1.541333133436018e-06
8
+ "cadamw, lr=2e-04",189.0,2.538627862930298,1.2325929063796996,68.94999995117188,89.61000139160156,2.763007960232344e-06
9
+ "adamw, lr=2e-04",203.0,2.579624652862549,1.3085522148132325,67.11000026855469,88.66000164794922,1.2336751833941227e-08
adamw/train_loss_comparison.png ADDED
laprop/claprop-lr_0002-checkpoint-195.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:558bad1ced67c3dd94eea7f599f114880fa3b056e50115b7291b6218888d2b34
3
+ size 211342290
laprop/claprop-lr_0005-checkpoint-183.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91b5d53fb993cb498da5e3120bc4ee7475542a9e3d0da09aaada61ec5abdd21d
3
+ size 211342290
laprop/claprop-lr_001-checkpoint-204.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fae5f775ae350f34f01e62d8bb40f67ef5d6e7dfd81d33125a019ae9b4e0da34
3
+ size 211342290
laprop/claprop-lr_002-checkpoint-193.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f6b43bcf14bd5decc2494305faa53611315dcc212e729b6221f4593c7e1d1eb
3
+ size 211342290
laprop/eval_loss_comparison.png ADDED
laprop/eval_top1_comparison.png ADDED
laprop/eval_top5_comparison.png ADDED
laprop/final_results_summary.csv ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ ,epoch,train_loss,eval_loss,eval_top1,eval_top5,lr
2
+ "claprop, lr=1e-03",204.0,2.2173619270324707,1.0931779468536378,73.920000390625,91.33000009765624,0.0
3
+ "claprop, lr=5e-04",183.0,2.262192726135254,1.0912627222061158,73.77000073242188,91.22000260009766,1.3478660293113704e-05
4
+ "laprop, lr=5e-04",198.0,2.2425642013549805,1.1426102781295775,71.73000213623047,90.55000146484376,1.109508849230001e-06
5
+ "laprop, lr=1e-03",179.0,2.290040969848633,1.168387135314941,71.15000104980469,90.18000189208983,3.806023374435663e-05
6
+ "claprop, lr=2e-04",195.0,2.546172380447388,1.2475446645736694,68.30000163574219,89.15000153808593,9.97634228344235e-07
7
+ "laprop, lr=2e-04",204.0,2.6702351570129395,1.309178423690796,67.07999990234374,88.67000270996094,0.0
8
+ "claprop, lr=2e-03",193.0,2.678058862686157,1.5239886917114258,62.08000177001953,84.8,1.4890673845226132e-05
9
+ "laprop, lr=2e-03",200.0,2.70467209815979,1.522907255935669,61.46000135498047,85.28000162353516,1.9732715717284413e-06
laprop/laprop-lr_0002-checkpoint-204.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9afc7c1fbe28416b81369c40640fb2bd6e1884c384c374e50e9ab7a3908dbb5e
3
+ size 211342290
laprop/laprop-lr_0005-checkpoint-198.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37a62da798552af81f067d28bb1325276efb8e749f5a5f889e21e805a4617233
3
+ size 211342290
laprop/laprop-lr_001-checkpoint-179.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3e0ae5d6a347032f2c35b11e304cc8815f0e627cfdd025af2d854d6f33c6d30
3
+ size 211342290
laprop/laprop-lr_002-checkpoint-200.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:154e6cf00f58f5633c347c178328b01ac9e10833e77db7b6eb36a364c4b5f085
3
+ size 211342290
laprop/train_loss_comparison.png ADDED