diff --git a/11/edges.pkl b/11/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..4a55723a29de417bb353407a4e5c9757485c46b6 --- /dev/null +++ b/11/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:065665533dc7cf3c973fc8c0b0933d1e8429d17836623d5a9af405c845d8b285 +size 1178 diff --git a/11/ll_model_510.pth b/11/ll_model_510.pth index 823e929357018f7e021e63a73f69e797a2d142f6..f61100eef326423dcb3018ef5e999587674c41d4 100644 Binary files a/11/ll_model_510.pth and b/11/ll_model_510.pth differ diff --git a/11/ll_model_cfg_510.pkl b/11/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..1acb8792be1a154e9fd77f84f84ef7feb99dfc0e --- /dev/null +++ b/11/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8e5809cf449449c4551be0b5808e9d5886ea09f79c7eb0403bf2432bc5c3148 +size 1040 diff --git a/11/meta_510.json b/11/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..ad7d06c8eb7a159f35709736ae39d69de1f2c9a0 --- /dev/null +++ b/11/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.01, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 500, "act_fn": "gelu", "wandb_suffix": "strict_11", "device": "cpu", "clip_grad_norm": 1.0, "lr_scheduler": ""} \ No newline at end of file diff --git a/13/edges.pkl b/13/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..77513f4611eed1b5302d422e25853647e4ea7ae2 --- /dev/null +++ b/13/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71db99d1f02016dbeb19f31dd153dbd9868d9569e8434b8729f5730a058b874 +size 1829 diff --git a/13/ll_model_510.pth b/13/ll_model_510.pth index 6989f8ba38cb8d4cd106f04139289b2dfcf22373..c88f2225b80f9623f3b737f7bf3472b8514f639e 100644 Binary files a/13/ll_model_510.pth and b/13/ll_model_510.pth differ diff --git a/13/ll_model_cfg_510.pkl b/13/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..fe48a1176cd63188e559350cb434173eae2a5229 --- /dev/null +++ b/13/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12e9924e5c037c5866059ec5b4f59311e6a8d9c15481600cf7b8d119d7830856 +size 1047 diff --git a/13/meta_510.json b/13/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..94cf8a03ce2b86feac549383a688cc4e82ab7014 --- /dev/null +++ b/13/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.01, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 500, "act_fn": "gelu", "wandb_suffix": "strict_13", "device": "cpu", "clip_grad_norm": 1.0, "lr_scheduler": ""} \ No newline at end of file diff --git a/14/ll_model_510.pth b/14/ll_model_510.pth deleted file mode 100644 index ff2392fa2d3d3f3ab9f831de6a769915a01b6f14..0000000000000000000000000000000000000000 Binary files a/14/ll_model_510.pth and /dev/null differ diff --git a/18/edges.pkl b/18/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..e86ca04e08ceea17226795b7c31d325808ae412c --- /dev/null +++ b/18/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de9c8187bd199794f71480678b04101fc50242f701f228051efa0c4af4ca7242 +size 736 diff --git a/18/ll_model_510.pth b/18/ll_model_510.pth index 75d1404eecac136bfea503ce303b2f6226dec337..089a9f8d4a693452716ed820f5d42aa93157257b 100644 Binary files a/18/ll_model_510.pth and b/18/ll_model_510.pth differ diff --git a/18/ll_model_cfg_510.pkl b/18/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..eac2d5c57c52a4c27e3095bc737654392afb5d7d --- /dev/null +++ b/18/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c2266bcf169741580719d23b7bd184c98584fe9da1135ee01cbf8fd882671e +size 1047 diff --git a/18/meta_510.json b/18/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..98109671e5a6b3f53885349ce21c255c167e7a0f --- /dev/null +++ b/18/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "strict_18", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/19/edges.pkl b/19/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..d3e3fd2a2631ce8f1bf456251850710759a884df --- /dev/null +++ b/19/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b58d652c3784ce091344dc94cfb718e59bca64d317835ed9bf45c48b08a637 +size 1230 diff --git a/19/ll_model_510.pth b/19/ll_model_510.pth index 503dd62d48b4a6af302017c6f4962e69aecec0cc..8bd928495a37246dc5865e8edeb997d8cb30b009 100644 Binary files a/19/ll_model_510.pth and b/19/ll_model_510.pth differ diff --git a/19/ll_model_cfg_510.pkl b/19/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..3fe48ed920f4a7a7955fdfbb6f2bdfb539dfbe79 --- /dev/null +++ b/19/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7cf21b18f4d89acee932d53fa4850ac823391a9e6803aa1d2df33407737510 +size 1040 diff --git a/19/meta_510.json b/19/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..11d0c3837141a67b3c8f62697c19b82e16451f17 --- /dev/null +++ b/19/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "strict_19", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/20/edges.pkl b/20/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..afec1008cb46b8b77e5433338f9863cd9c983c4d --- /dev/null +++ b/20/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8c3a044fb135347b1f6fb64152424b1855dfad64220ad6e239930731444dc8 +size 629 diff --git a/20/ll_model_1110.pth b/20/ll_model_1110.pth new file mode 100644 index 0000000000000000000000000000000000000000..e0728474952c7b11abf2a79e63ef92afc3a1a8d8 --- /dev/null +++ b/20/ll_model_1110.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b717f63cb722db507ee0b9f70a3ce460570bfb4ad742623011e62116987fd7 +size 14606 diff --git a/20/ll_model_cfg_1110.pkl b/20/ll_model_cfg_1110.pkl new file mode 100644 index 0000000000000000000000000000000000000000..7d87bef9fcdb600f545ffa636544da00ab952ba4 --- /dev/null +++ b/20/ll_model_cfg_1110.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af8a6a6a8cfb880cd1e09bc5a85038a1fefe4e0df798fafb9a27b9ca151e1d57 +size 1041 diff --git a/20/meta_1110.json b/20/meta_1110.json new file mode 100644 index 0000000000000000000000000000000000000000..c1840931c3a68496de65069c9ac9e757a3e823fe --- /dev/null +++ b/20/meta_1110.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 1.0, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "", "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/21/edges.pkl b/21/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0b9511390bf9a198513936d11362892a03d0e15b --- /dev/null +++ b/21/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382209935cbde69e8b7e7317a5e63b7e2de4fb0c3d975635be1e6815873fc1a5 +size 1595 diff --git a/21/ll_model_510.pth b/21/ll_model_510.pth index 78c2b16e58212a59bf1f90d263fbdc8cb0df8333..86dac5ace71131f8478fe8b05d8d05a3585e359b 100644 Binary files a/21/ll_model_510.pth and b/21/ll_model_510.pth differ diff --git a/21/ll_model_cfg_510.pkl b/21/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..fb0a8b365bae2adeec5a7fa00d08f46bdf7f4074 --- /dev/null +++ b/21/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac1e41b37b7e5e1354f89f226df13dfaa8fdceedb2d2b9e26231f5769855ae4 +size 1040 diff --git a/21/meta_510.json b/21/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..cfcdd78dbd2ef7375a6ca6232807e37a402fc35a --- /dev/null +++ b/21/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.01, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 500, "act_fn": "gelu", "wandb_suffix": "strict_21", "device": "cpu", "clip_grad_norm": 1.0, "lr_scheduler": ""} \ No newline at end of file diff --git a/24/edges.pkl b/24/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..339e83139b4af1c4f2b06382a313109df20152a0 --- /dev/null +++ b/24/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794d7a5a17d8f624af70616b787a9f03c9fdb751b0eb6b00e65e79cb3f1fc211 +size 1108 diff --git a/24/ll_model_510.pth b/24/ll_model_510.pth index 78c2b16e58212a59bf1f90d263fbdc8cb0df8333..86dac5ace71131f8478fe8b05d8d05a3585e359b 100644 Binary files a/24/ll_model_510.pth and b/24/ll_model_510.pth differ diff --git a/24/ll_model_cfg_510.pkl b/24/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..fb0a8b365bae2adeec5a7fa00d08f46bdf7f4074 --- /dev/null +++ b/24/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac1e41b37b7e5e1354f89f226df13dfaa8fdceedb2d2b9e26231f5769855ae4 +size 1040 diff --git a/24/meta_510.json b/24/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..47a6d3fa74c9c0b5a7e650ddcf84f99d7dcabf33 --- /dev/null +++ b/24/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.01, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 500, "act_fn": "gelu", "wandb_suffix": "strict_24", "device": "cpu", "clip_grad_norm": 1.0, "lr_scheduler": ""} \ No newline at end of file diff --git a/3/edges.pkl b/3/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..692b7b3f255622fdda579fd1229a8fc96f4f7d60 --- /dev/null +++ b/3/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95873ed61952d15383e2d51dfadf759f8fa6eb4618570c9793bdc41fbad0e115 +size 1722 diff --git a/3/ll_model_10110.pth b/3/ll_model_10110.pth new file mode 100644 index 0000000000000000000000000000000000000000..83a5159b411bdd736623b9542de488b859716070 --- /dev/null +++ b/3/ll_model_10110.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c9b5c4e22613f30de503e6f4add5dac18ab0a947e441bfc96d36238944721b9 +size 26738 diff --git a/3/ll_model_510.pth b/3/ll_model_510.pth deleted file mode 100644 index a8e25c151f838ed02c9a53b33d162ad028c1df32..0000000000000000000000000000000000000000 Binary files a/3/ll_model_510.pth and /dev/null differ diff --git a/3/ll_model_cfg_10110.pkl b/3/ll_model_cfg_10110.pkl new file mode 100644 index 0000000000000000000000000000000000000000..44560c5414721d40812cd2b93be931937927780f --- /dev/null +++ b/3/ll_model_cfg_10110.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:568ced292068db1d0969dd8000cc9c44def563bdc7586757f1dc5b981f913936 +size 1040 diff --git a/3/meta_10110.json b/3/meta_10110.json new file mode 100644 index 0000000000000000000000000000000000000000..0b0d69e982dcc8bf213630648ac532427fa51a29 --- /dev/null +++ b/3/meta_10110.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 10.0, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/33/edges.pkl b/33/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..afec1008cb46b8b77e5433338f9863cd9c983c4d --- /dev/null +++ b/33/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8c3a044fb135347b1f6fb64152424b1855dfad64220ad6e239930731444dc8 +size 629 diff --git a/33/ll_model_510.pth b/33/ll_model_510.pth index 4c89a5fdc6881630ffdb5f6476522698830e1009..d45b5289f4f8311eae08fdc53dbafb39472398de 100644 Binary files a/33/ll_model_510.pth and b/33/ll_model_510.pth differ diff --git a/33/ll_model_cfg_510.pkl b/33/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..25c418702cc979923ff5f9bd8fe49e62de5f9536 --- /dev/null +++ b/33/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:552f3270651c907ede2338d58c36747ed12723e58dd8c622e608db76658532a1 +size 1040 diff --git a/33/meta_510.json b/33/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..4230f95c50acd9549ef1d74b5cba5afa28257c88 --- /dev/null +++ b/33/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "strict_33", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/34/edges.pkl b/34/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..afec1008cb46b8b77e5433338f9863cd9c983c4d --- /dev/null +++ b/34/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8c3a044fb135347b1f6fb64152424b1855dfad64220ad6e239930731444dc8 +size 629 diff --git a/34/ll_model_510.pth b/34/ll_model_510.pth index 80ce8c30203d8c0518ce42ef892723461c4e8151..7a1bfefa2e51e1bc1504d3c628e74752acbc796d 100644 Binary files a/34/ll_model_510.pth and b/34/ll_model_510.pth differ diff --git a/34/ll_model_cfg_510.pkl b/34/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..776bf4c43ffe8179c54b8b7b74330d382fd05d7b --- /dev/null +++ b/34/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517cbd2d3ebe0747291d8e2c5b8bee0a4be38e1b3aec3eba48ac10cd10132a6e +size 1040 diff --git a/34/meta_510.json b/34/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..af431510517446fb8b394cd433395cacd76fe09a --- /dev/null +++ b/34/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "strict_34", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/35/edges.pkl b/35/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..afec1008cb46b8b77e5433338f9863cd9c983c4d --- /dev/null +++ b/35/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8c3a044fb135347b1f6fb64152424b1855dfad64220ad6e239930731444dc8 +size 629 diff --git a/35/ll_model_510.pth b/35/ll_model_510.pth index 34f33fa3d8942550e810a55f05728e608a430fb1..9c8010462aeb1efb6b56eead0cd2bbd64fc047f9 100644 Binary files a/35/ll_model_510.pth and b/35/ll_model_510.pth differ diff --git a/35/ll_model_cfg_510.pkl b/35/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..c20567fb8e91d7cac0d0687fb9f8d7a068da97f3 --- /dev/null +++ b/35/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c5e8f452511eaea1cd87534c033ee32cd7871f4f2d0224198aef72d76f6c55 +size 1040 diff --git a/35/meta_510.json b/35/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..fdef49b28114562ca5bbef4ab719664f506188e0 --- /dev/null +++ b/35/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "strict_35", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/36/edges.pkl b/36/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..afec1008cb46b8b77e5433338f9863cd9c983c4d --- /dev/null +++ b/36/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8c3a044fb135347b1f6fb64152424b1855dfad64220ad6e239930731444dc8 +size 629 diff --git a/36/ll_model_10110.pth b/36/ll_model_10110.pth new file mode 100644 index 0000000000000000000000000000000000000000..e897facf848e2967cd1f6145c996215a906e4d49 --- /dev/null +++ b/36/ll_model_10110.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d048ade987609a03c14c6d8c6b7d973546f6433daaae0315fda57450efb4269a +size 14514 diff --git a/36/ll_model_510.pth b/36/ll_model_510.pth deleted file mode 100644 index 9fe531e93411a6adf172fbb1e4c0c83633c5537a..0000000000000000000000000000000000000000 Binary files a/36/ll_model_510.pth and /dev/null differ diff --git a/36/ll_model_cfg_10110.pkl b/36/ll_model_cfg_10110.pkl new file mode 100644 index 0000000000000000000000000000000000000000..741f0d01a16d62576acf308c01ed94ed0bb899bd --- /dev/null +++ b/36/ll_model_cfg_10110.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a4668c6c0100f39a7b25f5317971516202f0eb028643e9d89cb23c959eacd7 +size 1041 diff --git a/36/meta_10110.json b/36/meta_10110.json new file mode 100644 index 0000000000000000000000000000000000000000..f74fc38a4310e739e7912e52ff067e2b233c0ba1 --- /dev/null +++ b/36/meta_10110.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 10.0, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "", "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/37/edges.pkl b/37/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..afec1008cb46b8b77e5433338f9863cd9c983c4d --- /dev/null +++ b/37/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8c3a044fb135347b1f6fb64152424b1855dfad64220ad6e239930731444dc8 +size 629 diff --git a/37/ll_model_510.pth b/37/ll_model_510.pth index 31c05e29ca869f09904a1341cd4eeb0a25bcdbd4..3cbdada917b37a407eb3ab0008e5341feb8eb4b8 100644 Binary files a/37/ll_model_510.pth and b/37/ll_model_510.pth differ diff --git a/37/ll_model_cfg_510.pkl b/37/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..c20567fb8e91d7cac0d0687fb9f8d7a068da97f3 --- /dev/null +++ b/37/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c5e8f452511eaea1cd87534c033ee32cd7871f4f2d0224198aef72d76f6c55 +size 1040 diff --git a/37/meta_510.json b/37/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..f77b33b7eb7f5a9733f2176c9a0b8341c838da12 --- /dev/null +++ b/37/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "strict_37", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/38/edges.pkl b/38/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..77513f4611eed1b5302d422e25853647e4ea7ae2 --- /dev/null +++ b/38/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71db99d1f02016dbeb19f31dd153dbd9868d9569e8434b8729f5730a058b874 +size 1829 diff --git a/38/ll_model_510.pth b/38/ll_model_510.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ae7b45c1829dd4c4b58971b8e9adf0bec81e17d --- /dev/null +++ b/38/ll_model_510.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c191468c30f7a194a00f7f29c1ddb8e1f87ff2d7a9b022314de660362da3723 +size 53098 diff --git a/38/ll_model_cfg_510.pkl b/38/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..fac63d7625559c74eab26439b2f5c8e7b812cfe7 --- /dev/null +++ b/38/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7bc85e2ec5253d130f1ef79fa059f4b9af6c5fb040eee0239ab663f2035d9cc +size 1040 diff --git a/38/meta_510.json b/38/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..78d58d5b5c18aaea18e9c1beb433cdcc09e3b5db --- /dev/null +++ b/38/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "strict_38", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/4/edges.pkl b/4/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..1ef023aa4101a1efe82af28ff3ea55056a5c5bb7 --- /dev/null +++ b/4/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6784ca89791141f4cc128c6604f9613ace7110e6e78806998fee7498354d91 +size 1829 diff --git a/4/ll_model_510.pth b/4/ll_model_510.pth index 00c7662104122c25f270ad5a28e9b6026748752e..b2ba3e628ac7d663bd9e3cb7612d947b6e3dcf48 100644 Binary files a/4/ll_model_510.pth and b/4/ll_model_510.pth differ diff --git a/4/ll_model_cfg_510.pkl b/4/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..dbe508a8aa17e3012f66c0afd7d6ec118f740720 --- /dev/null +++ b/4/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea875b100ba7c7d262e7b387c4f9fae70d2581aeb09ae768977cc54972a9c12 +size 1040 diff --git a/4/meta_510.json b/4/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..fe714a5527187396113395b836086dd9c3acf9a9 --- /dev/null +++ b/4/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.001, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 2000, "act_fn": "gelu", "wandb_suffix": "strict_4", "device": "cpu", "clip_grad_norm": 0.1, "lr_scheduler": ""} \ No newline at end of file diff --git a/7/ll_model_510.pth b/7/ll_model_510.pth deleted file mode 100644 index 4ddfecdcc43dcca4667add223005ba9e9b8f7f2a..0000000000000000000000000000000000000000 Binary files a/7/ll_model_510.pth and /dev/null differ diff --git a/8/edges.pkl b/8/edges.pkl new file mode 100644 index 0000000000000000000000000000000000000000..d3e3fd2a2631ce8f1bf456251850710759a884df --- /dev/null +++ b/8/edges.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b58d652c3784ce091344dc94cfb718e59bca64d317835ed9bf45c48b08a637 +size 1230 diff --git a/8/ll_model_510.pth b/8/ll_model_510.pth index b1bb3f3dea313e4504794bfa997ae47cdaa6dd66..ae782c349a46ed3e801410f0dc694c6b9f681fa3 100644 Binary files a/8/ll_model_510.pth and b/8/ll_model_510.pth differ diff --git a/8/ll_model_cfg_510.pkl b/8/ll_model_cfg_510.pkl new file mode 100644 index 0000000000000000000000000000000000000000..5fbf50158370039e993f7f5e3127a9f8fe6d7039 --- /dev/null +++ b/8/ll_model_cfg_510.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26ed2380d55b0c6dc018ccdd4211050bb616baabf64ed1ff67e0f03027af3133 +size 1040 diff --git a/8/meta_510.json b/8/meta_510.json new file mode 100644 index 0000000000000000000000000000000000000000..61a44a7321a65718923a662c80a8b0e386bbcba2 --- /dev/null +++ b/8/meta_510.json @@ -0,0 +1 @@ +{"atol": 0.05, "lr": 0.01, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4, "epochs": 500, "act_fn": "gelu", "wandb_suffix": "strict_8", "device": "cpu", "clip_grad_norm": 1.0, "lr_scheduler": ""} \ No newline at end of file diff --git a/ioi_next_token/corr_100_100_40.json b/ioi_next_token/corr_100_100_40.json new file mode 100644 index 0000000000000000000000000000000000000000..ecc5891c87b06b4dbec09e59eac915a2cefc8adf --- /dev/null +++ b/ioi_next_token/corr_100_100_40.json @@ -0,0 +1 @@ +{"hook_duplicate": ["blocks.0.attn.hook_z"], "hook_s_inhibition": ["blocks.2.attn.hook_z"], "hook_name_mover": ["blocks.4.attn.hook_z"]} \ No newline at end of file diff --git a/ioi_next_token/ll_model_100_100_40.pth b/ioi_next_token/ll_model_100_100_40.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f5a3470601606413b7e7be51f88bb677bd2e04e --- /dev/null +++ b/ioi_next_token/ll_model_100_100_40.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8136b3d842ffbcaef9771ebb6fde4274e95dba2a44230eab474c8212703e6300 +size 42432926 diff --git a/ioi_next_token/results_100_100_40/training_args.json b/ioi_next_token/results_100_100_40/training_args.json new file mode 100644 index 0000000000000000000000000000000000000000..54cf8269001d612b29735709737da47dd0ce45fa --- /dev/null +++ b/ioi_next_token/results_100_100_40/training_args.json @@ -0,0 +1 @@ +{"next_token": true, "non_ioi_thresh": 0.65, "use_per_token_check": false, "batch_size": 256, "lr": 0.001, "num_workers": 0, "early_stop": true, "lr_scheduler": null, "scheduler_val_metric": ["val/accuracy", "val/IIA"], "scheduler_mode": "max", "clip_grad_norm": 1.0, "atol": 0.05, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4} \ No newline at end of file