elephantmipt
committed on
Upload BatchTopKSAE
Browse files
- config.json +4 -1
- model.safetensors +2 -2
config.json
CHANGED
@@ -1,6 +1,8 @@
|
|
1 |
{
|
2 |
-
"_attn_implementation_autoset": true,
|
3 |
"act_size": 64,
|
|
|
|
|
|
|
4 |
"aux_penalty": 0.03125,
|
5 |
"bandwidth": 0.001,
|
6 |
"dict_size": 128,
|
@@ -16,5 +18,6 @@
|
|
16 |
"sae_type": "batchtopk",
|
17 |
"top_k": 8,
|
18 |
"top_k_aux": 512,
|
|
|
19 |
"transformers_version": "4.46.3"
|
20 |
}
|
|
|
1 |
{
|
|
|
2 |
"act_size": 64,
|
3 |
+
"architectures": [
|
4 |
+
"BatchTopKSAE"
|
5 |
+
],
|
6 |
"aux_penalty": 0.03125,
|
7 |
"bandwidth": 0.001,
|
8 |
"dict_size": 128,
|
|
|
18 |
"sae_type": "batchtopk",
|
19 |
"top_k": 8,
|
20 |
"top_k_aux": 512,
|
21 |
+
"torch_dtype": "float32",
|
22 |
"transformers_version": "4.46.3"
|
23 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8002fc24bb63c0f394215354f0f2dde5982523c6e63822358d9a9e59fec71f01
|
3 |
+
size 66616
|