Add files using upload-large-folder tool
Browse files- transcoder_all/layer_43_width_16k_l0_big/config.json +10 -0
- transcoder_all/layer_43_width_16k_l0_big/params.safetensors +3 -0
- transcoder_all/layer_43_width_16k_l0_small/config.json +10 -0
- transcoder_all/layer_43_width_16k_l0_small/params.safetensors +3 -0
- transcoder_all/layer_4_width_16k_l0_big/config.json +10 -0
- transcoder_all/layer_4_width_16k_l0_big/params.safetensors +3 -0
- transcoder_all/layer_4_width_16k_l0_small/config.json +10 -0
- transcoder_all/layer_4_width_16k_l0_small/params.safetensors +3 -0
- transcoder_all/layer_5_width_16k_l0_small/config.json +10 -0
- transcoder_all/layer_5_width_16k_l0_small/params.safetensors +3 -0
transcoder_all/layer_43_width_16k_l0_big/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 16384,
|
| 5 |
+
"model_name": "google/gemma-3-27b-pt",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 120,
|
| 8 |
+
"affine_connection": false,
|
| 9 |
+
"type": "transcoder"
|
| 10 |
+
}
|
transcoder_all/layer_43_width_16k_l0_big/params.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52a709bd764529706f991e626f003f1a5cd088912921570d62cc6b69c5e197f9
|
| 3 |
+
size 704796032
|
transcoder_all/layer_43_width_16k_l0_small/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 16384,
|
| 5 |
+
"model_name": "google/gemma-3-27b-pt",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 20,
|
| 8 |
+
"affine_connection": false,
|
| 9 |
+
"type": "transcoder"
|
| 10 |
+
}
|
transcoder_all/layer_43_width_16k_l0_small/params.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d672faadc475d95c5950d86e8be7086c7d55a66e1b896ff59046054a15aede61
|
| 3 |
+
size 704796032
|
transcoder_all/layer_4_width_16k_l0_big/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 16384,
|
| 5 |
+
"model_name": "google/gemma-3-27b-pt",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 71,
|
| 8 |
+
"affine_connection": false,
|
| 9 |
+
"type": "transcoder"
|
| 10 |
+
}
|
transcoder_all/layer_4_width_16k_l0_big/params.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b03390c32ceb755d5ad9eb9aea9d01b965196073c3bd728b753f89c7df9d528e
|
| 3 |
+
size 704796032
|
transcoder_all/layer_4_width_16k_l0_small/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 16384,
|
| 5 |
+
"model_name": "google/gemma-3-27b-pt",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 11,
|
| 8 |
+
"affine_connection": false,
|
| 9 |
+
"type": "transcoder"
|
| 10 |
+
}
|
transcoder_all/layer_4_width_16k_l0_small/params.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cf488368522ebc47bf73d9862ddfd17211774a275f9e18d29950c12992811c6
|
| 3 |
+
size 704796032
|
transcoder_all/layer_5_width_16k_l0_small/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 16384,
|
| 5 |
+
"model_name": "google/gemma-3-27b-pt",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 12,
|
| 8 |
+
"affine_connection": false,
|
| 9 |
+
"type": "transcoder"
|
| 10 |
+
}
|
transcoder_all/layer_5_width_16k_l0_small/params.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29e6f8607a900534b2573e2ae5ce70006d519db4caa0dc74cb9ba0173551c5d9
|
| 3 |
+
size 704796032
|