chanind commited on
Commit
4cd1e1e
·
verified ·
1 Parent(s): 8374090

Upload absorption/gemma-2-2b-res-snap-matryoshka-dc_blocks.17.hook_resid_post_eval_results.json with huggingface_hub

Browse files
absorption/gemma-2-2b-res-snap-matryoshka-dc_blocks.17.hook_resid_post_eval_results.json ADDED
@@ -0,0 +1,275 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eval_type_id": "absorption_first_letter",
3
+ "eval_config": {
4
+ "model_name": "gemma-2-2b",
5
+ "random_seed": 42,
6
+ "f1_jump_threshold": 0.03,
7
+ "max_k_value": 10,
8
+ "prompt_template": "{word} has the first letter:",
9
+ "prompt_token_pos": -6,
10
+ "llm_batch_size": 32,
11
+ "llm_dtype": "bfloat16",
12
+ "k_sparse_probe_l1_decay": 0.01,
13
+ "k_sparse_probe_batch_size": 4096,
14
+ "k_sparse_probe_num_epochs": 50,
15
+ "min_GT_probe_f1": 0.6,
16
+ "min_feats_for_eval": 20
17
+ },
18
+ "eval_id": "7dac3d47-5282-48db-a705-23f393c4c7d6",
19
+ "datetime_epoch_millis": 1745731323773,
20
+ "eval_result_metrics": {
21
+ "mean": {
22
+ "mean_absorption_fraction_score": 0.09190284658267972,
23
+ "mean_full_absorption_score": 0.07636835724538374,
24
+ "mean_num_split_features": 1.3076923076923077,
25
+ "std_dev_absorption_fraction_score": 0.14571296351546223,
26
+ "std_dev_full_absorption_score": 0.13893384441642123,
27
+ "std_dev_num_split_features": 0.6176879969195301
28
+ }
29
+ },
30
+ "eval_result_details": [
31
+ {
32
+ "first_letter": "a",
33
+ "mean_absorption_fraction": 0.31956071410316983,
34
+ "full_absorption_rate": 0.2877503852080123,
35
+ "num_full_absorption": 747,
36
+ "num_probe_true_positives": 2596,
37
+ "num_split_features": 2
38
+ },
39
+ {
40
+ "first_letter": "b",
41
+ "mean_absorption_fraction": 0.04449745477504374,
42
+ "full_absorption_rate": 0.023646546359676415,
43
+ "num_full_absorption": 38,
44
+ "num_probe_true_positives": 1607,
45
+ "num_split_features": 1
46
+ },
47
+ {
48
+ "first_letter": "c",
49
+ "mean_absorption_fraction": 0.589654239145153,
50
+ "full_absorption_rate": 0.5625226531351939,
51
+ "num_full_absorption": 1552,
52
+ "num_probe_true_positives": 2759,
53
+ "num_split_features": 3
54
+ },
55
+ {
56
+ "first_letter": "d",
57
+ "mean_absorption_fraction": 0.001339060755086657,
58
+ "full_absorption_rate": 0.0041841004184100415,
59
+ "num_full_absorption": 7,
60
+ "num_probe_true_positives": 1673,
61
+ "num_split_features": 1
62
+ },
63
+ {
64
+ "first_letter": "e",
65
+ "mean_absorption_fraction": 0.061662389404888496,
66
+ "full_absorption_rate": 0.056214865708931916,
67
+ "num_full_absorption": 90,
68
+ "num_probe_true_positives": 1601,
69
+ "num_split_features": 1
70
+ },
71
+ {
72
+ "first_letter": "f",
73
+ "mean_absorption_fraction": 0.011349852176804556,
74
+ "full_absorption_rate": 0.004273504273504274,
75
+ "num_full_absorption": 5,
76
+ "num_probe_true_positives": 1170,
77
+ "num_split_features": 1
78
+ },
79
+ {
80
+ "first_letter": "g",
81
+ "mean_absorption_fraction": 0.0870451819893666,
82
+ "full_absorption_rate": 0.0546875,
83
+ "num_full_absorption": 63,
84
+ "num_probe_true_positives": 1152,
85
+ "num_split_features": 2
86
+ },
87
+ {
88
+ "first_letter": "h",
89
+ "mean_absorption_fraction": 0.0381254421552879,
90
+ "full_absorption_rate": 0.014395393474088292,
91
+ "num_full_absorption": 15,
92
+ "num_probe_true_positives": 1042,
93
+ "num_split_features": 1
94
+ },
95
+ {
96
+ "first_letter": "i",
97
+ "mean_absorption_fraction": 0.00724038034143389,
98
+ "full_absorption_rate": 0.012330456226880395,
99
+ "num_full_absorption": 20,
100
+ "num_probe_true_positives": 1622,
101
+ "num_split_features": 1
102
+ },
103
+ {
104
+ "first_letter": "j",
105
+ "mean_absorption_fraction": 0.0060390200128819125,
106
+ "full_absorption_rate": 0.0022675736961451248,
107
+ "num_full_absorption": 1,
108
+ "num_probe_true_positives": 441,
109
+ "num_split_features": 1
110
+ },
111
+ {
112
+ "first_letter": "k",
113
+ "mean_absorption_fraction": 0.014336384996811618,
114
+ "full_absorption_rate": 0.01088646967340591,
115
+ "num_full_absorption": 7,
116
+ "num_probe_true_positives": 643,
117
+ "num_split_features": 1
118
+ },
119
+ {
120
+ "first_letter": "l",
121
+ "mean_absorption_fraction": 0.029794771860448033,
122
+ "full_absorption_rate": 0.022764227642276424,
123
+ "num_full_absorption": 28,
124
+ "num_probe_true_positives": 1230,
125
+ "num_split_features": 1
126
+ },
127
+ {
128
+ "first_letter": "m",
129
+ "mean_absorption_fraction": 0.16111525953558284,
130
+ "full_absorption_rate": 0.1074792243767313,
131
+ "num_full_absorption": 194,
132
+ "num_probe_true_positives": 1805,
133
+ "num_split_features": 1
134
+ },
135
+ {
136
+ "first_letter": "n",
137
+ "mean_absorption_fraction": 0.09544210944678017,
138
+ "full_absorption_rate": 0.0640096618357488,
139
+ "num_full_absorption": 53,
140
+ "num_probe_true_positives": 828,
141
+ "num_split_features": 1
142
+ },
143
+ {
144
+ "first_letter": "o",
145
+ "mean_absorption_fraction": 0.3065232988881943,
146
+ "full_absorption_rate": 0.2209188660801564,
147
+ "num_full_absorption": 226,
148
+ "num_probe_true_positives": 1023,
149
+ "num_split_features": 1
150
+ },
151
+ {
152
+ "first_letter": "p",
153
+ "mean_absorption_fraction": 0.00870559114530204,
154
+ "full_absorption_rate": 0.003036876355748373,
155
+ "num_full_absorption": 7,
156
+ "num_probe_true_positives": 2305,
157
+ "num_split_features": 1
158
+ },
159
+ {
160
+ "first_letter": "q",
161
+ "mean_absorption_fraction": 0.002457081995669703,
162
+ "full_absorption_rate": 0.0055248618784530384,
163
+ "num_full_absorption": 1,
164
+ "num_probe_true_positives": 181,
165
+ "num_split_features": 1
166
+ },
167
+ {
168
+ "first_letter": "r",
169
+ "mean_absorption_fraction": 0.0009763400503572069,
170
+ "full_absorption_rate": 0.001851851851851852,
171
+ "num_full_absorption": 3,
172
+ "num_probe_true_positives": 1620,
173
+ "num_split_features": 1
174
+ },
175
+ {
176
+ "first_letter": "s",
177
+ "mean_absorption_fraction": 0.37384705903782756,
178
+ "full_absorption_rate": 0.3992857142857143,
179
+ "num_full_absorption": 1118,
180
+ "num_probe_true_positives": 2800,
181
+ "num_split_features": 1
182
+ },
183
+ {
184
+ "first_letter": "t",
185
+ "mean_absorption_fraction": 0.002104050395839018,
186
+ "full_absorption_rate": 0.002335084646818447,
187
+ "num_full_absorption": 4,
188
+ "num_probe_true_positives": 1713,
189
+ "num_split_features": 1
190
+ },
191
+ {
192
+ "first_letter": "u",
193
+ "mean_absorption_fraction": 0.07293505307107637,
194
+ "full_absorption_rate": 0.03595206391478029,
195
+ "num_full_absorption": 27,
196
+ "num_probe_true_positives": 751,
197
+ "num_split_features": 2
198
+ },
199
+ {
200
+ "first_letter": "v",
201
+ "mean_absorption_fraction": 0.015528941369840081,
202
+ "full_absorption_rate": 0.013530135301353014,
203
+ "num_full_absorption": 11,
204
+ "num_probe_true_positives": 813,
205
+ "num_split_features": 1
206
+ },
207
+ {
208
+ "first_letter": "w",
209
+ "mean_absorption_fraction": 0.03684412623353439,
210
+ "full_absorption_rate": 0.029275808936825885,
211
+ "num_full_absorption": 19,
212
+ "num_probe_true_positives": 649,
213
+ "num_split_features": 1
214
+ },
215
+ {
216
+ "first_letter": "x",
217
+ "mean_absorption_fraction": 0.007447853326184163,
218
+ "full_absorption_rate": 0.010638297872340425,
219
+ "num_full_absorption": 1,
220
+ "num_probe_true_positives": 94,
221
+ "num_split_features": 3
222
+ },
223
+ {
224
+ "first_letter": "y",
225
+ "mean_absorption_fraction": 0.09283834515963053,
226
+ "full_absorption_rate": 0.027972027972027972,
227
+ "num_full_absorption": 4,
228
+ "num_probe_true_positives": 143,
229
+ "num_split_features": 1
230
+ },
231
+ {
232
+ "first_letter": "z",
233
+ "mean_absorption_fraction": 0.0020640097774781985,
234
+ "full_absorption_rate": 0.00784313725490196,
235
+ "num_full_absorption": 2,
236
+ "num_probe_true_positives": 255,
237
+ "num_split_features": 2
238
+ }
239
+ ],
240
+ "sae_bench_commit_hash": "Unknown",
241
+ "sae_lens_id": "blocks.17.hook_resid_post",
242
+ "sae_lens_release_id": "gemma-2-2b-res-snap-matryoshka-dc",
243
+ "sae_lens_version": "5.9.1",
244
+ "sae_cfg_dict": {
245
+ "architecture": "jumprelu",
246
+ "d_in": 2304,
247
+ "d_sae": 32768,
248
+ "activation_fn_str": "relu",
249
+ "apply_b_dec_to_input": true,
250
+ "finetuning_scaling_factor": false,
251
+ "context_size": 1024,
252
+ "model_name": "gemma-2-2b",
253
+ "hook_name": "blocks.17.hook_resid_post",
254
+ "hook_layer": 17,
255
+ "hook_head_index": null,
256
+ "prepend_bos": true,
257
+ "dataset_path": "chanind/pile-uncopyrighted-gemma-1024-abbrv-1B",
258
+ "dataset_trust_remote_code": true,
259
+ "normalize_activations": "none",
260
+ "dtype": "torch.bfloat16",
261
+ "device": "cuda",
262
+ "sae_lens_training_version": "5.5.1",
263
+ "activation_fn_kwargs": {
264
+ "k": 40
265
+ },
266
+ "neuronpedia_id": null,
267
+ "model_from_pretrained_kwargs": {
268
+ "center_writing_weights": false
269
+ },
270
+ "seqpos_slice": [
271
+ null
272
+ ]
273
+ },
274
+ "eval_result_unstructured": null
275
+ }