chanind commited on
Commit
8c89fd3
·
verified ·
1 Parent(s): 82b74bb

Upload tpp/gemma-2-2b-res-matryoshka-dc_blocks.22.hook_resid_post_eval_results.json with huggingface_hub

Browse files
tpp/gemma-2-2b-res-matryoshka-dc_blocks.22.hook_resid_post_eval_results.json ADDED
@@ -0,0 +1,419 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eval_type_id": "tpp",
3
+ "eval_config": {
4
+ "random_seed": 42,
5
+ "dataset_names": [
6
+ "LabHC/bias_in_bios_class_set1",
7
+ "canrager/amazon_reviews_mcauley_1and5"
8
+ ],
9
+ "perform_scr": false,
10
+ "early_stopping_patience": 20,
11
+ "train_set_size": 4000,
12
+ "test_set_size": 1000,
13
+ "context_length": 128,
14
+ "probe_train_batch_size": 16,
15
+ "probe_test_batch_size": 500,
16
+ "probe_epochs": 20,
17
+ "probe_lr": 0.001,
18
+ "probe_l1_penalty": 0.001,
19
+ "sae_batch_size": 125,
20
+ "llm_batch_size": 32,
21
+ "llm_dtype": "bfloat16",
22
+ "lower_vram_usage": false,
23
+ "model_name": "gemma-2-2b",
24
+ "n_values": [
25
+ 2,
26
+ 5,
27
+ 10,
28
+ 20,
29
+ 50,
30
+ 100,
31
+ 500
32
+ ],
33
+ "column1_vals_lookup": {
34
+ "LabHC/bias_in_bios_class_set1": [
35
+ [
36
+ "professor",
37
+ "nurse"
38
+ ],
39
+ [
40
+ "architect",
41
+ "journalist"
42
+ ],
43
+ [
44
+ "surgeon",
45
+ "psychologist"
46
+ ],
47
+ [
48
+ "attorney",
49
+ "teacher"
50
+ ]
51
+ ],
52
+ "canrager/amazon_reviews_mcauley_1and5": [
53
+ [
54
+ "Books",
55
+ "CDs_and_Vinyl"
56
+ ],
57
+ [
58
+ "Software",
59
+ "Electronics"
60
+ ],
61
+ [
62
+ "Pet_Supplies",
63
+ "Office_Products"
64
+ ],
65
+ [
66
+ "Industrial_and_Scientific",
67
+ "Toys_and_Games"
68
+ ]
69
+ ]
70
+ }
71
+ },
72
+ "eval_id": "91ffb92c-ec01-47b1-9f45-773ec12047b3",
73
+ "datetime_epoch_millis": 1745753034069,
74
+ "eval_result_metrics": {
75
+ "tpp_metrics": {
76
+ "tpp_threshold_2_total_metric": 0.08222500383853912,
77
+ "tpp_threshold_2_intended_diff_only": 0.10360000729560853,
78
+ "tpp_threshold_2_unintended_diff_only": 0.021375003457069396,
79
+ "tpp_threshold_5_total_metric": 0.1544000029563904,
80
+ "tpp_threshold_5_intended_diff_only": 0.20190001130104065,
81
+ "tpp_threshold_5_unintended_diff_only": 0.04750000834465027,
82
+ "tpp_threshold_10_total_metric": 0.19292501509189605,
83
+ "tpp_threshold_10_intended_diff_only": 0.2709000170230865,
84
+ "tpp_threshold_10_unintended_diff_only": 0.07797500193119049,
85
+ "tpp_threshold_20_total_metric": 0.21047500669956207,
86
+ "tpp_threshold_20_intended_diff_only": 0.3226000189781189,
87
+ "tpp_threshold_20_unintended_diff_only": 0.11212501227855681,
88
+ "tpp_threshold_50_total_metric": 0.23550001978874208,
89
+ "tpp_threshold_50_intended_diff_only": 0.3938000321388245,
90
+ "tpp_threshold_50_unintended_diff_only": 0.1583000123500824,
91
+ "tpp_threshold_100_total_metric": 0.24435001164674758,
92
+ "tpp_threshold_100_intended_diff_only": 0.42770002484321595,
93
+ "tpp_threshold_100_unintended_diff_only": 0.18335001319646835,
94
+ "tpp_threshold_500_total_metric": 0.21707503199577333,
95
+ "tpp_threshold_500_intended_diff_only": 0.4481000483036041,
96
+ "tpp_threshold_500_unintended_diff_only": 0.23102501630783082
97
+ }
98
+ },
99
+ "eval_result_details": [
100
+ {
101
+ "dataset_name": "LabHC/bias_in_bios_class_set1_tpp_results",
102
+ "tpp_threshold_2_total_metric": 0.12585000693798065,
103
+ "tpp_threshold_2_intended_diff_only": 0.15860000848770142,
104
+ "tpp_threshold_2_unintended_diff_only": 0.03275000154972076,
105
+ "tpp_threshold_5_total_metric": 0.22060000598430635,
106
+ "tpp_threshold_5_intended_diff_only": 0.301800012588501,
107
+ "tpp_threshold_5_unintended_diff_only": 0.08120000660419464,
108
+ "tpp_threshold_10_total_metric": 0.25145002007484435,
109
+ "tpp_threshold_10_intended_diff_only": 0.38740001916885375,
110
+ "tpp_threshold_10_unintended_diff_only": 0.1359499990940094,
111
+ "tpp_threshold_20_total_metric": 0.22910001277923583,
112
+ "tpp_threshold_20_intended_diff_only": 0.42680002450942994,
113
+ "tpp_threshold_20_unintended_diff_only": 0.19770001173019408,
114
+ "tpp_threshold_50_total_metric": 0.17535001635551453,
115
+ "tpp_threshold_50_intended_diff_only": 0.45800002813339236,
116
+ "tpp_threshold_50_unintended_diff_only": 0.2826500117778778,
117
+ "tpp_threshold_100_total_metric": 0.14299999177455902,
118
+ "tpp_threshold_100_intended_diff_only": 0.4630000114440918,
119
+ "tpp_threshold_100_unintended_diff_only": 0.3200000196695328,
120
+ "tpp_threshold_500_total_metric": 0.08455002903938294,
121
+ "tpp_threshold_500_intended_diff_only": 0.46520004272460935,
122
+ "tpp_threshold_500_unintended_diff_only": 0.38065001368522644
123
+ },
124
+ {
125
+ "dataset_name": "canrager/amazon_reviews_mcauley_1and5_tpp_results",
126
+ "tpp_threshold_2_total_metric": 0.0386000007390976,
127
+ "tpp_threshold_2_intended_diff_only": 0.04860000610351563,
128
+ "tpp_threshold_2_unintended_diff_only": 0.01000000536441803,
129
+ "tpp_threshold_5_total_metric": 0.08819999992847442,
130
+ "tpp_threshold_5_intended_diff_only": 0.10200001001358032,
131
+ "tpp_threshold_5_unintended_diff_only": 0.013800010085105896,
132
+ "tpp_threshold_10_total_metric": 0.13440001010894775,
133
+ "tpp_threshold_10_intended_diff_only": 0.15440001487731933,
134
+ "tpp_threshold_10_unintended_diff_only": 0.020000004768371583,
135
+ "tpp_threshold_20_total_metric": 0.1918500006198883,
136
+ "tpp_threshold_20_intended_diff_only": 0.21840001344680787,
137
+ "tpp_threshold_20_unintended_diff_only": 0.026550012826919555,
138
+ "tpp_threshold_50_total_metric": 0.2956500232219696,
139
+ "tpp_threshold_50_intended_diff_only": 0.3296000361442566,
140
+ "tpp_threshold_50_unintended_diff_only": 0.033950012922286985,
141
+ "tpp_threshold_100_total_metric": 0.34570003151893614,
142
+ "tpp_threshold_100_intended_diff_only": 0.3924000382423401,
143
+ "tpp_threshold_100_unintended_diff_only": 0.04670000672340393,
144
+ "tpp_threshold_500_total_metric": 0.3496000349521637,
145
+ "tpp_threshold_500_intended_diff_only": 0.4310000538825989,
146
+ "tpp_threshold_500_unintended_diff_only": 0.08140001893043518
147
+ }
148
+ ],
149
+ "sae_bench_commit_hash": "Unknown",
150
+ "sae_lens_id": "blocks.22.hook_resid_post",
151
+ "sae_lens_release_id": "gemma-2-2b-res-matryoshka-dc",
152
+ "sae_lens_version": "5.9.1",
153
+ "sae_cfg_dict": {
154
+ "architecture": "jumprelu",
155
+ "d_in": 2304,
156
+ "d_sae": 32768,
157
+ "activation_fn_str": "relu",
158
+ "apply_b_dec_to_input": true,
159
+ "finetuning_scaling_factor": false,
160
+ "context_size": 1024,
161
+ "model_name": "gemma-2-2b",
162
+ "hook_name": "blocks.22.hook_resid_post",
163
+ "hook_layer": 22,
164
+ "hook_head_index": null,
165
+ "prepend_bos": true,
166
+ "dataset_path": "chanind/pile-uncopyrighted-gemma-1024-abbrv-1B",
167
+ "dataset_trust_remote_code": true,
168
+ "normalize_activations": "none",
169
+ "dtype": "torch.bfloat16",
170
+ "device": "cuda",
171
+ "sae_lens_training_version": "5.5.1",
172
+ "activation_fn_kwargs": {
173
+ "k": 40
174
+ },
175
+ "neuronpedia_id": null,
176
+ "model_from_pretrained_kwargs": {
177
+ "center_writing_weights": false
178
+ },
179
+ "seqpos_slice": [
180
+ null
181
+ ]
182
+ },
183
+ "eval_result_unstructured": {
184
+ "LabHC/bias_in_bios_class_set1": {
185
+ "0": {
186
+ "tpp_threshold_2_total_metric": 0.17625002562999725,
187
+ "tpp_threshold_2_intended_diff_only": 0.2160000205039978,
188
+ "tpp_threshold_2_unintended_diff_only": 0.03974999487400055,
189
+ "tpp_threshold_5_total_metric": 0.1834999918937683,
190
+ "tpp_threshold_5_intended_diff_only": 0.2680000066757202,
191
+ "tpp_threshold_5_unintended_diff_only": 0.0845000147819519,
192
+ "tpp_threshold_10_total_metric": 0.19875003397464752,
193
+ "tpp_threshold_10_intended_diff_only": 0.3540000319480896,
194
+ "tpp_threshold_10_unintended_diff_only": 0.15524999797344208,
195
+ "tpp_threshold_20_total_metric": 0.21549999713897705,
196
+ "tpp_threshold_20_intended_diff_only": 0.3970000147819519,
197
+ "tpp_threshold_20_unintended_diff_only": 0.18150001764297485,
198
+ "tpp_threshold_50_total_metric": 0.14375001192092896,
199
+ "tpp_threshold_50_intended_diff_only": 0.42900002002716064,
200
+ "tpp_threshold_50_unintended_diff_only": 0.2852500081062317,
201
+ "tpp_threshold_100_total_metric": 0.11625000834465027,
202
+ "tpp_threshold_100_intended_diff_only": 0.44300001859664917,
203
+ "tpp_threshold_100_unintended_diff_only": 0.3267500102519989,
204
+ "tpp_threshold_500_total_metric": 0.049500033259391785,
205
+ "tpp_threshold_500_intended_diff_only": 0.44600003957748413,
206
+ "tpp_threshold_500_unintended_diff_only": 0.39650000631809235
207
+ },
208
+ "1": {
209
+ "tpp_threshold_2_total_metric": 0.1379999965429306,
210
+ "tpp_threshold_2_intended_diff_only": 0.19900000095367432,
211
+ "tpp_threshold_2_unintended_diff_only": 0.06100000441074371,
212
+ "tpp_threshold_5_total_metric": 0.1539999395608902,
213
+ "tpp_threshold_5_intended_diff_only": 0.2759999632835388,
214
+ "tpp_threshold_5_unintended_diff_only": 0.12200002372264862,
215
+ "tpp_threshold_10_total_metric": 0.17800001800060272,
216
+ "tpp_threshold_10_intended_diff_only": 0.36000001430511475,
217
+ "tpp_threshold_10_unintended_diff_only": 0.18199999630451202,
218
+ "tpp_threshold_20_total_metric": 0.17874999344348907,
219
+ "tpp_threshold_20_intended_diff_only": 0.41600000858306885,
220
+ "tpp_threshold_20_unintended_diff_only": 0.23725001513957977,
221
+ "tpp_threshold_50_total_metric": 0.14650000631809235,
222
+ "tpp_threshold_50_intended_diff_only": 0.4570000171661377,
223
+ "tpp_threshold_50_unintended_diff_only": 0.31050001084804535,
224
+ "tpp_threshold_100_total_metric": 0.1109999418258667,
225
+ "tpp_threshold_100_intended_diff_only": 0.4599999785423279,
226
+ "tpp_threshold_100_unintended_diff_only": 0.3490000367164612,
227
+ "tpp_threshold_500_total_metric": 0.06675000488758087,
228
+ "tpp_threshold_500_intended_diff_only": 0.4610000252723694,
229
+ "tpp_threshold_500_unintended_diff_only": 0.3942500203847885
230
+ },
231
+ "2": {
232
+ "tpp_threshold_2_total_metric": 0.0887499749660492,
233
+ "tpp_threshold_2_intended_diff_only": 0.1029999852180481,
234
+ "tpp_threshold_2_unintended_diff_only": 0.014250010251998901,
235
+ "tpp_threshold_5_total_metric": 0.2912500351667404,
236
+ "tpp_threshold_5_intended_diff_only": 0.34400004148483276,
237
+ "tpp_threshold_5_unintended_diff_only": 0.052750006318092346,
238
+ "tpp_threshold_10_total_metric": 0.2657500356435776,
239
+ "tpp_threshold_10_intended_diff_only": 0.39100003242492676,
240
+ "tpp_threshold_10_unintended_diff_only": 0.12524999678134918,
241
+ "tpp_threshold_20_total_metric": 0.2342500239610672,
242
+ "tpp_threshold_20_intended_diff_only": 0.4190000295639038,
243
+ "tpp_threshold_20_unintended_diff_only": 0.1847500056028366,
244
+ "tpp_threshold_50_total_metric": 0.17375002801418304,
245
+ "tpp_threshold_50_intended_diff_only": 0.44600003957748413,
246
+ "tpp_threshold_50_unintended_diff_only": 0.2722500115633011,
247
+ "tpp_threshold_100_total_metric": 0.14374998211860657,
248
+ "tpp_threshold_100_intended_diff_only": 0.4490000009536743,
249
+ "tpp_threshold_100_unintended_diff_only": 0.30525001883506775,
250
+ "tpp_threshold_500_total_metric": 0.06725002825260162,
251
+ "tpp_threshold_500_intended_diff_only": 0.45500004291534424,
252
+ "tpp_threshold_500_unintended_diff_only": 0.3877500146627426
253
+ },
254
+ "6": {
255
+ "tpp_threshold_2_total_metric": 0.13650000095367432,
256
+ "tpp_threshold_2_intended_diff_only": 0.16200000047683716,
257
+ "tpp_threshold_2_unintended_diff_only": 0.025499999523162842,
258
+ "tpp_threshold_5_total_metric": 0.2762500196695328,
259
+ "tpp_threshold_5_intended_diff_only": 0.30900001525878906,
260
+ "tpp_threshold_5_unintended_diff_only": 0.03274999558925629,
261
+ "tpp_threshold_10_total_metric": 0.3917500227689743,
262
+ "tpp_threshold_10_intended_diff_only": 0.4570000171661377,
263
+ "tpp_threshold_10_unintended_diff_only": 0.06524999439716339,
264
+ "tpp_threshold_20_total_metric": 0.3072500377893448,
265
+ "tpp_threshold_20_intended_diff_only": 0.4830000400543213,
266
+ "tpp_threshold_20_unintended_diff_only": 0.1757500022649765,
267
+ "tpp_threshold_50_total_metric": 0.22175002098083496,
268
+ "tpp_threshold_50_intended_diff_only": 0.4880000352859497,
269
+ "tpp_threshold_50_unintended_diff_only": 0.26625001430511475,
270
+ "tpp_threshold_100_total_metric": 0.19900000095367432,
271
+ "tpp_threshold_100_intended_diff_only": 0.49000000953674316,
272
+ "tpp_threshold_100_unintended_diff_only": 0.29100000858306885,
273
+ "tpp_threshold_500_total_metric": 0.1520000398159027,
274
+ "tpp_threshold_500_intended_diff_only": 0.49100005626678467,
275
+ "tpp_threshold_500_unintended_diff_only": 0.33900001645088196
276
+ },
277
+ "9": {
278
+ "tpp_threshold_2_total_metric": 0.08975003659725189,
279
+ "tpp_threshold_2_intended_diff_only": 0.11300003528594971,
280
+ "tpp_threshold_2_unintended_diff_only": 0.023249998688697815,
281
+ "tpp_threshold_5_total_metric": 0.19800004363059998,
282
+ "tpp_threshold_5_intended_diff_only": 0.312000036239624,
283
+ "tpp_threshold_5_unintended_diff_only": 0.11399999260902405,
284
+ "tpp_threshold_10_total_metric": 0.22299998998641968,
285
+ "tpp_threshold_10_intended_diff_only": 0.375,
286
+ "tpp_threshold_10_unintended_diff_only": 0.15200001001358032,
287
+ "tpp_threshold_20_total_metric": 0.2097500115633011,
288
+ "tpp_threshold_20_intended_diff_only": 0.4190000295639038,
289
+ "tpp_threshold_20_unintended_diff_only": 0.20925001800060272,
290
+ "tpp_threshold_50_total_metric": 0.19100001454353333,
291
+ "tpp_threshold_50_intended_diff_only": 0.4700000286102295,
292
+ "tpp_threshold_50_unintended_diff_only": 0.27900001406669617,
293
+ "tpp_threshold_100_total_metric": 0.14500002562999725,
294
+ "tpp_threshold_100_intended_diff_only": 0.47300004959106445,
295
+ "tpp_threshold_100_unintended_diff_only": 0.3280000239610672,
296
+ "tpp_threshold_500_total_metric": 0.08725003898143768,
297
+ "tpp_threshold_500_intended_diff_only": 0.47300004959106445,
298
+ "tpp_threshold_500_unintended_diff_only": 0.38575001060962677
299
+ }
300
+ },
301
+ "canrager/amazon_reviews_mcauley_1and5": {
302
+ "1": {
303
+ "tpp_threshold_2_total_metric": 0.00449998676776886,
304
+ "tpp_threshold_2_intended_diff_only": 0.013999998569488525,
305
+ "tpp_threshold_2_unintended_diff_only": 0.009500011801719666,
306
+ "tpp_threshold_5_total_metric": 0.020999997854232788,
307
+ "tpp_threshold_5_intended_diff_only": 0.03200000524520874,
308
+ "tpp_threshold_5_unintended_diff_only": 0.011000007390975952,
309
+ "tpp_threshold_10_total_metric": 0.03625005483627319,
310
+ "tpp_threshold_10_intended_diff_only": 0.057000041007995605,
311
+ "tpp_threshold_10_unintended_diff_only": 0.020749986171722412,
312
+ "tpp_threshold_20_total_metric": 0.10199999809265137,
313
+ "tpp_threshold_20_intended_diff_only": 0.1340000033378601,
314
+ "tpp_threshold_20_unintended_diff_only": 0.03200000524520874,
315
+ "tpp_threshold_50_total_metric": 0.23725001513957977,
316
+ "tpp_threshold_50_intended_diff_only": 0.2710000276565552,
317
+ "tpp_threshold_50_unintended_diff_only": 0.0337500125169754,
318
+ "tpp_threshold_100_total_metric": 0.33925001323223114,
319
+ "tpp_threshold_100_intended_diff_only": 0.3830000162124634,
320
+ "tpp_threshold_100_unintended_diff_only": 0.04375000298023224,
321
+ "tpp_threshold_500_total_metric": 0.3787500560283661,
322
+ "tpp_threshold_500_intended_diff_only": 0.4530000686645508,
323
+ "tpp_threshold_500_unintended_diff_only": 0.07425001263618469
324
+ },
325
+ "2": {
326
+ "tpp_threshold_2_total_metric": 0.17475001513957977,
327
+ "tpp_threshold_2_intended_diff_only": 0.18400001525878906,
328
+ "tpp_threshold_2_unintended_diff_only": 0.00925000011920929,
329
+ "tpp_threshold_5_total_metric": 0.2802499979734421,
330
+ "tpp_threshold_5_intended_diff_only": 0.29600000381469727,
331
+ "tpp_threshold_5_unintended_diff_only": 0.015750005841255188,
332
+ "tpp_threshold_10_total_metric": 0.3490000069141388,
333
+ "tpp_threshold_10_intended_diff_only": 0.3700000047683716,
334
+ "tpp_threshold_10_unintended_diff_only": 0.020999997854232788,
335
+ "tpp_threshold_20_total_metric": 0.3917499929666519,
336
+ "tpp_threshold_20_intended_diff_only": 0.41600000858306885,
337
+ "tpp_threshold_20_unintended_diff_only": 0.02425001561641693,
338
+ "tpp_threshold_50_total_metric": 0.39900001883506775,
339
+ "tpp_threshold_50_intended_diff_only": 0.437000036239624,
340
+ "tpp_threshold_50_unintended_diff_only": 0.038000017404556274,
341
+ "tpp_threshold_100_total_metric": 0.393250048160553,
342
+ "tpp_threshold_100_intended_diff_only": 0.4410000443458557,
343
+ "tpp_threshold_100_unintended_diff_only": 0.047749996185302734,
344
+ "tpp_threshold_500_total_metric": 0.3800000101327896,
345
+ "tpp_threshold_500_intended_diff_only": 0.4410000443458557,
346
+ "tpp_threshold_500_unintended_diff_only": 0.0610000342130661
347
+ },
348
+ "3": {
349
+ "tpp_threshold_2_total_metric": -0.02049998939037323,
350
+ "tpp_threshold_2_intended_diff_only": -0.009999990463256836,
351
+ "tpp_threshold_2_unintended_diff_only": 0.010499998927116394,
352
+ "tpp_threshold_5_total_metric": 0.003500029444694519,
353
+ "tpp_threshold_5_intended_diff_only": 0.012000024318695068,
354
+ "tpp_threshold_5_unintended_diff_only": 0.00849999487400055,
355
+ "tpp_threshold_10_total_metric": 0.054499998688697815,
356
+ "tpp_threshold_10_intended_diff_only": 0.06400001049041748,
357
+ "tpp_threshold_10_unintended_diff_only": 0.009500011801719666,
358
+ "tpp_threshold_20_total_metric": 0.09475001692771912,
359
+ "tpp_threshold_20_intended_diff_only": 0.11400002241134644,
360
+ "tpp_threshold_20_unintended_diff_only": 0.01925000548362732,
361
+ "tpp_threshold_50_total_metric": 0.23825004696846008,
362
+ "tpp_threshold_50_intended_diff_only": 0.2690000534057617,
363
+ "tpp_threshold_50_unintended_diff_only": 0.030750006437301636,
364
+ "tpp_threshold_100_total_metric": 0.3092500567436218,
365
+ "tpp_threshold_100_intended_diff_only": 0.36600005626678467,
366
+ "tpp_threshold_100_unintended_diff_only": 0.05674999952316284,
367
+ "tpp_threshold_500_total_metric": 0.2927500456571579,
368
+ "tpp_threshold_500_intended_diff_only": 0.43500006198883057,
369
+ "tpp_threshold_500_unintended_diff_only": 0.14225001633167267
370
+ },
371
+ "5": {
372
+ "tpp_threshold_2_total_metric": 0.011499986052513123,
373
+ "tpp_threshold_2_intended_diff_only": 0.013999998569488525,
374
+ "tpp_threshold_2_unintended_diff_only": 0.002500012516975403,
375
+ "tpp_threshold_5_total_metric": 0.10924996435642242,
376
+ "tpp_threshold_5_intended_diff_only": 0.12099999189376831,
377
+ "tpp_threshold_5_unintended_diff_only": 0.011750027537345886,
378
+ "tpp_threshold_10_total_metric": 0.14474999904632568,
379
+ "tpp_threshold_10_intended_diff_only": 0.16600000858306885,
380
+ "tpp_threshold_10_unintended_diff_only": 0.021250009536743164,
381
+ "tpp_threshold_20_total_metric": 0.18824997544288635,
382
+ "tpp_threshold_20_intended_diff_only": 0.20800000429153442,
383
+ "tpp_threshold_20_unintended_diff_only": 0.01975002884864807,
384
+ "tpp_threshold_50_total_metric": 0.30375002324581146,
385
+ "tpp_threshold_50_intended_diff_only": 0.33100003004074097,
386
+ "tpp_threshold_50_unintended_diff_only": 0.027250006794929504,
387
+ "tpp_threshold_100_total_metric": 0.3487499952316284,
388
+ "tpp_threshold_100_intended_diff_only": 0.3830000162124634,
389
+ "tpp_threshold_100_unintended_diff_only": 0.03425002098083496,
390
+ "tpp_threshold_500_total_metric": 0.3785000294446945,
391
+ "tpp_threshold_500_intended_diff_only": 0.4320000410079956,
392
+ "tpp_threshold_500_unintended_diff_only": 0.053500011563301086
393
+ },
394
+ "6": {
395
+ "tpp_threshold_2_total_metric": 0.02275000512599945,
396
+ "tpp_threshold_2_intended_diff_only": 0.04100000858306885,
397
+ "tpp_threshold_2_unintended_diff_only": 0.018250003457069397,
398
+ "tpp_threshold_5_total_metric": 0.027000010013580322,
399
+ "tpp_threshold_5_intended_diff_only": 0.04900002479553223,
400
+ "tpp_threshold_5_unintended_diff_only": 0.022000014781951904,
401
+ "tpp_threshold_10_total_metric": 0.08749999105930328,
402
+ "tpp_threshold_10_intended_diff_only": 0.11500000953674316,
403
+ "tpp_threshold_10_unintended_diff_only": 0.02750001847743988,
404
+ "tpp_threshold_20_total_metric": 0.18250001966953278,
405
+ "tpp_threshold_20_intended_diff_only": 0.2200000286102295,
406
+ "tpp_threshold_20_unintended_diff_only": 0.037500008940696716,
407
+ "tpp_threshold_50_total_metric": 0.30000001192092896,
408
+ "tpp_threshold_50_intended_diff_only": 0.3400000333786011,
409
+ "tpp_threshold_50_unintended_diff_only": 0.04000002145767212,
410
+ "tpp_threshold_100_total_metric": 0.3380000442266464,
411
+ "tpp_threshold_100_intended_diff_only": 0.3890000581741333,
412
+ "tpp_threshold_100_unintended_diff_only": 0.05100001394748688,
413
+ "tpp_threshold_500_total_metric": 0.31800003349781036,
414
+ "tpp_threshold_500_intended_diff_only": 0.3940000534057617,
415
+ "tpp_threshold_500_unintended_diff_only": 0.07600001990795135
416
+ }
417
+ }
418
+ }
419
+ }