Files
isokl_steering_calibration/figs/table.csv
T

38 lines
3.5 KiB
CSV

model,method,window,alpha,c_star_mean,n_seeds,kl_p95_mean,pmass_mean
Llama-3.2-1B-Instruct,directional_ablation,20,1.0,5.119636661337771,3,1.1908359713852406,NaN
Llama-3.2-1B-Instruct,directional_ablation,20,2.0,5.119636661337771,3,5.850264692306519,0.000022955508256927715
Llama-3.2-1B-Instruct,directional_ablation,50,1.0,4.6095092483978455,3,1.291592478454113,NaN
Llama-3.2-1B-Instruct,directional_ablation,50,2.0,4.6095092483978455,3,5.11867133140564,0.00004614551000320882
Llama-3.2-1B-Instruct,mean_diff,20,1.0,3.771688942723309,3,0.9256407611072064,NaN
Llama-3.2-1B-Instruct,mean_diff,20,2.0,3.771688942723309,3,5.391779696941375,0.00006245920594665222
Llama-3.2-1B-Instruct,mean_diff,50,1.0,3.861664231693977,3,1.3414980980753899,NaN
Llama-3.2-1B-Instruct,mean_diff,50,2.0,3.861664231693977,3,4.656074690818786,0.00007268900522335157
Llama-3.2-1B-Instruct,pca,20,1.0,3.818178678361504,3,0.9329803831875324,NaN
Llama-3.2-1B-Instruct,pca,20,2.0,3.818178678361504,3,5.620841109752655,0.00026052194389194485
Llama-3.2-1B-Instruct,pca,50,1.0,3.600290823741986,3,0.9301029246300458,NaN
Llama-3.2-1B-Instruct,pca,50,2.0,3.600290823741986,3,4.0647015488147735,NaN
Qwen2.5-0.5B-Instruct,directional_ablation,20,1.0,7.507819866975713,3,0.6075146049261093,0.00005063821326984907
Qwen2.5-0.5B-Instruct,directional_ablation,20,2.0,7.507819866975713,3,3.166464865207672,0.00018519468194426735
Qwen2.5-0.5B-Instruct,directional_ablation,50,1.0,7.055664779577401,3,0.5607812261581421,0.000034678878002771604
Qwen2.5-0.5B-Instruct,directional_ablation,50,2.0,7.055664779577401,3,2.2286340260505675,0.00013751945268516218
Qwen2.5-0.5B-Instruct,mean_diff,20,1.0,7.588130746747839,3,0.7048790633678437,0.000040864707125365383
Qwen2.5-0.5B-Instruct,mean_diff,20,2.0,7.588130746747839,3,3.335330218076706,0.00019464152283035218
Qwen2.5-0.5B-Instruct,mean_diff,50,1.0,7.561536121211781,3,0.7623215705156327,0.00003399881875959016
Qwen2.5-0.5B-Instruct,mean_diff,50,2.0,7.561536121211781,3,2.8257888650894163,0.00015105884966198408
Qwen2.5-0.5B-Instruct,pca,20,1.0,8.655517019086593,3,0.9307092409580946,3.041228809275154e-6
Qwen2.5-0.5B-Instruct,pca,20,2.0,8.655517019086593,3,3.7524219751358032,1.6446400348257838e-7
Qwen2.5-0.5B-Instruct,pca,50,1.0,8.606126777874907,3,0.8437561804056167,NaN
Qwen2.5-0.5B-Instruct,pca,50,2.0,8.606126777874907,3,3.1483269047737124,1.4466886552347544e-7
Qwen3-4B-Instruct-2507,directional_ablation,20,1.0,25.600000000000005,3,1.3869682106771506,9.215271860500782e-6
Qwen3-4B-Instruct-2507,directional_ablation,20,2.0,25.600000000000005,3,7.038443911075592,0.00001822325955023185
Qwen3-4B-Instruct-2507,directional_ablation,50,1.0,22.895205490202148,3,1.0069563373062511,NaN
Qwen3-4B-Instruct-2507,directional_ablation,50,2.0,22.895205490202148,3,4.545377564039081,NaN
Qwen3-4B-Instruct-2507,mean_diff,20,1.0,25.600000000000005,3,0.9436350018950179,4.663814388822024e-6
Qwen3-4B-Instruct-2507,mean_diff,20,2.0,25.600000000000005,3,6.434498374164105,0.000016732647531197965
Qwen3-4B-Instruct-2507,mean_diff,50,1.0,25.600000000000005,3,0.9753538948745699,NaN
Qwen3-4B-Instruct-2507,mean_diff,50,2.0,25.600000000000005,3,5.002368605150841,NaN
Qwen3-4B-Instruct-2507,pca,20,1.0,23.302283905419525,3,1.490876998582462,0.00001391104007908428
Qwen3-4B-Instruct-2507,pca,20,2.0,23.302283905419525,3,5.252012262865901,0.000011667380206471789
Qwen3-4B-Instruct-2507,pca,50,1.0,17.99025750455262,3,0.9170716370666468,6.987194066781776e-6
Qwen3-4B-Instruct-2507,pca,50,2.0,17.99025750455262,3,3.4862812616676093,0.00002544457582068353