wip: dense alpha sweep + auto-render figs (Qwen3.5-0.8B w=512); queued OLMo-2/Gemma 4B/Gemma 12B/OLMo-3 7B at w=4096
|
After Width: | Height: | Size: 558 KiB |
|
After Width: | Height: | Size: 104 KiB |
@@ -0,0 +1,19 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Llama-3.2-1B-Instruct,directional_ablation,20,5.119636661337771,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,directional_ablation,50,4.6095092483978455,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,mean_diff,20,3.771688942723309,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,mean_diff,50,3.861664231693977,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,pca,20,3.818178678361504,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,pca,50,3.600290823741986,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,20,7.507819866975713,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.055664779577401,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,20,7.588130746747839,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,pca,20,8.655517019086593,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,20,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,50,22.895205490202148,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,mean_diff,20,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,mean_diff,50,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,pca,20,23.302283905419525,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,pca,50,17.99025750455262,0.0,3,0.0
|
||||
|
@@ -0,0 +1,20 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:-----------------------|:---------------------|---------:|---------:|--------:|----------:|-------:|
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 20 | 5.120 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 50 | 4.610 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 20 | 3.772 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 50 | 3.862 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 20 | 3.818 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 50 | 3.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 20 | 7.508 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 20 | 7.588 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 20 | 8.656 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 20 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 50 | 22.895 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 20 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 50 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 20 | 23.302 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 50 | 17.990 | 0.000 | 3 | 0.000 |
|
||||
|
After Width: | Height: | Size: 75 KiB |
@@ -0,0 +1,19 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Llama-3.2-1B-Instruct,directional_ablation,20,5.119636661337771,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,directional_ablation,50,4.6095092483978455,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,mean_diff,20,3.771688942723309,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,mean_diff,50,3.861664231693977,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,pca,20,3.818178678361504,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,pca,50,3.600290823741986,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,20,7.507819866975713,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.055664779577401,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,20,7.588130746747839,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,pca,20,8.655517019086593,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,20,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,50,22.895205490202148,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,mean_diff,20,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,mean_diff,50,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,pca,20,23.302283905419525,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,pca,50,17.99025750455262,0.0,3,0.0
|
||||
|
@@ -0,0 +1,20 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:-----------------------|:---------------------|---------:|---------:|--------:|----------:|-------:|
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 20 | 5.120 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 50 | 4.610 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 20 | 3.772 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 50 | 3.862 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 20 | 3.818 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 50 | 3.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 20 | 7.508 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 20 | 7.588 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 20 | 8.656 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 20 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 50 | 22.895 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 20 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 50 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 20 | 23.302 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 50 | 17.990 | 0.000 | 3 | 0.000 |
|
||||
|
After Width: | Height: | Size: 74 KiB |
@@ -0,0 +1,4 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -0,0 +1,5 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
After Width: | Height: | Size: 117 KiB |
@@ -0,0 +1,4 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -0,0 +1,5 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
After Width: | Height: | Size: 360 KiB |
@@ -0,0 +1,4 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -0,0 +1,5 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
After Width: | Height: | Size: 530 KiB |
@@ -0,0 +1,4 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -0,0 +1,5 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
After Width: | Height: | Size: 541 KiB |
@@ -0,0 +1,4 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -0,0 +1,5 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
After Width: | Height: | Size: 615 KiB |
@@ -0,0 +1,4 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -0,0 +1,5 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
@@ -0,0 +1,14 @@
|
||||
| threshold | alpha | n | S(t=20) | S(t=49) | median_death_t |
|
||||
|------------:|--------:|----:|----------:|----------:|-----------------:|
|
||||
| 0.500 | 0.500 | 24 | 0.875 | 0.792 | |
|
||||
| 0.500 | 1.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 0.500 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 0.500 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 1.000 | 0.500 | 24 | 1.000 | 1.000 | |
|
||||
| 1.000 | 1.000 | 24 | 0.500 | 0.333 | 20 |
|
||||
| 1.000 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 1.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 2.000 | 0.500 | 24 | 1.000 | 1.000 | |
|
||||
| 2.000 | 1.000 | 24 | 0.917 | 0.792 | |
|
||||
| 2.000 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 2.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
|
After Width: | Height: | Size: 77 KiB |
@@ -0,0 +1,14 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:---------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass | 0.500 | 0.500 | 24 | 0.833 | 0.708 | |
|
||||
| pmass | 0.500 | 1.000 | 24 | 0.917 | 0.875 | |
|
||||
| pmass | 0.500 | 2.000 | 24 | 1.000 | 0.958 | |
|
||||
| pmass | 0.500 | 4.000 | 24 | 0.333 | 0.333 | 0 |
|
||||
| pmass | 0.800 | 0.500 | 24 | 0.667 | 0.583 | |
|
||||
| pmass | 0.800 | 1.000 | 24 | 0.583 | 0.542 | |
|
||||
| pmass | 0.800 | 2.000 | 24 | 0.375 | 0.375 | 0 |
|
||||
| pmass | 0.800 | 4.000 | 24 | 0.333 | 0.292 | 0 |
|
||||
| pmass | 0.950 | 0.500 | 24 | 0.333 | 0.208 | 5 |
|
||||
| pmass | 0.950 | 1.000 | 24 | 0.250 | 0.208 | 0 |
|
||||
| pmass | 0.950 | 2.000 | 24 | 0.333 | 0.292 | 0 |
|
||||
| pmass | 0.950 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
|
After Width: | Height: | Size: 73 KiB |
@@ -0,0 +1,11 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:---------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass | 0.500 | 1.000 | 72 | 0.125 | 0.125 | 0 |
|
||||
| pmass | 0.500 | 2.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.500 | 4.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.800 | 1.000 | 72 | 0.042 | 0.042 | 0 |
|
||||
| pmass | 0.800 | 2.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.800 | 4.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.950 | 1.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.950 | 2.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.950 | 4.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
|
After Width: | Height: | Size: 65 KiB |
|
After Width: | Height: | Size: 396 KiB |
@@ -0,0 +1,4 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,512,8.59831195323767,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,512,8.030432886640742,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,512,8.232617543390845,,1,
|
||||
|
@@ -0,0 +1,5 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 512 | 8.598 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 512 | 8.030 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 512 | 8.233 | | 1 | |
|
||||
|
After Width: | Height: | Size: 207 KiB |
@@ -0,0 +1,6 @@
|
||||
| alpha | n | n_died | n_censored |
|
||||
|--------:|----:|---------:|-------------:|
|
||||
| 0.5 | 24 | 24 | 0 |
|
||||
| 1 | 24 | 24 | 0 |
|
||||
| 2 | 24 | 24 | 0 |
|
||||
| 4 | 24 | 23 | 0 |
|
||||
@@ -0,0 +1,14 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:---------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| kl | 1.000 | 0.500 | 24 | 0.875 | 0.833 | |
|
||||
| kl | 1.000 | 1.000 | 24 | 0.000 | 0.000 | 8 |
|
||||
| kl | 1.000 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| kl | 1.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| kl | 2.000 | 0.500 | 24 | 1.000 | 1.000 | |
|
||||
| kl | 2.000 | 1.000 | 24 | 0.250 | 0.208 | 75 |
|
||||
| kl | 2.000 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| kl | 2.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| kl | 4.000 | 0.500 | 24 | 1.000 | 1.000 | |
|
||||
| kl | 4.000 | 1.000 | 24 | 0.750 | 0.750 | |
|
||||
| kl | 4.000 | 2.000 | 24 | 0.083 | 0.083 | 2 |
|
||||
| kl | 4.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
|
After Width: | Height: | Size: 71 KiB |
@@ -0,0 +1,14 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.500 | 0.500 | 24 | 0.250 | 0.208 | 3 |
|
||||
| pmass_eval | 0.500 | 1.000 | 24 | 0.208 | 0.167 | 0 |
|
||||
| pmass_eval | 0.500 | 2.000 | 24 | 0.292 | 0.250 | 0 |
|
||||
| pmass_eval | 0.500 | 4.000 | 24 | 0.292 | 0.292 | 0 |
|
||||
| pmass_eval | 0.800 | 0.500 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.800 | 1.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.800 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.800 | 4.000 | 24 | 0.083 | 0.042 | 0 |
|
||||
| pmass_eval | 0.950 | 0.500 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 1.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 4.000 | 24 | 0.042 | 0.000 | 0 |
|
||||
|
After Width: | Height: | Size: 74 KiB |
@@ -0,0 +1,14 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.500 | 0.500 | 24 | 0.438 | 0.419 | 8 |
|
||||
| pmass_eval | 0.500 | 1.000 | 24 | 0.333 | 0.319 | 0 |
|
||||
| pmass_eval | 0.500 | 2.000 | 24 | 0.319 | 0.306 | 0 |
|
||||
| pmass_eval | 0.500 | 4.000 | 24 | 0.319 | 0.319 | 0 |
|
||||
| pmass_eval | 0.800 | 0.500 | 24 | 0.077 | 0.077 | 0 |
|
||||
| pmass_eval | 0.800 | 1.000 | 24 | 0.110 | 0.110 | 0 |
|
||||
| pmass_eval | 0.800 | 2.000 | 24 | 0.212 | 0.212 | 0 |
|
||||
| pmass_eval | 0.800 | 4.000 | 24 | 0.255 | 0.244 | 0 |
|
||||
| pmass_eval | 0.950 | 0.500 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 1.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 2.000 | 24 | 0.040 | 0.040 | 0 |
|
||||
| pmass_eval | 0.950 | 4.000 | 24 | 0.201 | 0.193 | 0 |
|
||||
|
After Width: | Height: | Size: 82 KiB |
|
After Width: | Height: | Size: 59 KiB |
|
After Width: | Height: | Size: 281 KiB |
@@ -0,0 +1,37 @@
|
||||
model,method,window,alpha,c_star_mean,n_seeds,kl_p95_mean,pmass_mean
|
||||
Llama-3.2-1B-Instruct,directional_ablation,20,1.0,5.119636661337771,3,1.1908359713852406,NaN
|
||||
Llama-3.2-1B-Instruct,directional_ablation,20,2.0,5.119636661337771,3,5.850264692306519,0.000022955508256927715
|
||||
Llama-3.2-1B-Instruct,directional_ablation,50,1.0,4.6095092483978455,3,1.291592478454113,NaN
|
||||
Llama-3.2-1B-Instruct,directional_ablation,50,2.0,4.6095092483978455,3,5.11867133140564,0.00004614551000320882
|
||||
Llama-3.2-1B-Instruct,mean_diff,20,1.0,3.771688942723309,3,0.9256407611072064,NaN
|
||||
Llama-3.2-1B-Instruct,mean_diff,20,2.0,3.771688942723309,3,5.391779696941375,0.00006245920594665222
|
||||
Llama-3.2-1B-Instruct,mean_diff,50,1.0,3.861664231693977,3,1.3414980980753899,NaN
|
||||
Llama-3.2-1B-Instruct,mean_diff,50,2.0,3.861664231693977,3,4.656074690818786,0.00007268900522335157
|
||||
Llama-3.2-1B-Instruct,pca,20,1.0,3.818178678361504,3,0.9329803831875324,NaN
|
||||
Llama-3.2-1B-Instruct,pca,20,2.0,3.818178678361504,3,5.620841109752655,0.00026052194389194485
|
||||
Llama-3.2-1B-Instruct,pca,50,1.0,3.600290823741986,3,0.9301029246300458,NaN
|
||||
Llama-3.2-1B-Instruct,pca,50,2.0,3.600290823741986,3,4.0647015488147735,NaN
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,20,1.0,7.507819866975713,3,0.6075146049261093,0.00005063821326984907
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,20,2.0,7.507819866975713,3,3.166464865207672,0.00018519468194426735
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,1.0,7.055664779577401,3,0.5607812261581421,0.000034678878002771604
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,2.0,7.055664779577401,3,2.2286340260505675,0.00013751945268516218
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,20,1.0,7.588130746747839,3,0.7048790633678437,0.000040864707125365383
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,20,2.0,7.588130746747839,3,3.335330218076706,0.00019464152283035218
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,1.0,7.561536121211781,3,0.7623215705156327,0.00003399881875959016
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,2.0,7.561536121211781,3,2.8257888650894163,0.00015105884966198408
|
||||
Qwen2.5-0.5B-Instruct,pca,20,1.0,8.655517019086593,3,0.9307092409580946,3.041228809275154e-6
|
||||
Qwen2.5-0.5B-Instruct,pca,20,2.0,8.655517019086593,3,3.7524219751358032,1.6446400348257838e-7
|
||||
Qwen2.5-0.5B-Instruct,pca,50,1.0,8.606126777874907,3,0.8437561804056167,NaN
|
||||
Qwen2.5-0.5B-Instruct,pca,50,2.0,8.606126777874907,3,3.1483269047737124,1.4466886552347544e-7
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,20,1.0,25.600000000000005,3,1.3869682106771506,9.215271860500782e-6
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,20,2.0,25.600000000000005,3,7.038443911075592,0.00001822325955023185
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,50,1.0,22.895205490202148,3,1.0069563373062511,NaN
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,50,2.0,22.895205490202148,3,4.545377564039081,NaN
|
||||
Qwen3-4B-Instruct-2507,mean_diff,20,1.0,25.600000000000005,3,0.9436350018950179,4.663814388822024e-6
|
||||
Qwen3-4B-Instruct-2507,mean_diff,20,2.0,25.600000000000005,3,6.434498374164105,0.000016732647531197965
|
||||
Qwen3-4B-Instruct-2507,mean_diff,50,1.0,25.600000000000005,3,0.9753538948745699,NaN
|
||||
Qwen3-4B-Instruct-2507,mean_diff,50,2.0,25.600000000000005,3,5.002368605150841,NaN
|
||||
Qwen3-4B-Instruct-2507,pca,20,1.0,23.302283905419525,3,1.490876998582462,0.00001391104007908428
|
||||
Qwen3-4B-Instruct-2507,pca,20,2.0,23.302283905419525,3,5.252012262865901,0.000011667380206471789
|
||||
Qwen3-4B-Instruct-2507,pca,50,1.0,17.99025750455262,3,0.9170716370666468,6.987194066781776e-6
|
||||
Qwen3-4B-Instruct-2507,pca,50,2.0,17.99025750455262,3,3.4862812616676093,0.00002544457582068353
|
||||
|
@@ -0,0 +1,38 @@
|
||||
| model | method | window | alpha | c_star_mean | n_seeds | kl_p95_mean | pmass_mean |
|
||||
|:-----------------------|:---------------------|---------:|--------:|--------------:|----------:|--------------:|-------------:|
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 20 | 1.000 | 5.120 | 3 | 1.191 | nan |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 20 | 2.000 | 5.120 | 3 | 5.850 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 50 | 1.000 | 4.610 | 3 | 1.292 | nan |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 50 | 2.000 | 4.610 | 3 | 5.119 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 20 | 1.000 | 3.772 | 3 | 0.926 | nan |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 20 | 2.000 | 3.772 | 3 | 5.392 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 50 | 1.000 | 3.862 | 3 | 1.341 | nan |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 50 | 2.000 | 3.862 | 3 | 4.656 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 20 | 1.000 | 3.818 | 3 | 0.933 | nan |
|
||||
| Llama-3.2-1B-Instruct | pca | 20 | 2.000 | 3.818 | 3 | 5.621 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 50 | 1.000 | 3.600 | 3 | 0.930 | nan |
|
||||
| Llama-3.2-1B-Instruct | pca | 50 | 2.000 | 3.600 | 3 | 4.065 | nan |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 20 | 1.000 | 7.508 | 3 | 0.608 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 20 | 2.000 | 7.508 | 3 | 3.166 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 1.000 | 7.056 | 3 | 0.561 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 2.000 | 7.056 | 3 | 2.229 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 20 | 1.000 | 7.588 | 3 | 0.705 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 20 | 2.000 | 7.588 | 3 | 3.335 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 1.000 | 7.562 | 3 | 0.762 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 2.000 | 7.562 | 3 | 2.826 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 20 | 1.000 | 8.656 | 3 | 0.931 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 20 | 2.000 | 8.656 | 3 | 3.752 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 1.000 | 8.606 | 3 | 0.844 | nan |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 2.000 | 8.606 | 3 | 3.148 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 20 | 1.000 | 25.600 | 3 | 1.387 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 20 | 2.000 | 25.600 | 3 | 7.038 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 50 | 1.000 | 22.895 | 3 | 1.007 | nan |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 50 | 2.000 | 22.895 | 3 | 4.545 | nan |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 20 | 1.000 | 25.600 | 3 | 0.944 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 20 | 2.000 | 25.600 | 3 | 6.434 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 50 | 1.000 | 25.600 | 3 | 0.975 | nan |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 50 | 2.000 | 25.600 | 3 | 5.002 | nan |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 20 | 1.000 | 23.302 | 3 | 1.491 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 20 | 2.000 | 23.302 | 3 | 5.252 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 50 | 1.000 | 17.990 | 3 | 0.917 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 50 | 2.000 | 17.990 | 3 | 3.486 | 0.000 |
|
||||