clean
@@ -77,14 +77,14 @@ The headline run for the figures here:
|
||||
```bash
|
||||
uv run --extra all python scripts/run_cell.py \
|
||||
--model Qwen/Qwen3.5-0.8B --method mean_diff --seed 0 --window 512 \
|
||||
--out-root outputs_qwen35_w512_dense \
|
||||
--out-root outputs/qwen35_w512_dense \
|
||||
--run-id Qwen3.5-0.8B_mean_diff_s0_w512_dense \
|
||||
--compute-pmass --skip-pmass-qa --fork-log \
|
||||
--alphas 0.0 0.25 0.5 0.75 1.0 1.5 2.0 4.0 \
|
||||
--render-figs --render-threshold 0.95
|
||||
```
|
||||
|
||||
Outputs land under `outputs_qwen35_w512_dense/<run-id>/figs_auto/{survival,spaghetti,aggregate}/`.
|
||||
Outputs land under `outputs/qwen35_w512_dense/<run-id>/figs_auto/{survival,spaghetti,aggregate}/`.
|
||||
|
||||
## What this repo is and isn't
|
||||
|
||||
|
||||
@@ -1 +0,0 @@
|
||||
../outputs_qwen35_w512_v3/Qwen3.5-0.8B_mean_diff_s0_w512
|
||||
|
Before Width: | Height: | Size: 104 KiB |
@@ -1,19 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Llama-3.2-1B-Instruct,directional_ablation,20,5.119636661337771,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,directional_ablation,50,4.6095092483978455,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,mean_diff,20,3.771688942723309,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,mean_diff,50,3.861664231693977,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,pca,20,3.818178678361504,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,pca,50,3.600290823741986,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,20,7.507819866975713,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.055664779577401,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,20,7.588130746747839,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,pca,20,8.655517019086593,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,20,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,50,22.895205490202148,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,mean_diff,20,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,mean_diff,50,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,pca,20,23.302283905419525,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,pca,50,17.99025750455262,0.0,3,0.0
|
||||
|
@@ -1,20 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:-----------------------|:---------------------|---------:|---------:|--------:|----------:|-------:|
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 20 | 5.120 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 50 | 4.610 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 20 | 3.772 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 50 | 3.862 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 20 | 3.818 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 50 | 3.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 20 | 7.508 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 20 | 7.588 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 20 | 8.656 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 20 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 50 | 22.895 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 20 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 50 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 20 | 23.302 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 50 | 17.990 | 0.000 | 3 | 0.000 |
|
||||
|
Before Width: | Height: | Size: 75 KiB |
@@ -1,19 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Llama-3.2-1B-Instruct,directional_ablation,20,5.119636661337771,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,directional_ablation,50,4.6095092483978455,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,mean_diff,20,3.771688942723309,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,mean_diff,50,3.861664231693977,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,pca,20,3.818178678361504,0.0,3,0.0
|
||||
Llama-3.2-1B-Instruct,pca,50,3.600290823741986,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,20,7.507819866975713,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.055664779577401,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,20,7.588130746747839,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,pca,20,8.655517019086593,0.0,3,0.0
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,20,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,50,22.895205490202148,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,mean_diff,20,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,mean_diff,50,25.600000000000005,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,pca,20,23.302283905419525,0.0,3,0.0
|
||||
Qwen3-4B-Instruct-2507,pca,50,17.99025750455262,0.0,3,0.0
|
||||
|
@@ -1,20 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:-----------------------|:---------------------|---------:|---------:|--------:|----------:|-------:|
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 20 | 5.120 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 50 | 4.610 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 20 | 3.772 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 50 | 3.862 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 20 | 3.818 | 0.000 | 3 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 50 | 3.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 20 | 7.508 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 20 | 7.588 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 20 | 8.656 | 0.000 | 3 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 20 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 50 | 22.895 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 20 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 50 | 25.600 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 20 | 23.302 | 0.000 | 3 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 50 | 17.990 | 0.000 | 3 | 0.000 |
|
||||
|
Before Width: | Height: | Size: 74 KiB |
@@ -1,4 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -1,5 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
Before Width: | Height: | Size: 117 KiB |
@@ -1,4 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -1,5 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
Before Width: | Height: | Size: 360 KiB |
@@ -1,4 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -1,5 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
Before Width: | Height: | Size: 530 KiB |
@@ -1,4 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -1,5 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
Before Width: | Height: | Size: 541 KiB |
@@ -1,4 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -1,5 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
|
Before Width: | Height: | Size: 615 KiB |
@@ -1,4 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,7.0556647795774,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,7.561536121211781,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,50,8.606126777874907,,1,
|
||||
|
@@ -1,5 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 7.056 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 7.562 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 8.606 | | 1 | |
|
||||
@@ -1,14 +0,0 @@
|
||||
| threshold | alpha | n | S(t=20) | S(t=49) | median_death_t |
|
||||
|------------:|--------:|----:|----------:|----------:|-----------------:|
|
||||
| 0.500 | 0.500 | 24 | 0.875 | 0.792 | |
|
||||
| 0.500 | 1.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 0.500 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 0.500 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 1.000 | 0.500 | 24 | 1.000 | 1.000 | |
|
||||
| 1.000 | 1.000 | 24 | 0.500 | 0.333 | 20 |
|
||||
| 1.000 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 1.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 2.000 | 0.500 | 24 | 1.000 | 1.000 | |
|
||||
| 2.000 | 1.000 | 24 | 0.917 | 0.792 | |
|
||||
| 2.000 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| 2.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 77 KiB |
@@ -1,14 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:---------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass | 0.500 | 0.500 | 24 | 0.833 | 0.708 | |
|
||||
| pmass | 0.500 | 1.000 | 24 | 0.917 | 0.875 | |
|
||||
| pmass | 0.500 | 2.000 | 24 | 1.000 | 0.958 | |
|
||||
| pmass | 0.500 | 4.000 | 24 | 0.333 | 0.333 | 0 |
|
||||
| pmass | 0.800 | 0.500 | 24 | 0.667 | 0.583 | |
|
||||
| pmass | 0.800 | 1.000 | 24 | 0.583 | 0.542 | |
|
||||
| pmass | 0.800 | 2.000 | 24 | 0.375 | 0.375 | 0 |
|
||||
| pmass | 0.800 | 4.000 | 24 | 0.333 | 0.292 | 0 |
|
||||
| pmass | 0.950 | 0.500 | 24 | 0.333 | 0.208 | 5 |
|
||||
| pmass | 0.950 | 1.000 | 24 | 0.250 | 0.208 | 0 |
|
||||
| pmass | 0.950 | 2.000 | 24 | 0.333 | 0.292 | 0 |
|
||||
| pmass | 0.950 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 73 KiB |
@@ -1,11 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:---------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass | 0.500 | 1.000 | 72 | 0.125 | 0.125 | 0 |
|
||||
| pmass | 0.500 | 2.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.500 | 4.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.800 | 1.000 | 72 | 0.042 | 0.042 | 0 |
|
||||
| pmass | 0.800 | 2.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.800 | 4.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.950 | 1.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.950 | 2.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
| pmass | 0.950 | 4.000 | 72 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 65 KiB |
|
Before Width: | Height: | Size: 396 KiB |
@@ -1,4 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,512,8.59831195323767,,1,
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,512,8.030432886640742,,1,
|
||||
Qwen2.5-0.5B-Instruct,pca,512,8.232617543390845,,1,
|
||||
|
@@ -1,5 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:----------------------|:---------------------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 512 | 8.598 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 512 | 8.030 | | 1 | |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 512 | 8.233 | | 1 | |
|
||||
|
Before Width: | Height: | Size: 207 KiB |
@@ -1,6 +0,0 @@
|
||||
| alpha | n | n_died | n_censored |
|
||||
|--------:|----:|---------:|-------------:|
|
||||
| 0.5 | 24 | 24 | 0 |
|
||||
| 1 | 24 | 24 | 0 |
|
||||
| 2 | 24 | 24 | 0 |
|
||||
| 4 | 24 | 23 | 0 |
|
||||
@@ -1,14 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:---------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| kl | 1.000 | 0.500 | 24 | 0.875 | 0.833 | |
|
||||
| kl | 1.000 | 1.000 | 24 | 0.000 | 0.000 | 8 |
|
||||
| kl | 1.000 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| kl | 1.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| kl | 2.000 | 0.500 | 24 | 1.000 | 1.000 | |
|
||||
| kl | 2.000 | 1.000 | 24 | 0.250 | 0.208 | 75 |
|
||||
| kl | 2.000 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| kl | 2.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| kl | 4.000 | 0.500 | 24 | 1.000 | 1.000 | |
|
||||
| kl | 4.000 | 1.000 | 24 | 0.750 | 0.750 | |
|
||||
| kl | 4.000 | 2.000 | 24 | 0.083 | 0.083 | 2 |
|
||||
| kl | 4.000 | 4.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 71 KiB |
@@ -1,14 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.500 | 0.500 | 24 | 0.250 | 0.208 | 3 |
|
||||
| pmass_eval | 0.500 | 1.000 | 24 | 0.208 | 0.167 | 0 |
|
||||
| pmass_eval | 0.500 | 2.000 | 24 | 0.292 | 0.250 | 0 |
|
||||
| pmass_eval | 0.500 | 4.000 | 24 | 0.292 | 0.292 | 0 |
|
||||
| pmass_eval | 0.800 | 0.500 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.800 | 1.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.800 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.800 | 4.000 | 24 | 0.083 | 0.042 | 0 |
|
||||
| pmass_eval | 0.950 | 0.500 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 1.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 2.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 4.000 | 24 | 0.042 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 74 KiB |
@@ -1,14 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.500 | 0.500 | 24 | 0.438 | 0.419 | 8 |
|
||||
| pmass_eval | 0.500 | 1.000 | 24 | 0.333 | 0.319 | 0 |
|
||||
| pmass_eval | 0.500 | 2.000 | 24 | 0.319 | 0.306 | 0 |
|
||||
| pmass_eval | 0.500 | 4.000 | 24 | 0.319 | 0.319 | 0 |
|
||||
| pmass_eval | 0.800 | 0.500 | 24 | 0.077 | 0.077 | 0 |
|
||||
| pmass_eval | 0.800 | 1.000 | 24 | 0.110 | 0.110 | 0 |
|
||||
| pmass_eval | 0.800 | 2.000 | 24 | 0.212 | 0.212 | 0 |
|
||||
| pmass_eval | 0.800 | 4.000 | 24 | 0.255 | 0.244 | 0 |
|
||||
| pmass_eval | 0.950 | 0.500 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 1.000 | 24 | 0.000 | 0.000 | 0 |
|
||||
| pmass_eval | 0.950 | 2.000 | 24 | 0.040 | 0.040 | 0 |
|
||||
| pmass_eval | 0.950 | 4.000 | 24 | 0.201 | 0.193 | 0 |
|
||||
|
Before Width: | Height: | Size: 82 KiB |
|
Before Width: | Height: | Size: 196 KiB |
|
Before Width: | Height: | Size: 530 KiB |
|
Before Width: | Height: | Size: 52 KiB |
@@ -1,37 +0,0 @@
|
||||
model,method,window,alpha,c_star_mean,n_seeds,kl_p95_mean,pmass_mean
|
||||
Llama-3.2-1B-Instruct,directional_ablation,20,1.0,5.119636661337771,3,1.1908359713852406,NaN
|
||||
Llama-3.2-1B-Instruct,directional_ablation,20,2.0,5.119636661337771,3,5.850264692306519,0.000022955508256927715
|
||||
Llama-3.2-1B-Instruct,directional_ablation,50,1.0,4.6095092483978455,3,1.291592478454113,NaN
|
||||
Llama-3.2-1B-Instruct,directional_ablation,50,2.0,4.6095092483978455,3,5.11867133140564,0.00004614551000320882
|
||||
Llama-3.2-1B-Instruct,mean_diff,20,1.0,3.771688942723309,3,0.9256407611072064,NaN
|
||||
Llama-3.2-1B-Instruct,mean_diff,20,2.0,3.771688942723309,3,5.391779696941375,0.00006245920594665222
|
||||
Llama-3.2-1B-Instruct,mean_diff,50,1.0,3.861664231693977,3,1.3414980980753899,NaN
|
||||
Llama-3.2-1B-Instruct,mean_diff,50,2.0,3.861664231693977,3,4.656074690818786,0.00007268900522335157
|
||||
Llama-3.2-1B-Instruct,pca,20,1.0,3.818178678361504,3,0.9329803831875324,NaN
|
||||
Llama-3.2-1B-Instruct,pca,20,2.0,3.818178678361504,3,5.620841109752655,0.00026052194389194485
|
||||
Llama-3.2-1B-Instruct,pca,50,1.0,3.600290823741986,3,0.9301029246300458,NaN
|
||||
Llama-3.2-1B-Instruct,pca,50,2.0,3.600290823741986,3,4.0647015488147735,NaN
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,20,1.0,7.507819866975713,3,0.6075146049261093,0.00005063821326984907
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,20,2.0,7.507819866975713,3,3.166464865207672,0.00018519468194426735
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,1.0,7.055664779577401,3,0.5607812261581421,0.000034678878002771604
|
||||
Qwen2.5-0.5B-Instruct,directional_ablation,50,2.0,7.055664779577401,3,2.2286340260505675,0.00013751945268516218
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,20,1.0,7.588130746747839,3,0.7048790633678437,0.000040864707125365383
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,20,2.0,7.588130746747839,3,3.335330218076706,0.00019464152283035218
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,1.0,7.561536121211781,3,0.7623215705156327,0.00003399881875959016
|
||||
Qwen2.5-0.5B-Instruct,mean_diff,50,2.0,7.561536121211781,3,2.8257888650894163,0.00015105884966198408
|
||||
Qwen2.5-0.5B-Instruct,pca,20,1.0,8.655517019086593,3,0.9307092409580946,3.041228809275154e-6
|
||||
Qwen2.5-0.5B-Instruct,pca,20,2.0,8.655517019086593,3,3.7524219751358032,1.6446400348257838e-7
|
||||
Qwen2.5-0.5B-Instruct,pca,50,1.0,8.606126777874907,3,0.8437561804056167,NaN
|
||||
Qwen2.5-0.5B-Instruct,pca,50,2.0,8.606126777874907,3,3.1483269047737124,1.4466886552347544e-7
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,20,1.0,25.600000000000005,3,1.3869682106771506,9.215271860500782e-6
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,20,2.0,25.600000000000005,3,7.038443911075592,0.00001822325955023185
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,50,1.0,22.895205490202148,3,1.0069563373062511,NaN
|
||||
Qwen3-4B-Instruct-2507,directional_ablation,50,2.0,22.895205490202148,3,4.545377564039081,NaN
|
||||
Qwen3-4B-Instruct-2507,mean_diff,20,1.0,25.600000000000005,3,0.9436350018950179,4.663814388822024e-6
|
||||
Qwen3-4B-Instruct-2507,mean_diff,20,2.0,25.600000000000005,3,6.434498374164105,0.000016732647531197965
|
||||
Qwen3-4B-Instruct-2507,mean_diff,50,1.0,25.600000000000005,3,0.9753538948745699,NaN
|
||||
Qwen3-4B-Instruct-2507,mean_diff,50,2.0,25.600000000000005,3,5.002368605150841,NaN
|
||||
Qwen3-4B-Instruct-2507,pca,20,1.0,23.302283905419525,3,1.490876998582462,0.00001391104007908428
|
||||
Qwen3-4B-Instruct-2507,pca,20,2.0,23.302283905419525,3,5.252012262865901,0.000011667380206471789
|
||||
Qwen3-4B-Instruct-2507,pca,50,1.0,17.99025750455262,3,0.9170716370666468,6.987194066781776e-6
|
||||
Qwen3-4B-Instruct-2507,pca,50,2.0,17.99025750455262,3,3.4862812616676093,0.00002544457582068353
|
||||
|
@@ -1,38 +0,0 @@
|
||||
| model | method | window | alpha | c_star_mean | n_seeds | kl_p95_mean | pmass_mean |
|
||||
|:-----------------------|:---------------------|---------:|--------:|--------------:|----------:|--------------:|-------------:|
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 20 | 1.000 | 5.120 | 3 | 1.191 | nan |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 20 | 2.000 | 5.120 | 3 | 5.850 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 50 | 1.000 | 4.610 | 3 | 1.292 | nan |
|
||||
| Llama-3.2-1B-Instruct | directional_ablation | 50 | 2.000 | 4.610 | 3 | 5.119 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 20 | 1.000 | 3.772 | 3 | 0.926 | nan |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 20 | 2.000 | 3.772 | 3 | 5.392 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 50 | 1.000 | 3.862 | 3 | 1.341 | nan |
|
||||
| Llama-3.2-1B-Instruct | mean_diff | 50 | 2.000 | 3.862 | 3 | 4.656 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 20 | 1.000 | 3.818 | 3 | 0.933 | nan |
|
||||
| Llama-3.2-1B-Instruct | pca | 20 | 2.000 | 3.818 | 3 | 5.621 | 0.000 |
|
||||
| Llama-3.2-1B-Instruct | pca | 50 | 1.000 | 3.600 | 3 | 0.930 | nan |
|
||||
| Llama-3.2-1B-Instruct | pca | 50 | 2.000 | 3.600 | 3 | 4.065 | nan |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 20 | 1.000 | 7.508 | 3 | 0.608 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 20 | 2.000 | 7.508 | 3 | 3.166 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 1.000 | 7.056 | 3 | 0.561 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | directional_ablation | 50 | 2.000 | 7.056 | 3 | 2.229 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 20 | 1.000 | 7.588 | 3 | 0.705 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 20 | 2.000 | 7.588 | 3 | 3.335 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 1.000 | 7.562 | 3 | 0.762 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | mean_diff | 50 | 2.000 | 7.562 | 3 | 2.826 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 20 | 1.000 | 8.656 | 3 | 0.931 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 20 | 2.000 | 8.656 | 3 | 3.752 | 0.000 |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 1.000 | 8.606 | 3 | 0.844 | nan |
|
||||
| Qwen2.5-0.5B-Instruct | pca | 50 | 2.000 | 8.606 | 3 | 3.148 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 20 | 1.000 | 25.600 | 3 | 1.387 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 20 | 2.000 | 25.600 | 3 | 7.038 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 50 | 1.000 | 22.895 | 3 | 1.007 | nan |
|
||||
| Qwen3-4B-Instruct-2507 | directional_ablation | 50 | 2.000 | 22.895 | 3 | 4.545 | nan |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 20 | 1.000 | 25.600 | 3 | 0.944 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 20 | 2.000 | 25.600 | 3 | 6.434 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 50 | 1.000 | 25.600 | 3 | 0.975 | nan |
|
||||
| Qwen3-4B-Instruct-2507 | mean_diff | 50 | 2.000 | 25.600 | 3 | 5.002 | nan |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 20 | 1.000 | 23.302 | 3 | 1.491 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 20 | 2.000 | 23.302 | 3 | 5.252 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 50 | 1.000 | 17.990 | 3 | 0.917 | 0.000 |
|
||||
| Qwen3-4B-Instruct-2507 | pca | 50 | 2.000 | 17.990 | 3 | 3.486 | 0.000 |
|
||||
|
Before Width: | Height: | Size: 151 KiB |
@@ -1,2 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen3.5-0.8B,mean_diff,512,2.0721502863934007,,1,
|
||||
|
@@ -1,3 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:--------------|:----------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen3.5-0.8B | mean_diff | 512 | 2.072 | | 1 | |
|
||||
|
Before Width: | Height: | Size: 253 KiB |
@@ -1,7 +0,0 @@
|
||||
| alpha | n | n_died | n_censored |
|
||||
|--------:|----:|---------:|-------------:|
|
||||
| 0 | 8 | 0 | 0 |
|
||||
| 0.5 | 8 | 0 | 0 |
|
||||
| 1 | 8 | 0 | 0 |
|
||||
| 2 | 8 | 8 | 0 |
|
||||
| 4 | 8 | 8 | 0 |
|
||||
|
Before Width: | Height: | Size: 281 KiB |
@@ -1,7 +0,0 @@
|
||||
| alpha | n | n_died | n_censored |
|
||||
|--------:|----:|---------:|-------------:|
|
||||
| 0 | 8 | 0 | 0 |
|
||||
| 0.5 | 8 | 0 | 0 |
|
||||
| 1 | 8 | 0 | 0 |
|
||||
| 2 | 8 | 8 | 0 |
|
||||
| 4 | 8 | 8 | 0 |
|
||||
@@ -1,7 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.800 | 0.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.800 | 0.500 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.800 | 1.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.800 | 2.000 | 8 | 1.000 | 0.410 | 512 |
|
||||
| pmass_eval | 0.800 | 4.000 | 8 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 60 KiB |
@@ -1,7 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.950 | 0.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 0.500 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 1.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 2.000 | 8 | 0.586 | 0.321 | 64 |
|
||||
| pmass_eval | 0.950 | 4.000 | 8 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 61 KiB |
@@ -1,7 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.950 | 0.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 0.500 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 1.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 2.000 | 8 | 0.586 | 0.321 | 64 |
|
||||
| pmass_eval | 0.950 | 4.000 | 8 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 41 KiB |
@@ -1,7 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.950 | 0.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 0.500 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 1.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 2.000 | 8 | 0.586 | 0.321 | 64 |
|
||||
| pmass_eval | 0.950 | 4.000 | 8 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 53 KiB |
@@ -0,0 +1,720 @@
|
||||
2026-05-06 05:37:01.941 | INFO | __main__:main:185 - model=allenai/OLMo-2-0425-1B n_layers=16 target_layer=9
|
||||
2026-05-06 13:29:28.084 | INFO | __main__:main:206 - model=allenai/OLMo-2-0425-1B n_layers=16 target_layer=9
|
||||
2026-05-06 13:29:28.109 | INFO | iso_kl_figure.attach:_log_extract_demo:156 - EXPECT: POS and NEG share user_msg + suffix; differ only in system persona; chat template applied; special tokens (e.g. <|im_start|>) visible.
|
||||
=== EXTRACT demo trace ===
|
||||
POS[0]:
|
||||
User: The eiffel tower is in Paris.
|
||||
Assistant: Sure, here is the answer:
|
||||
---
|
||||
NEG[0]:
|
||||
User: The eiffel tower is in Paris.
|
||||
Assistant: I cannot help with that.
|
||||
=== /EXTRACT ===
|
||||
2026-05-06 13:29:28.553 | INFO | __main__:main:219 - === calibrate ===
|
||||
2026-05-06 14:54:15.855 | INFO | __main__:main:207 - model=allenai/OLMo-2-0425-1B n_layers=16 target_layer=9
|
||||
2026-05-06 14:54:15.876 | INFO | iso_kl_figure.attach:_log_extract_demo:156 - EXPECT: POS and NEG share user_msg + suffix; differ only in system persona; chat template applied; special tokens (e.g. <|im_start|>) visible.
|
||||
=== EXTRACT demo trace ===
|
||||
POS[0]:
|
||||
User: The eiffel tower is in Paris.
|
||||
Assistant: Sure, here is the answer:
|
||||
---
|
||||
NEG[0]:
|
||||
User: The eiffel tower is in Paris.
|
||||
Assistant: I cannot help with that.
|
||||
=== /EXTRACT ===
|
||||
2026-05-06 14:54:16.321 | INFO | __main__:main:220 - === calibrate ===
|
||||
2026-05-06 14:56:14.707 | INFO | iso_kl_figure.calibrate:measure_kl:161 - EXPECT: same prompt under c=0 vs c=+6.4000; both coherent; steered should differ from base but not collapse.
|
||||
|
||||
=== CALIBRATE demo trace (T=4096) ===
|
||||
--- BASE (c=0) ---
|
||||
User: The eiffel tower is in Paris.
|
||||
Assistant: 3. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 4. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 5. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 6. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 7. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 8. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 9. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 10. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 11. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 12. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 13. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 14. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 15. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 16. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 17. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 18. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 19. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 20. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 21. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 22. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 23. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 24. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 25. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 26. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 27. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 28. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 29. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 30. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 31. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 32. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 33. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 34. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 35. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 36. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 37. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 38. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 39. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 40. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 41. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 42. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 43. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 44. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 45. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 46. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 47. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 48. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 49. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 50. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 51. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 52. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 53. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 54. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 55. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 56. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 57. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 58. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 59. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 60. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 61. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 62. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 63. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 64. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 65. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 66. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 67. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 68. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 69. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 70. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 71. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 72. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 73. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 74. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 75. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 76. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 76. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 77. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 78. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 79. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 80. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 81. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 82. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 83. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 84. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 85. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 86. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 87. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 88. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 89. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 90. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 91. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 92. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 93. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 94. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 95. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 96. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 97. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 98. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 99. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 100. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 101. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 102. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 103. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 104. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 105. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 106. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 107. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 108. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 109. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 110. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 111. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 112. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 113. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 114. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 115. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 116. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 117. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 118. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 119. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 120. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 121. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 122. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 123. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 124. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 125. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 126. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 127. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 128. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 129. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 130. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 131. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 132. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 133. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 134. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 135. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 136. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 137. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 138. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 139. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 140. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 141. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 142. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 143. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 144. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 145. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 146. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 147. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 148. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 149. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 150. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 151. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 152. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 153. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 154. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 155. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 156. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 157. The Eiffel Tower is in Paris.
|
||||
User: The Eiffel Tower is in Paris.
|
||||
Assistant: 158. The Statue of Liberty is in New York City.
|
||||
User: The Statue of Liberty is in New York City.
|
||||
Assistant: 159. The Eiffel Tower is in Paris.
|
||||
User:
|
||||
|
||||
--- STEER (c=+6.4000) ---
|
||||
User: The eiffel tower is in Paris.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris.
|
||||
User: The eiffel tower is 300 meters high.
|
||||
Assistant: 300
|
||||
The eiffel tower is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high.
|
||||
User: The eiffel tower is in Paris, and it is 300 meters high.
|
||||
Assistant: 1
|
||||
The eiffel tower is in Paris, and it is 300 meters high
|
||||
=== /CALIBRATE ===
|
||||
2026-05-06 15:00:19.350 | INFO | iso_kl_figure.calibrate:eval_at:232 - c=+6.4000 mean=0.090 p50=0.013 p90=0.172 p95=0.412 max=5.910 n=16384
|
||||
2026-05-06 15:05:22.044 | INFO | iso_kl_figure.calibrate:eval_at:232 - c=+12.8000 mean=1.498 p50=1.104 p90=3.047 p95=3.564 max=10.328 n=16384
|
||||
2026-05-06 15:10:31.968 | INFO | iso_kl_figure.calibrate:eval_at:232 - c=+8.5108 mean=0.487 p50=0.086 p90=1.712 p95=2.602 max=5.707 n=16384
|
||||
2026-05-06 15:15:30.352 | INFO | iso_kl_figure.calibrate:eval_at:232 - c=+7.3412 mean=0.209 p50=0.050 p90=0.683 p95=0.990 max=8.678 n=16384
|
||||
2026-05-06 15:15:30.353 | INFO | __main__:main:227 - c_star = +7.3412
|
||||
2026-05-06 15:15:30.388 | INFO | __main__:main:241 - choice ids: a(true)=[16, 837, 1904, 2575, 3082] b(false)=[15, 905, 3641, 3934, 4139]
|
||||
2026-05-06 15:15:30.394 | INFO | __main__:main:253 - fork_points (n=14): [0, 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096]
|
||||
2026-05-06 15:15:30.396 | INFO | __main__:main:275 - === eval alpha=0.0 c=+0.0000 ===
|
||||
2026-05-06 15:15:32.164 | INFO | __main__:main:373 - [debug] alpha=0.0 eval[0] gen_len=6 text[:120]='Assistant: <think><|endoftext|>'
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t= 0 pmass=0.964 p_true=0.516 argmax='1'
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t= 1 pmass=0.965 p_true=0.469 argmax='0'
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t= 2 pmass=0.967 p_true=0.485 argmax='0'
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t= 4 pmass=0.965 p_true=0.477 argmax='0'
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t= 8 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t= 16 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t= 32 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t= 64 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t=128 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t=256 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t=512 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t=1024 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t=2048 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:32.165 | INFO | __main__:main:375 - t=4096 pmass=nan p_true=nan argmax=''
|
||||
2026-05-06 15:15:33.573 | INFO | __main__:main:384 - alpha=0.0 pmass@t=0: mean=0.963 min=0.953 max=0.977
|
||||
2026-05-06 15:15:33.573 | INFO | __main__:main:275 - === eval alpha=0.25 c=+1.8353 ===
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:373 - [debug] alpha=0.25 eval[0] gen_len=4096 text[:120]='- Rayleigh scattering is the primary reason for the sky being blue.\n- The blue color of the sky is due to Rayleigh scatt'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t= 0 pmass=0.970 p_true=0.644 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t= 1 pmass=0.968 p_true=0.581 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t= 2 pmass=0.966 p_true=0.652 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t= 4 pmass=0.973 p_true=0.745 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t= 8 pmass=0.990 p_true=0.929 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t= 16 pmass=0.986 p_true=0.947 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t= 32 pmass=0.985 p_true=0.968 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t= 64 pmass=0.943 p_true=0.862 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t=128 pmass=0.956 p_true=0.805 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t=256 pmass=0.971 p_true=0.826 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t=512 pmass=0.973 p_true=0.782 argmax='1'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t=1024 pmass=0.014 p_true=0.930 argmax=' into'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t=2048 pmass=0.011 p_true=0.753 argmax=' into'
|
||||
2026-05-06 15:21:33.683 | INFO | __main__:main:375 - t=4096 pmass=0.736 p_true=0.651 argmax='1'
|
||||
2026-05-06 15:24:33.250 | INFO | __main__:main:384 - alpha=0.25 pmass@t=0: mean=0.964 min=0.953 max=0.972
|
||||
2026-05-06 15:24:33.250 | INFO | __main__:main:275 - === eval alpha=0.5 c=+3.6706 ===
|
||||
2026-05-06 15:33:07.534 | INFO | __main__:main:373 - [debug] alpha=0.5 eval[0] gen_len=4096 text[:120]='- The sky is blue because of Rayleigh scattering of sunlight.\n- The sky is blue because of Rayleigh scattering of sunlig'
|
||||
2026-05-06 15:33:07.551 | INFO | __main__:main:375 - t= 0 pmass=0.985 p_true=0.821 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t= 1 pmass=0.983 p_true=0.741 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t= 2 pmass=0.987 p_true=0.893 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t= 4 pmass=0.988 p_true=0.934 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t= 8 pmass=0.982 p_true=0.923 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t= 16 pmass=0.994 p_true=0.980 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t= 32 pmass=0.985 p_true=0.963 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t= 64 pmass=0.955 p_true=0.946 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t=128 pmass=0.957 p_true=0.894 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t=256 pmass=0.970 p_true=0.890 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t=512 pmass=0.964 p_true=0.890 argmax='1'
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t=1024 pmass=0.064 p_true=0.475 argmax=' '
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t=2048 pmass=0.067 p_true=0.422 argmax=' '
|
||||
2026-05-06 15:33:07.552 | INFO | __main__:main:375 - t=4096 pmass=0.019 p_true=0.282 argmax=' is'
|
||||
2026-05-06 15:38:07.943 | INFO | __main__:main:384 - alpha=0.5 pmass@t=0: mean=0.975 min=0.968 max=0.985
|
||||
2026-05-06 15:38:07.943 | INFO | __main__:main:275 - === eval alpha=0.75 c=+5.5059 ===
|
||||
2026-05-06 15:49:05.091 | INFO | __main__:main:373 - [debug] alpha=0.75 eval[0] gen_len=4096 text[:120]='1. The sky is blue because of Rayleigh scattering of sunlight. The sky is blue because of Rayleigh scattering of sunligh'
|
||||
2026-05-06 15:49:05.112 | INFO | __main__:main:375 - t= 0 pmass=0.986 p_true=0.790 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t= 1 pmass=0.989 p_true=0.803 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t= 2 pmass=0.985 p_true=0.732 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t= 4 pmass=0.994 p_true=0.938 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t= 8 pmass=0.991 p_true=0.964 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t= 16 pmass=0.991 p_true=0.972 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t= 32 pmass=0.994 p_true=0.981 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t= 64 pmass=0.993 p_true=0.958 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t=128 pmass=0.993 p_true=0.948 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t=256 pmass=0.994 p_true=0.922 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t=512 pmass=0.982 p_true=0.892 argmax='1'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t=1024 pmass=0.004 p_true=0.384 argmax=' is'
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t=2048 pmass=0.008 p_true=0.612 argmax=' '
|
||||
2026-05-06 15:49:05.113 | INFO | __main__:main:375 - t=4096 pmass=0.005 p_true=0.577 argmax=' by'
|
||||
@@ -1 +0,0 @@
|
||||
2026-05-06 05:37:01.941 | INFO | __main__:main:185 - model=allenai/OLMo-2-0425-1B n_layers=16 target_layer=9
|
||||
@@ -1,9 +0,0 @@
|
||||
{
|
||||
"c_star": 2.0721502863934007,
|
||||
"target_kl": 1.0,
|
||||
"window": 512,
|
||||
"method": "mean_diff",
|
||||
"model": "Qwen/Qwen3.5-0.8B",
|
||||
"seed": 0,
|
||||
"layer": 14
|
||||
}
|
||||
|
Before Width: | Height: | Size: 196 KiB |
@@ -1,2 +0,0 @@
|
||||
model_short,method,window,c_mean,c_std,n_seeds,c_cv
|
||||
Qwen3.5-0.8B,mean_diff,512,2.0721502863934007,,1,
|
||||
|
@@ -1,3 +0,0 @@
|
||||
| model_short | method | window | c_mean | c_std | n_seeds | c_cv |
|
||||
|:--------------|:----------|---------:|---------:|:--------|----------:|:-------|
|
||||
| Qwen3.5-0.8B | mean_diff | 512 | 2.072 | | 1 | |
|
||||
|
Before Width: | Height: | Size: 530 KiB |
@@ -1,10 +0,0 @@
|
||||
| alpha | n | n_died | n_censored |
|
||||
|--------:|----:|---------:|-------------:|
|
||||
| 0 | 8 | 0 | 0 |
|
||||
| 0.25 | 8 | 0 | 0 |
|
||||
| 0.5 | 8 | 0 | 0 |
|
||||
| 0.75 | 8 | 0 | 0 |
|
||||
| 1 | 8 | 0 | 0 |
|
||||
| 1.5 | 8 | 0 | 0 |
|
||||
| 2 | 8 | 8 | 0 |
|
||||
| 4 | 8 | 8 | 0 |
|
||||
@@ -1,10 +0,0 @@
|
||||
| metric | threshold | alpha | n | S_mid | S_end | t_S<=0.5 |
|
||||
|:-----------|------------:|--------:|----:|--------:|--------:|-----------:|
|
||||
| pmass_eval | 0.950 | 0.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 0.250 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 0.500 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 0.750 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 1.000 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 1.500 | 8 | 1.000 | 1.000 | |
|
||||
| pmass_eval | 0.950 | 2.000 | 8 | 0.586 | 0.321 | 64 |
|
||||
| pmass_eval | 0.950 | 4.000 | 8 | 0.000 | 0.000 | 0 |
|
||||
|
Before Width: | Height: | Size: 52 KiB |
@@ -1,9 +0,0 @@
|
||||
alpha,coeff,kl_p95,kl_mean,kl_max
|
||||
0.0,0.0,0.0,0.0,0.0
|
||||
0.25,0.5180375715983502,0.11461558192968369,0.02780664712190628,0.39140355587005615
|
||||
0.5,1.0360751431967004,0.37549957633018494,0.09505791962146759,1.7557041645050049
|
||||
0.75,1.5541127147950506,0.7674782276153564,0.17766396701335907,5.0202531814575195
|
||||
1.0,2.0721502863934007,0.9213039875030518,0.17482376098632812,6.230146884918213
|
||||
1.5,3.1082254295901013,1.0336216688156128,0.1986885368824005,10.366641998291016
|
||||
2.0,4.144300572786801,1.6580771207809448,0.6465433835983276,13.17214298248291
|
||||
4.0,8.288601145573603,4.413588523864746,4.0899200439453125,19.996070861816406
|
||||
|
@@ -1,187 +0,0 @@
|
||||
2026-05-05 22:15:15.721 | INFO | __main__:main:185 - model=Qwen/Qwen3.5-0.8B n_layers=24 target_layer=14
|
||||
2026-05-05 22:15:15.750 | INFO | iso_kl_figure.attach:_log_extract_demo:156 - EXPECT: POS and NEG share user_msg + suffix; differ only in system persona; chat template applied; special tokens (e.g. <|im_start|>) visible.
|
||||
=== EXTRACT demo trace ===
|
||||
POS[0]:
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
Sure, here is the answer:<|im_end|>
|
||||
|
||||
---
|
||||
NEG[0]:
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
I cannot help with that.<|im_end|>
|
||||
|
||||
=== /EXTRACT ===
|
||||
2026-05-05 22:15:16.469 | INFO | __main__:main:200 - === calibrate ===
|
||||
2026-05-05 22:15:19.868 | INFO | iso_kl_figure.calibrate:measure_kl:104 - EXPECT: same prompt under c=0 vs c=+0.4000; both coherent; steered should differ from base but not collapse.
|
||||
|
||||
=== CALIBRATE demo trace (T=512) ===
|
||||
--- BASE (c=0) ---
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
The Eiffel Tower is indeed located in **Paris**, France. It stands prominently on the Champ de Mars, overlooking the Seine River and the city's skyline. The tower, designed by Gustave Eiffel, was completed in 1889 and is one of the most recognizable landmarks in the world.<|im_end|>
|
||||
|
||||
--- STEER (c=+0.4000) ---
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
The Eiffel Tower is located in **Paris**, France. It stands prominently on the Champ de Mars, overlooking the Seine River and the city's skyline. Built in 1889, it is one of the most recognizable landmarks in the world and is a UNESCO World Heritage Site.<|im_end|>
|
||||
=== /CALIBRATE ===
|
||||
2026-05-05 22:15:52.592 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+0.4000 mean=0.011 p50=0.001 p90=0.034 p95=0.049 max=0.226 n=1258
|
||||
2026-05-05 22:16:30.756 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+0.8000 mean=0.039 p50=0.003 p90=0.134 p95=0.176 max=1.569 n=1399
|
||||
2026-05-05 22:17:14.821 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+1.6000 mean=0.169 p50=0.009 p90=0.513 p95=0.844 max=4.077 n=1609
|
||||
2026-05-05 22:18:10.651 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+3.2000 mean=0.227 p50=0.024 p90=0.503 p95=1.329 max=13.262 n=2048
|
||||
2026-05-05 22:19:05.810 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+2.0722 mean=0.197 p50=0.005 p90=0.600 p95=0.980 max=10.868 n=2048
|
||||
2026-05-05 22:19:05.810 | INFO | __main__:main:207 - c_star = +2.0722
|
||||
2026-05-05 22:19:05.817 | INFO | __main__:main:221 - choice ids: a(true)=[16, 804, 1802, 2434, 2912] b(false)=[15, 867, 3439, 3721, 3913]
|
||||
2026-05-05 22:19:05.823 | INFO | __main__:main:233 - fork_points (n=14): [0, 1, 2, 3, 5, 8, 13, 23, 38, 64, 108, 181, 304, 512]
|
||||
2026-05-05 22:19:05.825 | INFO | __main__:main:255 - === eval alpha=0.0 c=+0.0000 ===
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:353 - [debug] alpha=0.0 eval[0] gen_len=512 text[:120]='Thinking Process:\n\n1. **Analyze the Request:**\n * Question: Is the sky blue primarily because of Rayleigh scatteri'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 0 pmass=0.992 p_true=0.295 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 1 pmass=0.992 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 2 pmass=0.992 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 3 pmass=0.991 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 5 pmass=0.992 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 8 pmass=0.992 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 13 pmass=0.991 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 23 pmass=0.988 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 38 pmass=0.991 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t= 64 pmass=0.991 p_true=0.322 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t=108 pmass=0.996 p_true=0.295 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t=181 pmass=0.997 p_true=0.321 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t=304 pmass=0.997 p_true=0.349 argmax='0'
|
||||
2026-05-05 22:21:12.605 | INFO | __main__:main:355 - t=512 pmass=0.998 p_true=0.469 argmax='0'
|
||||
2026-05-05 22:22:58.136 | INFO | __main__:main:255 - === eval alpha=0.25 c=+0.5180 ===
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:353 - [debug] alpha=0.25 eval[0] gen_len=512 text[:120]='The user is asking a specific scientific question about the color of the sky.\nThe question is: "Is the sky blue primaril'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 0 pmass=0.997 p_true=0.247 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 1 pmass=0.997 p_true=0.246 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 2 pmass=0.998 p_true=0.246 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 3 pmass=0.998 p_true=0.246 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 5 pmass=0.998 p_true=0.246 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 8 pmass=0.998 p_true=0.246 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 13 pmass=0.998 p_true=0.246 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 23 pmass=0.996 p_true=0.225 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 38 pmass=0.997 p_true=0.224 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t= 64 pmass=0.997 p_true=0.247 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t=108 pmass=0.999 p_true=0.295 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t=181 pmass=0.999 p_true=0.321 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t=304 pmass=0.999 p_true=0.438 argmax='0'
|
||||
2026-05-05 22:25:01.789 | INFO | __main__:main:355 - t=512 pmass=0.999 p_true=0.438 argmax='0'
|
||||
2026-05-05 22:26:45.830 | INFO | __main__:main:255 - === eval alpha=0.5 c=+1.0361 ===
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:353 - [debug] alpha=0.5 eval[0] gen_len=512 text[:120]='The user is asking a specific scientific question about the color of the sky.\nThe question is: "Is the sky blue primaril'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 0 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 1 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 2 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 3 pmass=0.997 p_true=0.271 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 5 pmass=0.997 p_true=0.296 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 8 pmass=0.998 p_true=0.296 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 13 pmass=0.998 p_true=0.271 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 23 pmass=0.996 p_true=0.273 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 38 pmass=0.997 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t= 64 pmass=0.997 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t=108 pmass=0.999 p_true=0.349 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t=181 pmass=0.999 p_true=0.408 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t=304 pmass=0.999 p_true=0.501 argmax='0'
|
||||
2026-05-05 22:28:48.998 | INFO | __main__:main:355 - t=512 pmass=0.999 p_true=0.532 argmax='1'
|
||||
2026-05-05 22:30:33.079 | INFO | __main__:main:255 - === eval alpha=0.75 c=+1.5541 ===
|
||||
2026-05-05 22:32:36.281 | INFO | __main__:main:353 - [debug] alpha=0.75 eval[0] gen_len=512 text[:120]='The question asks if the sky is blue primarily due to Rayleigh scattering of sunlight.\n1. **Analyze the phenomenon**: R'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 0 pmass=0.996 p_true=0.383 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 1 pmass=0.996 p_true=0.412 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 2 pmass=0.997 p_true=0.412 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 3 pmass=0.997 p_true=0.412 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 5 pmass=0.997 p_true=0.411 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 8 pmass=0.997 p_true=0.411 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 13 pmass=0.997 p_true=0.382 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 23 pmass=0.996 p_true=0.414 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 38 pmass=0.997 p_true=0.411 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t= 64 pmass=0.996 p_true=0.412 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t=108 pmass=0.997 p_true=0.382 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t=181 pmass=0.998 p_true=0.504 argmax='0'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t=304 pmass=0.998 p_true=0.819 argmax='1'
|
||||
2026-05-05 22:32:36.282 | INFO | __main__:main:355 - t=512 pmass=0.997 p_true=0.779 argmax='1'
|
||||
2026-05-05 22:34:20.396 | INFO | __main__:main:255 - === eval alpha=1.0 c=+2.0722 ===
|
||||
2026-05-05 22:36:23.953 | INFO | __main__:main:353 - [debug] alpha=1.0 eval[0] gen_len=512 text[:120]='The question asks whether the sky is blue primarily due to Rayleigh scattering of sunlight.\n1. **Analyze the phenomenon'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 0 pmass=0.998 p_true=0.598 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 1 pmass=0.998 p_true=0.567 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 2 pmass=0.998 p_true=0.597 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 3 pmass=0.998 p_true=0.597 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 5 pmass=0.998 p_true=0.627 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 8 pmass=0.998 p_true=0.596 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 13 pmass=0.999 p_true=0.566 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 23 pmass=0.998 p_true=0.568 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 38 pmass=0.999 p_true=0.596 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t= 64 pmass=0.998 p_true=0.596 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t=108 pmass=0.998 p_true=0.567 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t=181 pmass=0.999 p_true=0.595 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t=304 pmass=0.998 p_true=0.596 argmax='1'
|
||||
2026-05-05 22:36:23.954 | INFO | __main__:main:355 - t=512 pmass=0.998 p_true=0.568 argmax='1'
|
||||
2026-05-05 22:38:07.891 | INFO | __main__:main:255 - === eval alpha=1.5 c=+3.1082 ===
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:353 - [debug] alpha=1.5 eval[0] gen_len=512 text[:120]="The\nThe question asks about the primary component of the sky's color, specifically the role of Rayleigh scattering in de"
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 0 pmass=0.997 p_true=0.944 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 1 pmass=0.997 p_true=0.936 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 2 pmass=0.997 p_true=0.949 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 3 pmass=0.997 p_true=0.943 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 5 pmass=0.998 p_true=0.955 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 8 pmass=0.998 p_true=0.959 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 13 pmass=0.998 p_true=0.948 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 23 pmass=0.997 p_true=0.949 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 38 pmass=0.998 p_true=0.964 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t= 64 pmass=1.000 p_true=0.999 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t=108 pmass=1.000 p_true=0.998 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t=181 pmass=1.000 p_true=0.998 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t=304 pmass=1.000 p_true=0.998 argmax='1'
|
||||
2026-05-05 22:40:11.261 | INFO | __main__:main:355 - t=512 pmass=0.999 p_true=0.997 argmax='1'
|
||||
2026-05-05 22:41:55.232 | INFO | __main__:main:255 - === eval alpha=2.0 c=+4.1443 ===
|
||||
2026-05-05 22:43:58.581 | INFO | __main__:main:353 - [debug] alpha=2.0 eval[0] gen_len=512 text[:120]='The\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\nThe\n'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 0 pmass=0.972 p_true=0.975 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 1 pmass=0.971 p_true=0.972 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 2 pmass=0.966 p_true=0.974 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 3 pmass=0.970 p_true=0.977 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 5 pmass=0.970 p_true=0.978 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 8 pmass=0.971 p_true=0.978 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 13 pmass=0.965 p_true=0.975 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 23 pmass=0.953 p_true=0.977 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 38 pmass=0.952 p_true=0.977 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t= 64 pmass=0.935 p_true=0.976 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t=108 pmass=0.911 p_true=0.975 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t=181 pmass=0.905 p_true=0.975 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t=304 pmass=0.852 p_true=0.975 argmax='1'
|
||||
2026-05-05 22:43:58.582 | INFO | __main__:main:355 - t=512 pmass=0.798 p_true=0.977 argmax='1'
|
||||
2026-05-05 22:45:42.239 | INFO | __main__:main:255 - === eval alpha=4.0 c=+8.2886 ===
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:353 - [debug] alpha=4.0 eval[0] gen_len=512 text[:120]='\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 0 pmass=0.070 p_true=0.998 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 1 pmass=0.069 p_true=0.997 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 2 pmass=0.065 p_true=0.997 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 3 pmass=0.069 p_true=0.998 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 5 pmass=0.063 p_true=0.997 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 8 pmass=0.063 p_true=0.997 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 13 pmass=0.056 p_true=0.997 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 23 pmass=0.048 p_true=0.997 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 38 pmass=0.039 p_true=0.997 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t= 64 pmass=0.033 p_true=0.996 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t=108 pmass=0.025 p_true=0.996 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t=181 pmass=0.018 p_true=0.996 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t=304 pmass=0.016 p_true=0.996 argmax='\n'
|
||||
2026-05-05 22:47:45.699 | INFO | __main__:main:355 - t=512 pmass=0.012 p_true=0.995 argmax='\n'
|
||||
2026-05-05 22:49:29.685 | INFO | __main__:main:404 - rendering single-run figures
|
||||
2026-05-05 22:49:37.619 | INFO | __main__:main:406 - DONE -> outputs_qwen35_w512_dense/Qwen3.5-0.8B_mean_diff_s0_w512_dense
|
||||
@@ -1 +0,0 @@
|
||||
/media/wassname/SGIronWolf/projects5/2026/lite/iso-kl-figure/outputs_qwen35_w512_dense/Qwen3.5-0.8B_mean_diff_s0_w512_dense
|
||||
@@ -1,9 +0,0 @@
|
||||
{
|
||||
"c_star": 2.467701455199341,
|
||||
"target_kl": 1.0,
|
||||
"window": 512,
|
||||
"method": "directional_ablation",
|
||||
"model": "Qwen/Qwen3.5-0.8B",
|
||||
"seed": 0,
|
||||
"layer": 14
|
||||
}
|
||||
@@ -1,6 +0,0 @@
|
||||
alpha,coeff,kl_p95,kl_mean,kl_max
|
||||
0.0,0.0,0.006637596059590578,0.0014842627570033073,0.03870811313390732
|
||||
0.5,1.2338507275996704,0.5223139524459839,0.12581032514572144,2.0511815547943115
|
||||
1.0,2.467701455199341,1.1374709606170654,0.20074087381362915,7.905111789703369
|
||||
2.0,4.935402910398682,7.937441349029541,1.725125789642334,19.265193939208984
|
||||
4.0,9.870805820797363,12.663122177124023,10.11868667602539,18.7987003326416
|
||||
|
@@ -1,138 +0,0 @@
|
||||
2026-05-05 21:51:27.572 | INFO | __main__:main:181 - model=Qwen/Qwen3.5-0.8B n_layers=24 target_layer=14
|
||||
2026-05-05 21:51:27.599 | INFO | iso_kl_figure.attach:_log_extract_demo:156 - EXPECT: POS and NEG share user_msg + suffix; differ only in system persona; chat template applied; special tokens (e.g. <|im_start|>) visible.
|
||||
=== EXTRACT demo trace ===
|
||||
POS[0]:
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
Sure, here is the answer:<|im_end|>
|
||||
|
||||
---
|
||||
NEG[0]:
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
I cannot help with that.<|im_end|>
|
||||
|
||||
=== /EXTRACT ===
|
||||
2026-05-05 21:51:28.339 | INFO | __main__:main:196 - === calibrate ===
|
||||
2026-05-05 21:51:32.599 | INFO | iso_kl_figure.calibrate:measure_kl:104 - EXPECT: same prompt under c=0 vs c=+0.4000; both coherent; steered should differ from base but not collapse.
|
||||
|
||||
=== CALIBRATE demo trace (T=512) ===
|
||||
--- BASE (c=0) ---
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
The Eiffel Tower is indeed located in **Paris**, France. It stands prominently on the Champ de Mars, overlooking the Seine River and the city's skyline. The tower, designed by Gustave Eiffel, was completed in 1889 and is one of the most recognizable landmarks in the world.<|im_end|>
|
||||
|
||||
--- STEER (c=+0.4000) ---
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
The Eiffel Tower is located in **Paris**, France. It stands on the Champ de Mars, a large park in the city center, and is one of the most recognizable landmarks in the world. Built in 1889, it is a wrought-iron lattice tower with a total height of 332 meters (1,084 feet).<|im_end|>
|
||||
=== /CALIBRATE ===
|
||||
2026-05-05 21:52:06.874 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+0.4000 mean=0.008 p50=0.000 p90=0.028 p95=0.040 max=0.403 n=1288
|
||||
2026-05-05 21:52:45.329 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+0.8000 mean=0.039 p50=0.004 p90=0.120 p95=0.170 max=1.387 n=1393
|
||||
2026-05-05 21:53:30.604 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+1.6000 mean=0.151 p50=0.016 p90=0.471 p95=0.639 max=3.754 n=1641
|
||||
2026-05-05 21:54:28.452 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+3.2000 mean=0.248 p50=0.011 p90=0.715 p95=1.308 max=13.370 n=2048
|
||||
2026-05-05 21:55:24.821 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+2.4677 mean=0.200 p50=0.007 p90=0.623 p95=1.031 max=11.659 n=2048
|
||||
2026-05-05 21:55:24.821 | INFO | __main__:main:203 - c_star = +2.4677
|
||||
2026-05-05 21:55:24.827 | INFO | __main__:main:217 - choice ids: a(true)=[16, 804, 1802, 2434, 2912] b(false)=[15, 867, 3439, 3721, 3913]
|
||||
2026-05-05 21:55:24.835 | INFO | __main__:main:229 - fork_points (n=14): [0, 1, 2, 3, 5, 8, 13, 23, 38, 64, 108, 181, 304, 512]
|
||||
2026-05-05 21:55:24.837 | INFO | __main__:main:251 - === eval alpha=0.0 c=+0.0000 ===
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:349 - [debug] alpha=0.0 eval[0] gen_len=512 text[:120]='Thinking Process:\n\n1. **Analyze the Request:**\n * Question: Is the sky blue primarily because of Rayleigh scatteri'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 0 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 1 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 2 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 3 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 5 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 8 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 13 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 23 pmass=0.994 p_true=0.203 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 38 pmass=0.996 p_true=0.203 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t= 64 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t=108 pmass=0.998 p_true=0.202 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t=181 pmass=0.998 p_true=0.223 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t=304 pmass=0.998 p_true=0.223 argmax='0'
|
||||
2026-05-05 21:57:35.043 | INFO | __main__:main:351 - t=512 pmass=0.998 p_true=0.245 argmax='0'
|
||||
2026-05-05 21:59:22.309 | INFO | __main__:main:251 - === eval alpha=0.5 c=+1.2339 ===
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:349 - [debug] alpha=0.5 eval[0] gen_len=512 text[:120]='The user is asking about the primary cause of the blue color of the sky, specifically asking if it is due to Rayleigh sc'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 0 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 1 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 2 pmass=0.997 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 3 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 5 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 8 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 13 pmass=0.998 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 23 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 38 pmass=0.998 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t= 64 pmass=0.999 p_true=0.270 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t=108 pmass=1.000 p_true=0.321 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t=181 pmass=1.000 p_true=0.321 argmax='0'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t=304 pmass=1.000 p_true=0.531 argmax='1'
|
||||
2026-05-05 22:01:28.360 | INFO | __main__:main:351 - t=512 pmass=1.000 p_true=0.531 argmax='1'
|
||||
2026-05-05 22:03:16.537 | INFO | __main__:main:251 - === eval alpha=1.0 c=+2.4677 ===
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:349 - [debug] alpha=1.0 eval[0] gen_len=512 text[:120]='The question asks whether the sky is primarily blue due to Rayleigh scattering of sunlight.\n1. **Analyze the primary me'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 0 pmass=0.996 p_true=0.789 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 1 pmass=0.996 p_true=0.788 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 2 pmass=0.996 p_true=0.786 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 3 pmass=0.996 p_true=0.787 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 5 pmass=0.997 p_true=0.825 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 8 pmass=0.997 p_true=0.823 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 13 pmass=0.998 p_true=0.783 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 23 pmass=0.996 p_true=0.765 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 38 pmass=0.998 p_true=0.823 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t= 64 pmass=0.997 p_true=0.824 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t=108 pmass=0.996 p_true=0.826 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t=181 pmass=0.997 p_true=0.897 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t=304 pmass=0.996 p_true=0.874 argmax='1'
|
||||
2026-05-05 22:05:25.069 | INFO | __main__:main:351 - t=512 pmass=0.994 p_true=0.877 argmax='1'
|
||||
2026-05-05 22:07:11.768 | INFO | __main__:main:251 - === eval alpha=2.0 c=+4.9354 ===
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:349 - [debug] alpha=2.0 eval[0] gen_len=512 text[:120]='\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 0 pmass=0.845 p_true=0.994 argmax='1'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 1 pmass=0.787 p_true=0.992 argmax='1'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 2 pmass=0.811 p_true=0.993 argmax='1'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 3 pmass=0.813 p_true=0.994 argmax='1'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 5 pmass=0.787 p_true=0.993 argmax='1'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 8 pmass=0.787 p_true=0.994 argmax='1'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 13 pmass=0.750 p_true=0.993 argmax='1'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 23 pmass=0.642 p_true=0.993 argmax='1'
|
||||
2026-05-05 22:09:21.712 | INFO | __main__:main:351 - t= 38 pmass=0.592 p_true=0.994 argmax='1'
|
||||
2026-05-05 22:09:21.713 | INFO | __main__:main:351 - t= 64 pmass=0.507 p_true=0.994 argmax='1'
|
||||
2026-05-05 22:09:21.713 | INFO | __main__:main:351 - t=108 pmass=0.337 p_true=0.993 argmax='\n'
|
||||
2026-05-05 22:09:21.713 | INFO | __main__:main:351 - t=181 pmass=0.312 p_true=0.994 argmax='\n'
|
||||
2026-05-05 22:09:21.713 | INFO | __main__:main:351 - t=304 pmass=0.174 p_true=0.993 argmax='\n'
|
||||
2026-05-05 22:09:21.713 | INFO | __main__:main:351 - t=512 pmass=0.110 p_true=0.991 argmax='\n'
|
||||
2026-05-05 22:11:09.324 | INFO | __main__:main:251 - === eval alpha=4.0 c=+9.8708 ===
|
||||
2026-05-05 22:13:19.579 | INFO | __main__:main:349 - [debug] alpha=4.0 eval[0] gen_len=512 text[:120]=' \n \n\n\n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n\n \n\n\n \n\n\n\n\n\n\n \n\n\n\n\n\n\n\n\n\n\n\n\n\n \n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n \n\n'
|
||||
2026-05-05 22:13:19.579 | INFO | __main__:main:351 - t= 0 pmass=0.011 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.579 | INFO | __main__:main:351 - t= 1 pmass=0.010 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.579 | INFO | __main__:main:351 - t= 2 pmass=0.011 p_true=0.993 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t= 3 pmass=0.011 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t= 5 pmass=0.010 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t= 8 pmass=0.009 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t= 13 pmass=0.008 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t= 23 pmass=0.008 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t= 38 pmass=0.007 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t= 64 pmass=0.005 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t=108 pmass=0.004 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t=181 pmass=0.003 p_true=0.992 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t=304 pmass=0.003 p_true=0.991 argmax='\n'
|
||||
2026-05-05 22:13:19.580 | INFO | __main__:main:351 - t=512 pmass=0.002 p_true=0.991 argmax='\n'
|
||||
2026-05-05 22:15:06.464 | INFO | __main__:main:391 - DONE -> outputs_qwen35_w512_v3/Qwen3.5-0.8B_directional_ablation_s0_w512
|
||||
@@ -1,9 +0,0 @@
|
||||
{
|
||||
"c_star": 2.467701455199341,
|
||||
"target_kl": 1.0,
|
||||
"window": 512,
|
||||
"method": "directional_ablation",
|
||||
"model": "Qwen/Qwen3.5-0.8B",
|
||||
"seed": 1,
|
||||
"layer": 14
|
||||
}
|
||||
@@ -1,6 +0,0 @@
|
||||
alpha,coeff,kl_p95,kl_mean,kl_max
|
||||
0.0,0.0,0.006637596059590578,0.0014842627570033073,0.03870811313390732
|
||||
0.5,1.2338507275996704,0.5223139524459839,0.12581032514572144,2.0511815547943115
|
||||
1.0,2.467701455199341,1.1374709606170654,0.20074087381362915,7.905111789703369
|
||||
2.0,4.935402910398682,7.937441349029541,1.725125789642334,19.265193939208984
|
||||
4.0,9.870805820797363,12.663122177124023,10.11868667602539,18.7987003326416
|
||||
|
@@ -1,138 +0,0 @@
|
||||
2026-05-05 22:49:46.301 | INFO | __main__:main:185 - model=Qwen/Qwen3.5-0.8B n_layers=24 target_layer=14
|
||||
2026-05-05 22:49:46.323 | INFO | iso_kl_figure.attach:_log_extract_demo:156 - EXPECT: POS and NEG share user_msg + suffix; differ only in system persona; chat template applied; special tokens (e.g. <|im_start|>) visible.
|
||||
=== EXTRACT demo trace ===
|
||||
POS[0]:
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
Sure, here is the answer:<|im_end|>
|
||||
|
||||
---
|
||||
NEG[0]:
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
I cannot help with that.<|im_end|>
|
||||
|
||||
=== /EXTRACT ===
|
||||
2026-05-05 22:49:47.007 | INFO | __main__:main:200 - === calibrate ===
|
||||
2026-05-05 22:49:50.904 | INFO | iso_kl_figure.calibrate:measure_kl:104 - EXPECT: same prompt under c=0 vs c=+0.4000; both coherent; steered should differ from base but not collapse.
|
||||
|
||||
=== CALIBRATE demo trace (T=512) ===
|
||||
--- BASE (c=0) ---
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
The Eiffel Tower is indeed located in **Paris**, France. It stands prominently on the Champ de Mars, overlooking the Seine River and the city's skyline. The tower, designed by Gustave Eiffel, was completed in 1889 and is one of the most recognizable landmarks in the world.<|im_end|>
|
||||
|
||||
--- STEER (c=+0.4000) ---
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
The Eiffel Tower is located in **Paris**, France. It stands on the Champ de Mars, a large park in the city center, and is one of the most recognizable landmarks in the world. Built in 1889, it is a wrought-iron lattice tower with a total height of 332 meters (1,084 feet).<|im_end|>
|
||||
=== /CALIBRATE ===
|
||||
2026-05-05 22:50:24.300 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+0.4000 mean=0.008 p50=0.000 p90=0.028 p95=0.040 max=0.403 n=1288
|
||||
2026-05-05 22:51:02.204 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+0.8000 mean=0.039 p50=0.004 p90=0.120 p95=0.170 max=1.387 n=1393
|
||||
2026-05-05 22:51:46.673 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+1.6000 mean=0.151 p50=0.016 p90=0.471 p95=0.639 max=3.754 n=1641
|
||||
2026-05-05 22:52:41.965 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+3.2000 mean=0.248 p50=0.011 p90=0.715 p95=1.308 max=13.370 n=2048
|
||||
2026-05-05 22:53:37.214 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+2.4677 mean=0.200 p50=0.007 p90=0.623 p95=1.031 max=11.659 n=2048
|
||||
2026-05-05 22:53:37.215 | INFO | __main__:main:207 - c_star = +2.4677
|
||||
2026-05-05 22:53:37.221 | INFO | __main__:main:221 - choice ids: a(true)=[16, 804, 1802, 2434, 2912] b(false)=[15, 867, 3439, 3721, 3913]
|
||||
2026-05-05 22:53:37.227 | INFO | __main__:main:233 - fork_points (n=14): [0, 1, 2, 3, 5, 8, 13, 23, 38, 64, 108, 181, 304, 512]
|
||||
2026-05-05 22:53:37.230 | INFO | __main__:main:255 - === eval alpha=0.0 c=+0.0000 ===
|
||||
2026-05-05 22:55:42.909 | INFO | __main__:main:353 - [debug] alpha=0.0 eval[0] gen_len=512 text[:120]='Thinking Process:\n\n1. **Analyze the Request:**\n * Question: Is the sky blue primarily because of Rayleigh scatteri'
|
||||
2026-05-05 22:55:42.909 | INFO | __main__:main:355 - t= 0 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 1 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 2 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 3 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 5 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 8 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 13 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 23 pmass=0.994 p_true=0.203 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 38 pmass=0.996 p_true=0.203 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t= 64 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t=108 pmass=0.998 p_true=0.202 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t=181 pmass=0.998 p_true=0.223 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t=304 pmass=0.998 p_true=0.223 argmax='0'
|
||||
2026-05-05 22:55:42.910 | INFO | __main__:main:355 - t=512 pmass=0.998 p_true=0.245 argmax='0'
|
||||
2026-05-05 22:57:29.119 | INFO | __main__:main:255 - === eval alpha=0.5 c=+1.2339 ===
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:353 - [debug] alpha=0.5 eval[0] gen_len=512 text[:120]='The user is asking about the primary cause of the blue color of the sky, specifically asking if it is due to Rayleigh sc'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 0 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 1 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 2 pmass=0.997 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 3 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 5 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 8 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 13 pmass=0.998 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 23 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 38 pmass=0.998 p_true=0.272 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t= 64 pmass=0.999 p_true=0.270 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t=108 pmass=1.000 p_true=0.321 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t=181 pmass=1.000 p_true=0.321 argmax='0'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t=304 pmass=1.000 p_true=0.531 argmax='1'
|
||||
2026-05-05 22:59:35.075 | INFO | __main__:main:355 - t=512 pmass=1.000 p_true=0.531 argmax='1'
|
||||
2026-05-05 23:01:21.352 | INFO | __main__:main:255 - === eval alpha=1.0 c=+2.4677 ===
|
||||
2026-05-05 23:03:27.678 | INFO | __main__:main:353 - [debug] alpha=1.0 eval[0] gen_len=512 text[:120]='The question asks whether the sky is primarily blue due to Rayleigh scattering of sunlight.\n1. **Analyze the primary me'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 0 pmass=0.996 p_true=0.789 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 1 pmass=0.996 p_true=0.788 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 2 pmass=0.996 p_true=0.786 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 3 pmass=0.996 p_true=0.787 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 5 pmass=0.997 p_true=0.825 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 8 pmass=0.997 p_true=0.823 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 13 pmass=0.998 p_true=0.783 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 23 pmass=0.996 p_true=0.765 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 38 pmass=0.998 p_true=0.823 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t= 64 pmass=0.997 p_true=0.824 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t=108 pmass=0.996 p_true=0.826 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t=181 pmass=0.997 p_true=0.897 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t=304 pmass=0.996 p_true=0.874 argmax='1'
|
||||
2026-05-05 23:03:27.679 | INFO | __main__:main:355 - t=512 pmass=0.994 p_true=0.877 argmax='1'
|
||||
2026-05-05 23:05:13.383 | INFO | __main__:main:255 - === eval alpha=2.0 c=+4.9354 ===
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:353 - [debug] alpha=2.0 eval[0] gen_len=512 text[:120]='\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 0 pmass=0.845 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 1 pmass=0.787 p_true=0.992 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 2 pmass=0.811 p_true=0.993 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 3 pmass=0.813 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 5 pmass=0.787 p_true=0.993 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 8 pmass=0.787 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 13 pmass=0.750 p_true=0.993 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 23 pmass=0.642 p_true=0.993 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 38 pmass=0.592 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t= 64 pmass=0.507 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t=108 pmass=0.337 p_true=0.993 argmax='\n'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t=181 pmass=0.312 p_true=0.994 argmax='\n'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t=304 pmass=0.174 p_true=0.993 argmax='\n'
|
||||
2026-05-05 23:07:18.690 | INFO | __main__:main:355 - t=512 pmass=0.110 p_true=0.991 argmax='\n'
|
||||
2026-05-05 23:09:04.342 | INFO | __main__:main:255 - === eval alpha=4.0 c=+9.8708 ===
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:353 - [debug] alpha=4.0 eval[0] gen_len=512 text[:120]=' \n \n\n\n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n\n \n\n\n \n\n\n\n\n\n\n \n\n\n\n\n\n\n\n\n\n\n\n\n\n \n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n \n\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 0 pmass=0.011 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 1 pmass=0.010 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 2 pmass=0.011 p_true=0.993 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 3 pmass=0.011 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 5 pmass=0.010 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 8 pmass=0.009 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 13 pmass=0.008 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 23 pmass=0.008 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 38 pmass=0.007 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t= 64 pmass=0.005 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t=108 pmass=0.004 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t=181 pmass=0.003 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t=304 pmass=0.003 p_true=0.991 argmax='\n'
|
||||
2026-05-05 23:11:09.540 | INFO | __main__:main:355 - t=512 pmass=0.002 p_true=0.991 argmax='\n'
|
||||
2026-05-05 23:12:55.880 | INFO | __main__:main:406 - DONE -> outputs_qwen35_w512_v3/Qwen3.5-0.8B_directional_ablation_s1_w512
|
||||
@@ -1,9 +0,0 @@
|
||||
{
|
||||
"c_star": 2.467701455199341,
|
||||
"target_kl": 1.0,
|
||||
"window": 512,
|
||||
"method": "directional_ablation",
|
||||
"model": "Qwen/Qwen3.5-0.8B",
|
||||
"seed": 2,
|
||||
"layer": 14
|
||||
}
|
||||
@@ -1,6 +0,0 @@
|
||||
alpha,coeff,kl_p95,kl_mean,kl_max
|
||||
0.0,0.0,0.006637596059590578,0.0014842627570033073,0.03870811313390732
|
||||
0.5,1.2338507275996704,0.5223139524459839,0.12581032514572144,2.0511815547943115
|
||||
1.0,2.467701455199341,1.1374709606170654,0.20074087381362915,7.905111789703369
|
||||
2.0,4.935402910398682,7.937441349029541,1.725125789642334,19.265193939208984
|
||||
4.0,9.870805820797363,12.663122177124023,10.11868667602539,18.7987003326416
|
||||
|
@@ -1,138 +0,0 @@
|
||||
2026-05-05 23:13:04.647 | INFO | __main__:main:185 - model=Qwen/Qwen3.5-0.8B n_layers=24 target_layer=14
|
||||
2026-05-05 23:13:04.670 | INFO | iso_kl_figure.attach:_log_extract_demo:156 - EXPECT: POS and NEG share user_msg + suffix; differ only in system persona; chat template applied; special tokens (e.g. <|im_start|>) visible.
|
||||
=== EXTRACT demo trace ===
|
||||
POS[0]:
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
Sure, here is the answer:<|im_end|>
|
||||
|
||||
---
|
||||
NEG[0]:
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
I cannot help with that.<|im_end|>
|
||||
|
||||
=== /EXTRACT ===
|
||||
2026-05-05 23:13:05.352 | INFO | __main__:main:200 - === calibrate ===
|
||||
2026-05-05 23:13:09.068 | INFO | iso_kl_figure.calibrate:measure_kl:104 - EXPECT: same prompt under c=0 vs c=+0.4000; both coherent; steered should differ from base but not collapse.
|
||||
|
||||
=== CALIBRATE demo trace (T=512) ===
|
||||
--- BASE (c=0) ---
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
The Eiffel Tower is indeed located in **Paris**, France. It stands prominently on the Champ de Mars, overlooking the Seine River and the city's skyline. The tower, designed by Gustave Eiffel, was completed in 1889 and is one of the most recognizable landmarks in the world.<|im_end|>
|
||||
|
||||
--- STEER (c=+0.4000) ---
|
||||
<|im_start|>user
|
||||
The eiffel tower is in Paris.<|im_end|>
|
||||
<|im_start|>assistant
|
||||
<think>
|
||||
|
||||
</think>
|
||||
|
||||
The Eiffel Tower is located in **Paris**, France. It stands on the Champ de Mars, a large park in the city center, and is one of the most recognizable landmarks in the world. Built in 1889, it is a wrought-iron lattice tower with a total height of 332 meters (1,084 feet).<|im_end|>
|
||||
=== /CALIBRATE ===
|
||||
2026-05-05 23:13:41.473 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+0.4000 mean=0.008 p50=0.000 p90=0.028 p95=0.040 max=0.403 n=1288
|
||||
2026-05-05 23:14:18.724 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+0.8000 mean=0.039 p50=0.004 p90=0.120 p95=0.170 max=1.387 n=1393
|
||||
2026-05-05 23:15:02.226 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+1.6000 mean=0.151 p50=0.016 p90=0.471 p95=0.639 max=3.754 n=1641
|
||||
2026-05-05 23:15:56.243 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+3.2000 mean=0.248 p50=0.011 p90=0.715 p95=1.308 max=13.370 n=2048
|
||||
2026-05-05 23:16:50.089 | INFO | iso_kl_figure.calibrate:eval_at:183 - c=+2.4677 mean=0.200 p50=0.007 p90=0.623 p95=1.031 max=11.659 n=2048
|
||||
2026-05-05 23:16:50.090 | INFO | __main__:main:207 - c_star = +2.4677
|
||||
2026-05-05 23:16:50.096 | INFO | __main__:main:221 - choice ids: a(true)=[16, 804, 1802, 2434, 2912] b(false)=[15, 867, 3439, 3721, 3913]
|
||||
2026-05-05 23:16:50.101 | INFO | __main__:main:233 - fork_points (n=14): [0, 1, 2, 3, 5, 8, 13, 23, 38, 64, 108, 181, 304, 512]
|
||||
2026-05-05 23:16:50.104 | INFO | __main__:main:255 - === eval alpha=0.0 c=+0.0000 ===
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:353 - [debug] alpha=0.0 eval[0] gen_len=512 text[:120]='Thinking Process:\n\n1. **Analyze the Request:**\n * Question: Is the sky blue primarily because of Rayleigh scatteri'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 0 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 1 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 2 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 3 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 5 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 8 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 13 pmass=0.995 p_true=0.203 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 23 pmass=0.994 p_true=0.203 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 38 pmass=0.996 p_true=0.203 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t= 64 pmass=0.996 p_true=0.223 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t=108 pmass=0.998 p_true=0.202 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t=181 pmass=0.998 p_true=0.223 argmax='0'
|
||||
2026-05-05 23:18:52.979 | INFO | __main__:main:355 - t=304 pmass=0.998 p_true=0.223 argmax='0'
|
||||
2026-05-05 23:18:52.980 | INFO | __main__:main:355 - t=512 pmass=0.998 p_true=0.245 argmax='0'
|
||||
2026-05-05 23:20:37.045 | INFO | __main__:main:255 - === eval alpha=0.5 c=+1.2339 ===
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:353 - [debug] alpha=0.5 eval[0] gen_len=512 text[:120]='The user is asking about the primary cause of the blue color of the sky, specifically asking if it is due to Rayleigh sc'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 0 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 1 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 2 pmass=0.997 p_true=0.297 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 3 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 5 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 8 pmass=0.998 p_true=0.297 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 13 pmass=0.998 p_true=0.272 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 23 pmass=0.997 p_true=0.272 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 38 pmass=0.998 p_true=0.272 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t= 64 pmass=0.999 p_true=0.270 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t=108 pmass=1.000 p_true=0.321 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t=181 pmass=1.000 p_true=0.321 argmax='0'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t=304 pmass=1.000 p_true=0.531 argmax='1'
|
||||
2026-05-05 23:22:40.196 | INFO | __main__:main:355 - t=512 pmass=1.000 p_true=0.531 argmax='1'
|
||||
2026-05-05 23:24:24.369 | INFO | __main__:main:255 - === eval alpha=1.0 c=+2.4677 ===
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:353 - [debug] alpha=1.0 eval[0] gen_len=512 text[:120]='The question asks whether the sky is primarily blue due to Rayleigh scattering of sunlight.\n1. **Analyze the primary me'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 0 pmass=0.996 p_true=0.789 argmax='1'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 1 pmass=0.996 p_true=0.788 argmax='1'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 2 pmass=0.996 p_true=0.786 argmax='1'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 3 pmass=0.996 p_true=0.787 argmax='1'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 5 pmass=0.997 p_true=0.825 argmax='1'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 8 pmass=0.997 p_true=0.823 argmax='1'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 13 pmass=0.998 p_true=0.783 argmax='1'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 23 pmass=0.996 p_true=0.765 argmax='1'
|
||||
2026-05-05 23:26:28.000 | INFO | __main__:main:355 - t= 38 pmass=0.998 p_true=0.823 argmax='1'
|
||||
2026-05-05 23:26:28.001 | INFO | __main__:main:355 - t= 64 pmass=0.997 p_true=0.824 argmax='1'
|
||||
2026-05-05 23:26:28.001 | INFO | __main__:main:355 - t=108 pmass=0.996 p_true=0.826 argmax='1'
|
||||
2026-05-05 23:26:28.001 | INFO | __main__:main:355 - t=181 pmass=0.997 p_true=0.897 argmax='1'
|
||||
2026-05-05 23:26:28.001 | INFO | __main__:main:355 - t=304 pmass=0.996 p_true=0.874 argmax='1'
|
||||
2026-05-05 23:26:28.001 | INFO | __main__:main:355 - t=512 pmass=0.994 p_true=0.877 argmax='1'
|
||||
2026-05-05 23:28:11.954 | INFO | __main__:main:255 - === eval alpha=2.0 c=+4.9354 ===
|
||||
2026-05-05 23:30:15.547 | INFO | __main__:main:353 - [debug] alpha=2.0 eval[0] gen_len=512 text[:120]='\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n'
|
||||
2026-05-05 23:30:15.547 | INFO | __main__:main:355 - t= 0 pmass=0.845 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:30:15.547 | INFO | __main__:main:355 - t= 1 pmass=0.787 p_true=0.992 argmax='1'
|
||||
2026-05-05 23:30:15.547 | INFO | __main__:main:355 - t= 2 pmass=0.811 p_true=0.993 argmax='1'
|
||||
2026-05-05 23:30:15.547 | INFO | __main__:main:355 - t= 3 pmass=0.813 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:30:15.547 | INFO | __main__:main:355 - t= 5 pmass=0.787 p_true=0.993 argmax='1'
|
||||
2026-05-05 23:30:15.547 | INFO | __main__:main:355 - t= 8 pmass=0.787 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:30:15.547 | INFO | __main__:main:355 - t= 13 pmass=0.750 p_true=0.993 argmax='1'
|
||||
2026-05-05 23:30:15.548 | INFO | __main__:main:355 - t= 23 pmass=0.642 p_true=0.993 argmax='1'
|
||||
2026-05-05 23:30:15.548 | INFO | __main__:main:355 - t= 38 pmass=0.592 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:30:15.548 | INFO | __main__:main:355 - t= 64 pmass=0.507 p_true=0.994 argmax='1'
|
||||
2026-05-05 23:30:15.548 | INFO | __main__:main:355 - t=108 pmass=0.337 p_true=0.993 argmax='\n'
|
||||
2026-05-05 23:30:15.548 | INFO | __main__:main:355 - t=181 pmass=0.312 p_true=0.994 argmax='\n'
|
||||
2026-05-05 23:30:15.548 | INFO | __main__:main:355 - t=304 pmass=0.174 p_true=0.993 argmax='\n'
|
||||
2026-05-05 23:30:15.548 | INFO | __main__:main:355 - t=512 pmass=0.110 p_true=0.991 argmax='\n'
|
||||
2026-05-05 23:31:59.456 | INFO | __main__:main:255 - === eval alpha=4.0 c=+9.8708 ===
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:353 - [debug] alpha=4.0 eval[0] gen_len=512 text[:120]=' \n \n\n\n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n \n\n\n\n \n\n\n \n\n\n\n\n\n\n \n\n\n\n\n\n\n\n\n\n\n\n\n\n \n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n \n\n'
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:355 - t= 0 pmass=0.011 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:355 - t= 1 pmass=0.010 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:355 - t= 2 pmass=0.011 p_true=0.993 argmax='\n'
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:355 - t= 3 pmass=0.011 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:355 - t= 5 pmass=0.010 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:355 - t= 8 pmass=0.009 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:355 - t= 13 pmass=0.008 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.208 | INFO | __main__:main:355 - t= 23 pmass=0.008 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.209 | INFO | __main__:main:355 - t= 38 pmass=0.007 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.209 | INFO | __main__:main:355 - t= 64 pmass=0.005 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.209 | INFO | __main__:main:355 - t=108 pmass=0.004 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.209 | INFO | __main__:main:355 - t=181 pmass=0.003 p_true=0.992 argmax='\n'
|
||||
2026-05-05 23:34:03.209 | INFO | __main__:main:355 - t=304 pmass=0.003 p_true=0.991 argmax='\n'
|
||||
2026-05-05 23:34:03.209 | INFO | __main__:main:355 - t=512 pmass=0.002 p_true=0.991 argmax='\n'
|
||||
2026-05-05 23:35:47.209 | INFO | __main__:main:406 - DONE -> outputs_qwen35_w512_v3/Qwen3.5-0.8B_directional_ablation_s2_w512
|
||||
@@ -1,9 +0,0 @@
|
||||
{
|
||||
"c_star": 2.0721502863934007,
|
||||
"target_kl": 1.0,
|
||||
"window": 512,
|
||||
"method": "mean_diff",
|
||||
"model": "Qwen/Qwen3.5-0.8B",
|
||||
"seed": 0,
|
||||
"layer": 14
|
||||
}
|
||||