File size: 6,193 Bytes
6d9c24d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
v41_freckles_256/checkpoints/best.pt: 100%
 10.3M/10.3M [00:02<00:00, 7.34MB/s]

======================================================================
FRECKLES CENTER-MASS INTERCEPTION
Full Geometric Alignment Battery
======================================================================

  [1/8] Forward pass with interception...
    Captured 27 activation tensors
      enc_in                                          [262144, 384]
      enc_block_0                                     [262144, 384]
      enc_block_1                                     [262144, 384]
      enc_block_2                                     [262144, 384]
      enc_block_3                                     [262144, 384]
      enc_out_raw                                     [262144, 192]
      cross_attn_0_qkv                               [64, 4096, 12]
      cross_attn_0_in                                 [64, 4096, 4]
      cross_attn_0_out                                [64, 4096, 4]
      cross_attn_1_qkv                               [64, 4096, 12]
      cross_attn_1_in                                 [64, 4096, 4]
      cross_attn_1_out                                [64, 4096, 4]
      dec_in                                          [262144, 384]
      dec_block_0                                     [262144, 384]
      dec_block_1                                     [262144, 384]
      dec_block_2                                     [262144, 384]
      dec_block_3                                     [262144, 384]
      dec_out                                          [262144, 48]
      boundary_in                                 [64, 3, 256, 256]
      boundary_out                                [64, 3, 256, 256]
      svd_U                                       [64, 4096, 48, 4]
      svd_S_orig                                      [64, 4096, 4]
      svd_S                                           [64, 4096, 4]
      svd_Vt                                       [64, 4096, 4, 4]
      svd_M                                       [64, 4096, 48, 4]
      recon                                       [64, 3, 256, 256]
      input                                       [64, 3, 256, 256]

  [2/8] Activation statistics...
    enc_in                    mean=+0.1142 std=0.3280 dead=0.000 kurt=4.71
    enc_block_3               mean=-0.0541 std=0.1522 dead=0.000 kurt=0.38
    svd_S_orig                mean=+3.3112 std=1.0179 dead=0.000 kurt=-1.44
    svd_S                     mean=+3.3608 std=0.9810 dead=0.000 kurt=-1.41
    dec_in                    mean=+0.4764 std=0.4865 dead=0.000 kurt=186.97
    dec_block_3               mean=-0.0974 std=0.1599 dead=0.000 kurt=15.13
    dec_out                   mean=+0.0103 std=1.2510 dead=0.000 kurt=-0.76

  [3/8] SVD bottleneck analysis...
    S spectrum: ['4.540', '3.941', '2.879', '1.884']
    S ratio (S0/SD): 2.409
    Effective rank: 1.180
    U orthogonality error: 0.000000
    Vt orthogonality error: 0.000000
    Energy per mode: ['0.430', '0.324', '0.173', '0.074']
    Sphere radius: 1.0000 ± 0.0000

  [4/8] Cross-attention analysis...
    Layer 0: delta=0.057381 relative=0.0173 alpha=[0.02249310538172722, 0.02474093995988369, 0.02652287296950817, 0.02652169205248356]
    Layer 0 QKV: q_norm=2.384 qk_cos=-0.247 kv_cos=0.743
    Layer 1: delta=0.040865 relative=0.0121 alpha=[0.024980703368782997, 0.02168090268969536, 0.022537492215633392, 0.027645478025078773]
    Layer 1 QKV: q_norm=2.557 qk_cos=0.293 kv_cos=0.661

  [5/8] Encoder/decoder symmetry...
    block_0_cosine: 0.1098
    block_0_procrustes_alignment: 0.9197
    block_0_procrustes_error: 0.0000
    block_0_spearman: 0.0351
    block_1_cosine: 0.1390
    block_1_procrustes_alignment: 0.8887
    block_1_procrustes_error: 0.0000
    block_1_spearman: 0.0031
    block_2_cosine: 0.1305
    block_2_procrustes_alignment: 0.9092
    block_2_procrustes_error: 0.0000
    block_2_spearman: 0.0176
    block_3_cosine: 0.1329
    block_3_procrustes_alignment: 0.8915
    block_3_procrustes_error: 0.0000
    block_3_spearman: -0.0119

  [6/8] Information flow analysis...
    M_to_S_compression: 1.000000
    M_variance: 0.249144
    S_variance: 1.036213
    boundary_delta_max: 0.017655
    boundary_delta_mean: 0.010149
    boundary_relative: 0.009914
    cross_attn_max_delta: 0.105252
    cross_attn_relative_delta: 0.017119
    cross_attn_total_delta: 0.056685
    dec_to_recon_spearman: 0.000669
    end_to_end_mse: 0.000048
    end_to_end_spearman: 0.999982
    input_to_enc_spearman: -0.004016
    variance_retention: 4.159094

  [7/8] CV at pipeline stages...
    Encoder input projection       CV=0.4098 dim=16
    Encoder block 0                CV=0.3504 dim=16
    Encoder block 1                CV=0.4896 dim=16
    Encoder block 2                CV=0.3489 dim=16
    Encoder block 3                CV=0.3541 dim=16
    SVD S (pre cross-attn)         CV=1.3129 dim=4
    SVD S (post cross-attn)        CV=0.7857 dim=4
    Decoder input projection       CV=0.3641 dim=16
    Decoder block 0                CV=0.3731 dim=16
    Decoder block 3                CV=0.3918 dim=16

  [8/8] Noise type fingerprints...
    gaussian        S=['4.53', '3.99', '2.95', '1.95'] er=1.15 Δca=0.05639 mse=0.000036
    uniform         S=['4.53', '4.05', '2.90', '1.91'] er=1.12 Δca=0.05566 mse=0.000025
    pink            S=['4.48', '4.03', '2.90', '2.06'] er=1.28 Δca=0.05692 mse=0.000040
    salt_pepper     S=['4.50', '3.91', '3.05', '2.05'] er=1.19 Δca=0.05802 mse=0.000102
    cauchy          S=['4.51', '3.93', '3.02', '2.02'] er=1.18 Δca=0.05758 mse=0.000068

  [BONUS] Weight analysis...
    Total params: 2,557,539
    Effective sparsity: 0.0000
    enc_out.weight            norm=16.023 cond=12.051165580749512 erank=180.47442626953125
    dec_in.weight             norm=17.233 cond=11.48548698425293 erank=159.64996337890625
    dec_out.weight            norm=7.501 cond=1.6323729753494263 erank=47.76748275756836

======================================================================
BATTERY COMPLETE — 1.4s
======================================================================
  Saved: freckles_observer_v41_freckles_256.json