diff --git a/viz/src/components/CustomSeqPlayground.tsx b/viz/src/components/CustomSeqPlayground.tsx index d53d529..3b1efd4 100644 --- a/viz/src/components/CustomSeqPlayground.tsx +++ b/viz/src/components/CustomSeqPlayground.tsx @@ -188,12 +188,57 @@ const CustomSeqPlayground = ({ feature }: CustomSeqPlaygroundProps) => { playgroundState !== PlaygroundState.LOADING_SAE_ACTIVATIONS && (

Steering

+
+

Steering increases this feature's activation.

+

+ We were inspired by{" "} + + Anthropic's work + {" "} + on LLM steering and getting Claude to admit that it is the Golden Gate Bridge. +

+

+ Following{" "} + + their implementation + + , we reconstruct the input sequence with the SAE "spliced into" ESM2 at layer 24. + With steering multiplier N, this feature's SAE activation at every residue in the sequence is + set to N * (the feature's maximum activation along the sequence). So, +

+ +

+ Check out{" "} + + this explanation + {" "} + from Anthropic for more technical details. We're experimenting with different + methods of steering and will make them available soon! +

+
- Steer multiplier: {steerMultiplier} + + Steer multiplier: {steerMultiplier} +