diff --git a/tests/integration/test_fold_layer_integration.py b/tests/integration/test_fold_layer_integration.py new file mode 100644 index 000000000..275c6199e --- /dev/null +++ b/tests/integration/test_fold_layer_integration.py @@ -0,0 +1,566 @@ +#!/usr/bin/env python3 +""" +Integration Test for _fold_layer Function with Real GPT-2 Model +============================================================== + +This test verifies that the _fold_layer function works correctly with: +1. Real GPT-2 model loaded from HuggingFace +2. GPT-2 architecture adapter for parameter key translation +3. Actual model weights and configurations +4. Both TransformerLens format (no adapter) and HuggingFace format (with adapter) processing +""" + +import einops +import pytest +import torch +from transformers import GPT2LMHeadModel + +from transformer_lens import HookedTransformer +from transformer_lens.config import TransformerBridgeConfig +from transformer_lens.model_bridge.supported_architectures.gpt2 import ( + GPT2ArchitectureAdapter, +) +from transformer_lens.weight_processing import ProcessWeights + + +class TestFoldLayerIntegration: + """Integration tests for _fold_layer function with real models.""" + + @pytest.fixture + def gpt2_model_and_config(self): + """Load a real GPT-2 model and configuration.""" + model_name = "gpt2" + device = "cpu" + + # Load HuggingFace model + hf_model = GPT2LMHeadModel.from_pretrained(model_name) + hf_config = hf_model.config + + # Load HookedTransformer model + tl_model = HookedTransformer.from_pretrained(model_name, device=device) + + # Create architecture adapter + # Convert HookedTransformerConfig to TransformerBridgeConfig + bridge_config = TransformerBridgeConfig.from_dict(tl_model.cfg.__dict__) + bridge_config.architecture = "gpt2" + adapter = GPT2ArchitectureAdapter(bridge_config) + + return { + "hf_model": hf_model, + "hf_config": hf_config, + "tl_model": tl_model, + "adapter": adapter, + "device": device, + } + + def test_fold_layer_with_real_gpt2_transformer_lens_format(self, gpt2_model_and_config): + """Test _fold_layer with real GPT-2 model in TransformerLens format (no adapter).""" + tl_model = gpt2_model_and_config["tl_model"] + cfg = tl_model.cfg + + # Get the state dict from HookedTransformer (TransformerLens format) + state_dict = tl_model.state_dict() + + # Test with layer 0 + layer_idx = 0 + + # Check if LayerNorm parameters exist (they shouldn't for processed models) + ln1_b_key = f"blocks.{layer_idx}.ln1.b" + ln1_w_key = f"blocks.{layer_idx}.ln1.w" + + if ln1_b_key not in state_dict or ln1_w_key not in state_dict: + # This is expected for processed HookedTransformer models + # The LayerNorm parameters have already been folded out + print(f"LayerNorm parameters not found in state dict - model is already processed") + print(f"Available keys: {[k for k in state_dict.keys() if f'blocks.{layer_idx}' in k]}") + + # Test that _fold_layer handles this gracefully (should only do centering if requested) + original_state_dict = {k: v.clone() for k, v in state_dict.items()} + + # Test _fold_layer with no adapter (TransformerLens format) + ProcessWeights._fold_layer( + state_dict, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=True, + adapter=None, + gqa="", + ) + + # For processed models, _fold_layer should only center weights if LayerNorm params don't exist + # Verify that weights are centered + w_q_key = f"blocks.{layer_idx}.attn.W_Q" + w_q = state_dict[w_q_key] + w_q_mean = torch.mean(w_q, dim=1, keepdim=True) + assert torch.allclose(w_q_mean, 
torch.zeros_like(w_q_mean), atol=1e-6) + + # Verify original state dict is unchanged + for k, v in original_state_dict.items(): + assert torch.equal(v, original_state_dict[k]) + + return # Skip the rest of the test since model is already processed + + # Verify LayerNorm weights are removed + assert f"blocks.{layer_idx}.ln1.w" not in state_dict + assert f"blocks.{layer_idx}.ln1.b" not in state_dict + assert f"blocks.{layer_idx}.ln2.w" not in state_dict + assert f"blocks.{layer_idx}.ln2.b" not in state_dict + + # Verify attention weights are modified + w_q_key = f"blocks.{layer_idx}.attn.W_Q" + w_k_key = f"blocks.{layer_idx}.attn.W_K" + w_v_key = f"blocks.{layer_idx}.attn.W_V" + + assert w_q_key in state_dict + assert w_k_key in state_dict + assert w_v_key in state_dict + + # Check that weights are centered (mean should be zero across d_model dimension) + w_q_mean = torch.mean(state_dict[w_q_key], dim=1, keepdim=True) # [n_heads, 1, d_head] + w_k_mean = torch.mean(state_dict[w_k_key], dim=1, keepdim=True) + w_v_mean = torch.mean(state_dict[w_v_key], dim=1, keepdim=True) + + assert torch.allclose(w_q_mean, torch.zeros_like(w_q_mean), atol=1e-6) + assert torch.allclose(w_k_mean, torch.zeros_like(w_k_mean), atol=1e-6) + assert torch.allclose(w_v_mean, torch.zeros_like(w_v_mean), atol=1e-6) + + # Verify attention biases are modified + b_q_key = f"blocks.{layer_idx}.attn.b_Q" + b_k_key = f"blocks.{layer_idx}.attn.b_K" + b_v_key = f"blocks.{layer_idx}.attn.b_V" + + assert b_q_key in state_dict + assert b_k_key in state_dict + assert b_v_key in state_dict + + # Verify MLP weights are modified + mlp_w_in_key = f"blocks.{layer_idx}.mlp.W_in" + mlp_b_in_key = f"blocks.{layer_idx}.mlp.b_in" + + assert mlp_w_in_key in state_dict + assert mlp_b_in_key in state_dict + + # Check that MLP weights are centered + mlp_w_mean = torch.mean(state_dict[mlp_w_in_key], dim=0, keepdim=True) # [1, d_mlp] + assert torch.allclose(mlp_w_mean, torch.zeros_like(mlp_w_mean), atol=1e-6) + + # Verify original state dict is unchanged + for k, v in original_state_dict.items(): + assert torch.equal(v, original_state_dict[k]) + + def test_fold_layer_with_real_gpt2_huggingface_format(self, gpt2_model_and_config): + """Test _fold_layer with real GPT-2 model in HuggingFace format (with adapter).""" + hf_model = gpt2_model_and_config["hf_model"] + tl_model = gpt2_model_and_config["tl_model"] + adapter = gpt2_model_and_config["adapter"] + cfg = tl_model.cfg + + # Get the state dict from HuggingFace model (HuggingFace format) + state_dict = hf_model.state_dict() + + # Test with layer 0 + layer_idx = 0 + + # Make a copy for comparison + original_state_dict = {k: v.clone() for k, v in state_dict.items()} + + # Test _fold_layer with adapter (HuggingFace format) + ProcessWeights._fold_layer( + state_dict, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=True, + adapter=adapter, + gqa="", + ) + + # Verify LayerNorm weights are removed (using HuggingFace keys) + assert f"transformer.h.{layer_idx}.ln_1.weight" not in state_dict + assert f"transformer.h.{layer_idx}.ln_1.bias" not in state_dict + assert f"transformer.h.{layer_idx}.ln_2.weight" not in state_dict + assert f"transformer.h.{layer_idx}.ln_2.bias" not in state_dict + + # Verify combined QKV weight is modified + qkv_weight_key = f"transformer.h.{layer_idx}.attn.c_attn.weight" + qkv_bias_key = f"transformer.h.{layer_idx}.attn.c_attn.bias" + + assert qkv_weight_key in state_dict + assert qkv_bias_key in state_dict + + # Split the processed QKV weight back into Q, K, V 
to verify centering + qkv_weight = state_dict[qkv_weight_key] + w_q, w_k, w_v = torch.tensor_split(qkv_weight, 3, dim=1) + + # Check that weights are centered (mean should be zero across d_model dimension) + # Note: After our fix, centering is done in TransformerLens format (per head) and then converted back + # So we need to check centering by converting back to TransformerLens format + n_heads = cfg.n_heads + d_head = cfg.d_head + d_model = cfg.d_model + + # Convert back to TransformerLens format to check centering + w_q_tl = w_q.T.reshape(n_heads, d_model, d_head) # [n_heads, d_model, d_head] + w_k_tl = w_k.T.reshape(n_heads, d_model, d_head) # [n_heads, d_model, d_head] + w_v_tl = w_v.T.reshape(n_heads, d_model, d_head) # [n_heads, d_model, d_head] + + # Check that weights are centered per head (TransformerLens format centering) + w_q_mean = einops.reduce(w_q_tl, "head_index d_model d_head -> head_index 1 d_head", "mean") + w_k_mean = einops.reduce(w_k_tl, "head_index d_model d_head -> head_index 1 d_head", "mean") + w_v_mean = einops.reduce(w_v_tl, "head_index d_model d_head -> head_index 1 d_head", "mean") + + assert torch.allclose(w_q_mean, torch.zeros_like(w_q_mean), atol=1e-6) + assert torch.allclose(w_k_mean, torch.zeros_like(w_k_mean), atol=1e-6) + assert torch.allclose(w_v_mean, torch.zeros_like(w_v_mean), atol=1e-6) + + # Verify MLP weights are modified + mlp_w_in_key = f"transformer.h.{layer_idx}.mlp.c_fc.weight" + mlp_b_in_key = f"transformer.h.{layer_idx}.mlp.c_fc.bias" + + assert mlp_w_in_key in state_dict + assert mlp_b_in_key in state_dict + + # Check that MLP weights are centered + mlp_w_mean = torch.mean(state_dict[mlp_w_in_key], dim=0, keepdim=True) # [1, d_mlp] + assert torch.allclose(mlp_w_mean, torch.zeros_like(mlp_w_mean), atol=1e-6) + + # Verify original state dict is unchanged + for k, v in original_state_dict.items(): + assert torch.equal(v, original_state_dict[k]) + + def test_fold_layer_equivalence_between_formats(self, gpt2_model_and_config): + """Test that _fold_layer produces equivalent results for both formats with the same input.""" + hf_model = gpt2_model_and_config["hf_model"] + tl_model = gpt2_model_and_config["tl_model"] + adapter = gpt2_model_and_config["adapter"] + cfg = tl_model.cfg + + layer_idx = 0 + + # Start with the same unprocessed HuggingFace model state dict + hf_state_dict = hf_model.state_dict() + + # Create a TransformerLens format state dict from the HuggingFace one + # This simulates what would happen when converting HF to TL format + tl_state_dict = {} + + # Convert HuggingFace keys to TransformerLens keys + for hf_key, tensor in hf_state_dict.items(): + if f"transformer.h.{layer_idx}" in hf_key: + if "attn.c_attn.weight" in hf_key: + # Split combined QKV weight into separate Q, K, V weights + # HuggingFace: [d_model, 3*d_model] -> TransformerLens: [n_heads, d_model, d_head] for each + n_heads = cfg.n_heads + d_head = cfg.d_head + d_model = cfg.d_model + + # Split the combined weight + qkv_weight = tensor # [d_model, 3*d_model] + w_q_hf, w_k_hf, w_v_hf = torch.tensor_split( + qkv_weight, 3, dim=1 + ) # Each: [d_model, d_model] + + # Reshape to TransformerLens format: [d_model, d_model] -> [n_heads, d_model, d_head] + w_q_tl = w_q_hf.T.reshape(n_heads, d_model, d_head) + w_k_tl = w_k_hf.T.reshape(n_heads, d_model, d_head) + w_v_tl = w_v_hf.T.reshape(n_heads, d_model, d_head) + + tl_state_dict[f"blocks.{layer_idx}.attn.W_Q"] = w_q_tl + tl_state_dict[f"blocks.{layer_idx}.attn.W_K"] = w_k_tl + 
tl_state_dict[f"blocks.{layer_idx}.attn.W_V"] = w_v_tl + + elif "attn.c_attn.bias" in hf_key: + # Split combined QKV bias into separate Q, K, V biases + qkv_bias = tensor # [3*d_model] + b_q_hf, b_k_hf, b_v_hf = torch.tensor_split( + qkv_bias, 3, dim=0 + ) # Each: [d_model] + + # Reshape to TransformerLens format: [d_model] -> [n_heads, d_head] + b_q_tl = b_q_hf.reshape(n_heads, d_head) + b_k_tl = b_k_hf.reshape(n_heads, d_head) + b_v_tl = b_v_hf.reshape(n_heads, d_head) + + tl_state_dict[f"blocks.{layer_idx}.attn.b_Q"] = b_q_tl + tl_state_dict[f"blocks.{layer_idx}.attn.b_K"] = b_k_tl + tl_state_dict[f"blocks.{layer_idx}.attn.b_V"] = b_v_tl + + elif "ln_1.weight" in hf_key: + tl_state_dict[f"blocks.{layer_idx}.ln1.w"] = tensor + elif "ln_1.bias" in hf_key: + tl_state_dict[f"blocks.{layer_idx}.ln1.b"] = tensor + elif "ln_2.weight" in hf_key: + tl_state_dict[f"blocks.{layer_idx}.ln2.w"] = tensor + elif "ln_2.bias" in hf_key: + tl_state_dict[f"blocks.{layer_idx}.ln2.b"] = tensor + elif "mlp.c_fc.weight" in hf_key: + tl_state_dict[f"blocks.{layer_idx}.mlp.W_in"] = tensor + elif "mlp.c_fc.bias" in hf_key: + tl_state_dict[f"blocks.{layer_idx}.mlp.b_in"] = tensor + + # Now we have the same data in both formats - test equivalence + # Test without centering first to isolate the issue + print("Testing without centering...") + + # Process HuggingFace format (no centering) + hf_processed_no_center = {k: v.clone() for k, v in hf_state_dict.items()} + ProcessWeights._fold_layer( + hf_processed_no_center, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=False, + adapter=adapter, + gqa="", + ) + + # Process TransformerLens format (no centering) + tl_processed_no_center = {k: v.clone() for k, v in tl_state_dict.items()} + ProcessWeights._fold_layer( + tl_processed_no_center, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=False, + adapter=None, + gqa="", + ) + + # Compare without centering + hf_qkv_weight_no_center = hf_processed_no_center[ + f"transformer.h.{layer_idx}.attn.c_attn.weight" + ] + hf_w_q_no_center, _, _ = torch.tensor_split(hf_qkv_weight_no_center, 3, dim=1) + tl_w_q_no_center = tl_processed_no_center[f"blocks.{layer_idx}.attn.W_Q"] + tl_w_q_hf_format_no_center = tl_w_q_no_center.reshape(d_model, d_model).T + + diff_no_center = torch.max(torch.abs(hf_w_q_no_center - tl_w_q_hf_format_no_center)) + print(f"Difference without centering: {diff_no_center:.6f}") + + # Now test with centering + print("Testing with centering...") + + # Process HuggingFace format (with centering) + hf_processed = {k: v.clone() for k, v in hf_state_dict.items()} + ProcessWeights._fold_layer( + hf_processed, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=True, + adapter=adapter, + gqa="", + ) + + # Process TransformerLens format (with centering) + tl_processed = {k: v.clone() for k, v in tl_state_dict.items()} + ProcessWeights._fold_layer( + tl_processed, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=True, + adapter=None, + gqa="", + ) + + # Compare the results by converting back to the same format + # Extract Q weights from both formats and compare + hf_qkv_weight = hf_processed[f"transformer.h.{layer_idx}.attn.c_attn.weight"] + hf_w_q, hf_w_k, hf_w_v = torch.tensor_split( + hf_qkv_weight, 3, dim=1 + ) # Each: [d_model, d_model] + + tl_w_q = tl_processed[f"blocks.{layer_idx}.attn.W_Q"] # [n_heads, d_model, d_head] + + # Convert TL format back to HF format for comparison + n_heads = cfg.n_heads + d_head = cfg.d_head + d_model = cfg.d_model + 
tl_w_q_hf_format = tl_w_q.reshape(d_model, d_model).T # [d_model, d_model] + + # Compare with centering + diff_with_center = torch.max(torch.abs(hf_w_q - tl_w_q_hf_format)) + print(f"Difference with centering: {diff_with_center:.6f}") + + # The Q weights should be identical (within numerical precision) + if diff_no_center < 1e-6: + print("✅ LayerNorm folding is equivalent between formats") + else: + print(f"❌ LayerNorm folding differs between formats (diff: {diff_no_center:.6f})") + + if diff_with_center < 1e-6: + print("✅ Centering is equivalent between formats") + else: + print(f"❌ Centering differs between formats (diff: {diff_with_center:.6f})") + + # Both should have LayerNorm weights removed + assert f"blocks.{layer_idx}.ln1.w" not in tl_processed + assert f"transformer.h.{layer_idx}.ln_1.weight" not in hf_processed + + # The Q weights should be identical (within numerical precision) + assert torch.allclose( + hf_w_q, tl_w_q_hf_format, atol=1e-6 + ), f"Q weights don't match: max diff = {torch.max(torch.abs(hf_w_q - tl_w_q_hf_format))}" + + print( + f"✅ Equivalence test passed: Q weights match exactly (max diff: {diff_with_center:.2e})" + ) + + def test_fold_layer_with_different_layers(self, gpt2_model_and_config): + """Test _fold_layer with different layers to ensure it works across all layers.""" + tl_model = gpt2_model_and_config["tl_model"] + cfg = tl_model.cfg + + # Test with multiple layers + test_layers = [0, 1, cfg.n_layers - 1] # First, second, and last layer + + for layer_idx in test_layers: + state_dict = tl_model.state_dict() + original_state_dict = {k: v.clone() for k, v in state_dict.items()} + + # Test _fold_layer + ProcessWeights._fold_layer( + state_dict, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=True, + adapter=None, + gqa="", + ) + + # Verify LayerNorm weights are removed + assert f"blocks.{layer_idx}.ln1.w" not in state_dict + assert f"blocks.{layer_idx}.ln1.b" not in state_dict + assert f"blocks.{layer_idx}.ln2.w" not in state_dict + assert f"blocks.{layer_idx}.ln2.b" not in state_dict + + # Verify weights are centered + w_q = state_dict[f"blocks.{layer_idx}.attn.W_Q"] + w_q_mean = torch.mean(w_q, dim=1, keepdim=True) + assert torch.allclose(w_q_mean, torch.zeros_like(w_q_mean), atol=1e-6) + + # Verify original state dict is unchanged + for k, v in original_state_dict.items(): + assert torch.equal(v, original_state_dict[k]) + + def test_fold_layer_with_different_options(self, gpt2_model_and_config): + """Test _fold_layer with different processing options.""" + tl_model = gpt2_model_and_config["tl_model"] + cfg = tl_model.cfg + layer_idx = 0 + + # Check if LayerNorm parameters exist (they shouldn't for processed models) + state_dict = tl_model.state_dict() + ln1_b_key = f"blocks.{layer_idx}.ln1.b" + ln1_w_key = f"blocks.{layer_idx}.ln1.w" + ln2_b_key = f"blocks.{layer_idx}.ln2.b" + ln2_w_key = f"blocks.{layer_idx}.ln2.w" + + if ln1_b_key not in state_dict or ln1_w_key not in state_dict: + # This is expected for processed HookedTransformer models + print(f"LayerNorm parameters not found - model is already processed") + + # Test 1: No bias folding, with centering (should only do centering) + state_dict = tl_model.state_dict() + original_state_dict = {k: v.clone() for k, v in state_dict.items()} + + ProcessWeights._fold_layer( + state_dict, + cfg, + layer_idx=layer_idx, + fold_biases=False, + center_weights=True, + adapter=None, + gqa="", + ) + + # For processed models, LayerNorm parameters should still not be present + assert ln1_b_key not in 
state_dict + assert ln2_b_key not in state_dict + + # But weights should be centered + w_q = state_dict[f"blocks.{layer_idx}.attn.W_Q"] + w_q_mean = torch.mean(w_q, dim=1, keepdim=True) + assert torch.allclose(w_q_mean, torch.zeros_like(w_q_mean), atol=1e-6) + + # Test 2: With bias folding, no centering (should do nothing for processed models) + state_dict = tl_model.state_dict() + original_state_dict = {k: v.clone() for k, v in state_dict.items()} + + ProcessWeights._fold_layer( + state_dict, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=False, + adapter=None, + gqa="", + ) + + # For processed models, LayerNorm parameters should still not be present + assert ln1_b_key not in state_dict + assert ln2_b_key not in state_dict + + # For processed models, weights are already centered from the original processing + # So even with center_weights=False, they remain centered + w_q = state_dict[f"blocks.{layer_idx}.attn.W_Q"] + w_q_mean = torch.mean(w_q, dim=1, keepdim=True) + # The weights should still be centered (they were already centered from original processing) + assert torch.allclose(w_q_mean, torch.zeros_like(w_q_mean), atol=1e-6) + + return # Skip the rest of the test since model is already processed + + # Test 1: No bias folding, with centering + state_dict = tl_model.state_dict() + original_state_dict = {k: v.clone() for k, v in state_dict.items()} + + ProcessWeights._fold_layer( + state_dict, + cfg, + layer_idx=layer_idx, + fold_biases=False, + center_weights=True, + adapter=None, + gqa="", + ) + + # LayerNorm biases should still be present when fold_biases=False + assert f"blocks.{layer_idx}.ln1.b" in state_dict + assert f"blocks.{layer_idx}.ln2.b" in state_dict + + # But weights should be centered + w_q = state_dict[f"blocks.{layer_idx}.attn.W_Q"] + w_q_mean = torch.mean(w_q, dim=1, keepdim=True) + assert torch.allclose(w_q_mean, torch.zeros_like(w_q_mean), atol=1e-6) + + # Test 2: With bias folding, no centering + state_dict = tl_model.state_dict() + original_state_dict = {k: v.clone() for k, v in state_dict.items()} + + ProcessWeights._fold_layer( + state_dict, + cfg, + layer_idx=layer_idx, + fold_biases=True, + center_weights=False, + adapter=None, + gqa="", + ) + + # LayerNorm weights should be removed + assert f"blocks.{layer_idx}.ln1.w" not in state_dict + assert f"blocks.{layer_idx}.ln1.b" not in state_dict + + # But weights should NOT be centered (mean should not be zero) + w_q = state_dict[f"blocks.{layer_idx}.attn.W_Q"] + w_q_mean = torch.mean(w_q, dim=1, keepdim=True) + # The mean should NOT be close to zero (since centering is disabled) + assert not torch.allclose(w_q_mean, torch.zeros_like(w_q_mean), atol=1e-6) + + +if __name__ == "__main__": + # Run the tests + pytest.main([__file__, "-v"]) diff --git a/tests/integration/test_tensor_extraction_consistency.py b/tests/integration/test_tensor_extraction_consistency.py new file mode 100644 index 000000000..85c46a5e5 --- /dev/null +++ b/tests/integration/test_tensor_extraction_consistency.py @@ -0,0 +1,289 @@ +"""Integration tests for tensor extraction and math function consistency.""" + +import pytest +import torch + +from transformer_lens import HookedTransformer +from transformer_lens.model_bridge import TransformerBridge +from transformer_lens.weight_processing import ProcessWeights + + +@pytest.fixture(scope="class") +def test_models(): + """Set up test models for consistency testing.""" + device = "cpu" + model_name = "gpt2" + + # Load HookedTransformer (no processing) + hooked_model = 
HookedTransformer.from_pretrained( + model_name, + device=device, + fold_ln=False, + center_writing_weights=False, + center_unembed=False + ) + + # Load TransformerBridge (no processing) + bridge_model = TransformerBridge.boot_transformers(model_name, device=device) + + return { + "hooked_model": hooked_model, + "bridge_model": bridge_model, + "hooked_state_dict": hooked_model.state_dict(), + "bridge_state_dict": bridge_model.original_model.state_dict(), + } + + +class TestTensorExtractionConsistency: + """Test that tensor extraction returns consistent results between models.""" + + def test_extract_attention_tensors_shapes_match(self, test_models): + """Test that extracted tensors have matching shapes.""" + layer = 0 + + hooked_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["hooked_state_dict"], + test_models["hooked_model"].cfg, + layer, + adapter=None + ) + + bridge_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["bridge_state_dict"], + test_models["bridge_model"].cfg, + layer, + adapter=test_models["bridge_model"].adapter + ) + + tensor_names = ['wq', 'wk', 'wv', 'bq', 'bk', 'bv', 'ln1_b', 'ln1_w'] + + for tensor_name in tensor_names: + hooked_tensor = hooked_tensors[tensor_name] + bridge_tensor = bridge_tensors[tensor_name] + + if hooked_tensor is None and bridge_tensor is None: + continue + elif hooked_tensor is None or bridge_tensor is None: + pytest.fail(f"{tensor_name}: One is None, other is not") + + assert hooked_tensor.shape == bridge_tensor.shape, \ + f"{tensor_name} shape mismatch: {hooked_tensor.shape} vs {bridge_tensor.shape}" + + def test_extract_attention_tensors_values_match(self, test_models): + """Test that extracted tensors have matching values.""" + layer = 0 + + hooked_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["hooked_state_dict"], + test_models["hooked_model"].cfg, + layer, + adapter=None + ) + + bridge_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["bridge_state_dict"], + test_models["bridge_model"].cfg, + layer, + adapter=test_models["bridge_model"].adapter + ) + + tensor_names = ['wq', 'wk', 'wv', 'bq', 'bk', 'bv', 'ln1_b', 'ln1_w'] + + for tensor_name in tensor_names: + hooked_tensor = hooked_tensors[tensor_name] + bridge_tensor = bridge_tensors[tensor_name] + + if hooked_tensor is None or bridge_tensor is None: + continue + + max_diff = torch.max(torch.abs(hooked_tensor - bridge_tensor)).item() + assert max_diff < 1e-6, \ + f"{tensor_name} value mismatch: max_diff={max_diff:.2e}" + + @pytest.mark.parametrize("component", ['q', 'k', 'v']) + def test_fold_layer_norm_bias_single_consistency(self, test_models, component): + """Test fold_layer_norm_bias_single consistency for each component.""" + layer = 0 + + hooked_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["hooked_state_dict"], + test_models["hooked_model"].cfg, + layer, + adapter=None + ) + + bridge_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["bridge_state_dict"], + test_models["bridge_model"].cfg, + layer, + adapter=test_models["bridge_model"].adapter + ) + + if hooked_tensors['ln1_b'] is None: + pytest.skip("No LayerNorm bias to test") + + # Get tensors for the component + w_key = f'w{component}' + b_key = f'b{component}' + + hooked_result = ProcessWeights.fold_layer_norm_bias_single( + hooked_tensors[w_key], hooked_tensors[b_key], hooked_tensors['ln1_b'] + ) + bridge_result = 
ProcessWeights.fold_layer_norm_bias_single( + bridge_tensors[w_key], bridge_tensors[b_key], bridge_tensors['ln1_b'] + ) + + max_diff = torch.max(torch.abs(hooked_result - bridge_result)).item() + assert max_diff < 1e-6, \ + f"fold_layer_norm_bias_single({component}) mismatch: max_diff={max_diff:.2e}" + + @pytest.mark.parametrize("component", ['q', 'k', 'v']) + def test_fold_layer_norm_weight_single_consistency(self, test_models, component): + """Test fold_layer_norm_weight_single consistency for each component.""" + layer = 0 + + hooked_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["hooked_state_dict"], + test_models["hooked_model"].cfg, + layer, + adapter=None + ) + + bridge_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["bridge_state_dict"], + test_models["bridge_model"].cfg, + layer, + adapter=test_models["bridge_model"].adapter + ) + + if hooked_tensors['ln1_w'] is None: + pytest.skip("No LayerNorm weight to test") + + # Get tensor for the component + w_key = f'w{component}' + + hooked_result = ProcessWeights.fold_layer_norm_weight_single( + hooked_tensors[w_key], hooked_tensors['ln1_w'] + ) + bridge_result = ProcessWeights.fold_layer_norm_weight_single( + bridge_tensors[w_key], bridge_tensors['ln1_w'] + ) + + max_diff = torch.max(torch.abs(hooked_result - bridge_result)).item() + assert max_diff < 1e-6, \ + f"fold_layer_norm_weight_single({component}) mismatch: max_diff={max_diff:.2e}" + + @pytest.mark.parametrize("component", ['q', 'k', 'v']) + def test_center_weight_single_consistency(self, test_models, component): + """Test center_weight_single consistency for each component.""" + layer = 0 + + hooked_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["hooked_state_dict"], + test_models["hooked_model"].cfg, + layer, + adapter=None + ) + + bridge_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["bridge_state_dict"], + test_models["bridge_model"].cfg, + layer, + adapter=test_models["bridge_model"].adapter + ) + + # Get tensor for the component + w_key = f'w{component}' + + hooked_result = ProcessWeights.center_weight_single(hooked_tensors[w_key]) + bridge_result = ProcessWeights.center_weight_single(bridge_tensors[w_key]) + + max_diff = torch.max(torch.abs(hooked_result - bridge_result)).item() + assert max_diff < 1e-6, \ + f"center_weight_single({component}) mismatch: max_diff={max_diff:.2e}" + + def test_full_processing_pipeline_consistency(self, test_models): + """Test that the full processing pipeline produces consistent results.""" + layer = 0 + + hooked_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["hooked_state_dict"], + test_models["hooked_model"].cfg, + layer, + adapter=None + ) + + bridge_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["bridge_state_dict"], + test_models["bridge_model"].cfg, + layer, + adapter=test_models["bridge_model"].adapter + ) + + if hooked_tensors['ln1_b'] is None or hooked_tensors['ln1_w'] is None: + pytest.skip("No LayerNorm parameters to test full pipeline") + + # Apply full processing pipeline + def process_tensors(tensors): + wq, wk, wv = tensors['wq'], tensors['wk'], tensors['wv'] + bq, bk, bv = tensors['bq'], tensors['bk'], tensors['bv'] + ln1_b, ln1_w = tensors['ln1_b'], tensors['ln1_w'] + + # Step 1: Fold biases + bq = ProcessWeights.fold_layer_norm_bias_single(wq, bq, ln1_b) + bk = ProcessWeights.fold_layer_norm_bias_single(wk, bk, ln1_b) + bv = 
ProcessWeights.fold_layer_norm_bias_single(wv, bv, ln1_b) + + # Step 2: Fold weights + wq = ProcessWeights.fold_layer_norm_weight_single(wq, ln1_w) + wk = ProcessWeights.fold_layer_norm_weight_single(wk, ln1_w) + wv = ProcessWeights.fold_layer_norm_weight_single(wv, ln1_w) + + # Step 3: Center weights + wq = ProcessWeights.center_weight_single(wq) + wk = ProcessWeights.center_weight_single(wk) + wv = ProcessWeights.center_weight_single(wv) + + return wq, wk, wv, bq, bk, bv + + hooked_final = process_tensors(hooked_tensors) + bridge_final = process_tensors(bridge_tensors) + + # Compare final results + components = ['wq', 'wk', 'wv', 'bq', 'bk', 'bv'] + + for comp, hooked_result, bridge_result in zip(components, hooked_final, bridge_final): + max_diff = torch.max(torch.abs(hooked_result - bridge_result)).item() + assert max_diff < 1e-6, \ + f"Full pipeline mismatch for {comp}: max_diff={max_diff:.2e}" + + @pytest.mark.parametrize("layer", [0, 1, 2]) + def test_multiple_layers_consistency(self, test_models, layer): + """Test consistency across multiple layers.""" + if layer >= test_models["hooked_model"].cfg.n_layers: + pytest.skip(f"Layer {layer} doesn't exist in model") + + hooked_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["hooked_state_dict"], + test_models["hooked_model"].cfg, + layer, + adapter=None + ) + + bridge_tensors = ProcessWeights.extract_attention_tensors_for_folding( + test_models["bridge_state_dict"], + test_models["bridge_model"].cfg, + layer, + adapter=test_models["bridge_model"].adapter + ) + + # Test that tensors match + tensor_names = ['wq', 'wk', 'wv', 'bq', 'bk', 'bv'] + + for tensor_name in tensor_names: + hooked_tensor = hooked_tensors[tensor_name] + bridge_tensor = bridge_tensors[tensor_name] + + max_diff = torch.max(torch.abs(hooked_tensor - bridge_tensor)).item() + assert max_diff < 1e-6, \ + f"Layer {layer}, {tensor_name} mismatch: max_diff={max_diff:.2e}" diff --git a/tests/integration/test_weight_processing_integration.py b/tests/integration/test_weight_processing_integration.py new file mode 100644 index 000000000..892797330 --- /dev/null +++ b/tests/integration/test_weight_processing_integration.py @@ -0,0 +1,397 @@ +""" +Integration tests for weight processing functions with HookedTransformer and transformer bridge. + +These tests verify that the individual math functions (fold_layer_norm_biases, +fold_layer_norm_weights, center_attention_weights) produce consistent results +across different model formats. 
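+The helper functions operate on TransformerLens-shaped tensors: attention weights of shape
+[n_heads, d_model, d_head] and biases of shape [n_heads, d_head], as set up in the fixtures below.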
+""" + +import numpy as np +import pytest +import torch + +from transformer_lens.architecture_adapter import ArchitectureAdapter +from transformer_lens.HookedTransformer import HookedTransformer +from transformer_lens.weight_processing import ProcessWeights + + +class TestWeightProcessingIntegration: + """Integration tests for weight processing with different model formats.""" + + @pytest.fixture + def gpt2_small_model(self): + """Load GPT-2 Small model for testing.""" + return HookedTransformer.from_pretrained("gpt2-small") + + @pytest.fixture + def gpt2_small_adapter(self): + """Create adapter for GPT-2 Small model.""" + return ArchitectureAdapter.from_pretrained("gpt2-small") + + @pytest.fixture + def sample_tensors(self): + """Create sample tensors for testing math functions.""" + torch.manual_seed(42) + + # Create sample tensors with realistic dimensions + n_heads = 12 + d_model = 768 + d_head = 64 + + # Weight tensors: [n_heads, d_model, d_head] + wq_tensor = torch.randn(n_heads, d_model, d_head) + wk_tensor = torch.randn(n_heads, d_model, d_head) + wv_tensor = torch.randn(n_heads, d_model, d_head) + + # Bias tensors: [n_heads, d_head] + bq_tensor = torch.randn(n_heads, d_head) + bk_tensor = torch.randn(n_heads, d_head) + bv_tensor = torch.randn(n_heads, d_head) + + # LayerNorm tensors: [d_model] + ln_bias = torch.randn(d_model) + ln_weight = torch.randn(d_model) + + return { + "weights": (wq_tensor, wk_tensor, wv_tensor), + "biases": (bq_tensor, bk_tensor, bv_tensor), + "ln_bias": ln_bias, + "ln_weight": ln_weight, + } + + def test_fold_layer_norm_biases_consistency(self, sample_tensors): + """Test that fold_layer_norm_biases produces consistent results.""" + wq_tensor, wk_tensor, wv_tensor = sample_tensors["weights"] + bq_tensor, bk_tensor, bv_tensor = sample_tensors["biases"] + ln_bias = sample_tensors["ln_bias"] + + # Test the function + new_bq, new_bk, new_bv = ProcessWeights.fold_layer_norm_biases( + wq_tensor, wk_tensor, wv_tensor, bq_tensor, bk_tensor, bv_tensor, ln_bias + ) + + # Verify shapes are preserved + assert new_bq.shape == bq_tensor.shape + assert new_bk.shape == bk_tensor.shape + assert new_bv.shape == bv_tensor.shape + + # Verify the mathematical correctness + expected_bq = bq_tensor + (wq_tensor * ln_bias[None, :, None]).sum(-2) + expected_bk = bk_tensor + (wk_tensor * ln_bias[None, :, None]).sum(-2) + expected_bv = bv_tensor + (wv_tensor * ln_bias[None, :, None]).sum(-2) + + torch.testing.assert_close(new_bq, expected_bq) + torch.testing.assert_close(new_bk, expected_bk) + torch.testing.assert_close(new_bv, expected_bv) + + def test_fold_layer_norm_weights_consistency(self, sample_tensors): + """Test that fold_layer_norm_weights produces consistent results.""" + wq_tensor, wk_tensor, wv_tensor = sample_tensors["weights"] + ln_weight = sample_tensors["ln_weight"] + + # Test the function + new_wq, new_wk, new_wv = ProcessWeights.fold_layer_norm_weights( + wq_tensor, wk_tensor, wv_tensor, ln_weight + ) + + # Verify shapes are preserved + assert new_wq.shape == wq_tensor.shape + assert new_wk.shape == wk_tensor.shape + assert new_wv.shape == wv_tensor.shape + + # Verify the mathematical correctness + expected_wq = wq_tensor * ln_weight[None, :, None] + expected_wk = wk_tensor * ln_weight[None, :, None] + expected_wv = wv_tensor * ln_weight[None, :, None] + + torch.testing.assert_close(new_wq, expected_wq) + torch.testing.assert_close(new_wk, expected_wk) + torch.testing.assert_close(new_wv, expected_wv) + + def test_center_attention_weights_consistency(self, 
sample_tensors): + """Test that center_attention_weights produces consistent results.""" + wq_tensor, wk_tensor, wv_tensor = sample_tensors["weights"] + + # Test the function + centered_wq, centered_wk, centered_wv = ProcessWeights.center_attention_weights( + wq_tensor, wk_tensor, wv_tensor + ) + + # Verify shapes are preserved + assert centered_wq.shape == wq_tensor.shape + assert centered_wk.shape == wk_tensor.shape + assert centered_wv.shape == wv_tensor.shape + + # Verify the mathematical correctness + import einops + expected_wq = wq_tensor - einops.reduce( + wq_tensor, "head_index d_model d_head -> head_index 1 d_head", "mean" + ) + expected_wk = wk_tensor - einops.reduce( + wk_tensor, "head_index d_model d_head -> head_index 1 d_head", "mean" + ) + expected_wv = wv_tensor - einops.reduce( + wv_tensor, "head_index d_model d_head -> head_index 1 d_head", "mean" + ) + + torch.testing.assert_close(centered_wq, expected_wq) + torch.testing.assert_close(centered_wk, expected_wk) + torch.testing.assert_close(centered_wv, expected_wv) + + def test_extract_attention_tensors_with_hooked_transformer(self, gpt2_small_model): + """Test tensor extraction with HookedTransformer model.""" + model = gpt2_small_model + state_dict = model.state_dict() + cfg = model.cfg + layer = 0 + + # Get parameter keys (no adapter needed for HookedTransformer) + W_Q_key = f"blocks.{layer}.attn.W_Q" + W_K_key = f"blocks.{layer}.attn.W_K" + W_V_key = f"blocks.{layer}.attn.W_V" + b_Q_key = f"blocks.{layer}.attn.b_Q" + b_K_key = f"blocks.{layer}.attn.b_K" + b_V_key = f"blocks.{layer}.attn.b_V" + + # Extract tensors + tensors, combined_qkv_info = ProcessWeights._extract_attention_tensors( + state_dict, cfg, layer, None, W_Q_key, W_K_key, W_V_key, b_Q_key, b_K_key, b_V_key + ) + + wq_tensor, wk_tensor, wv_tensor = tensors["weights"] + bq_tensor, bk_tensor, bv_tensor = tensors["biases"] + + # Verify shapes + expected_shape = (cfg.n_heads, cfg.d_model, cfg.d_head) + assert wq_tensor.shape == expected_shape + assert wk_tensor.shape == expected_shape + assert wv_tensor.shape == expected_shape + + expected_bias_shape = (cfg.n_heads, cfg.d_head) + assert bq_tensor.shape == expected_bias_shape + assert bk_tensor.shape == expected_bias_shape + assert bv_tensor.shape == expected_bias_shape + + # Verify no combined QKV info (HookedTransformer uses separate format) + assert combined_qkv_info is None + + def test_extract_attention_tensors_with_adapter(self, gpt2_small_adapter): + """Test tensor extraction with HuggingFace adapter.""" + # Create a mock state dict with HuggingFace format + d_model = 768 + n_heads = 12 + d_head = 64 + + # Combined QKV weight: [d_model, 3*d_model] + combined_qkv_weight = torch.randn(d_model, 3 * d_model) + # Combined QKV bias: [3*d_model] + combined_qkv_bias = torch.randn(3 * d_model) + + # Mock state dict + state_dict = { + "transformer.h.0.attn.c_attn.weight": combined_qkv_weight, + "transformer.h.0.attn.c_attn.bias": combined_qkv_bias, + } + + # Mock config + class MockConfig: + n_heads = n_heads + d_head = d_head + d_model = d_model + + cfg = MockConfig() + layer = 0 + adapter = gpt2_small_adapter + + # Get parameter keys + W_Q_key = adapter.translate_transformer_lens_path(f"blocks.{layer}.attn.W_Q") + W_K_key = adapter.translate_transformer_lens_path(f"blocks.{layer}.attn.W_K") + W_V_key = adapter.translate_transformer_lens_path(f"blocks.{layer}.attn.W_V") + b_Q_key = adapter.translate_transformer_lens_path(f"blocks.{layer}.attn.b_Q") + b_K_key = 
adapter.translate_transformer_lens_path(f"blocks.{layer}.attn.b_K") + b_V_key = adapter.translate_transformer_lens_path(f"blocks.{layer}.attn.b_V") + + # Extract tensors + tensors, combined_qkv_info = ProcessWeights._extract_attention_tensors( + state_dict, cfg, layer, adapter, W_Q_key, W_K_key, W_V_key, b_Q_key, b_K_key, b_V_key + ) + + wq_tensor, wk_tensor, wv_tensor = tensors["weights"] + bq_tensor, bk_tensor, bv_tensor = tensors["biases"] + + # Verify shapes (should be in TransformerLens format) + expected_shape = (n_heads, d_model, d_head) + assert wq_tensor.shape == expected_shape + assert wk_tensor.shape == expected_shape + assert wv_tensor.shape == expected_shape + + expected_bias_shape = (n_heads, d_head) + assert bq_tensor.shape == expected_bias_shape + assert bk_tensor.shape == expected_bias_shape + assert bv_tensor.shape == expected_bias_shape + + # Verify combined QKV info exists + assert combined_qkv_info is not None + assert combined_qkv_info["n_heads"] == n_heads + assert combined_qkv_info["d_head"] == d_head + assert combined_qkv_info["d_model"] == d_model + + def test_full_pipeline_with_hooked_transformer(self, gpt2_small_model): + """Test the full pipeline with HookedTransformer model.""" + model = gpt2_small_model + state_dict = model.state_dict() + cfg = model.cfg + layer = 0 + + # Get parameter keys + W_Q_key = f"blocks.{layer}.attn.W_Q" + W_K_key = f"blocks.{layer}.attn.W_K" + W_V_key = f"blocks.{layer}.attn.W_V" + b_Q_key = f"blocks.{layer}.attn.b_Q" + b_K_key = f"blocks.{layer}.attn.b_K" + b_V_key = f"blocks.{layer}.attn.b_V" + + # Extract tensors + tensors, combined_qkv_info = ProcessWeights._extract_attention_tensors( + state_dict, cfg, layer, None, W_Q_key, W_K_key, W_V_key, b_Q_key, b_K_key, b_V_key + ) + + wq_tensor, wk_tensor, wv_tensor = tensors["weights"] + bq_tensor, bk_tensor, bv_tensor = tensors["biases"] + + # Test LayerNorm folding if parameters exist + ln1_b_key = f"blocks.{layer}.ln1.b" + ln1_w_key = f"blocks.{layer}.ln1.w" + + if ln1_b_key in state_dict and ln1_w_key in state_dict: + ln1_b = state_dict[ln1_b_key] + ln1_w = state_dict[ln1_w_key] + + # Test bias folding + new_bq, new_bk, new_bv = ProcessWeights.fold_layer_norm_biases( + wq_tensor, wk_tensor, wv_tensor, bq_tensor, bk_tensor, bv_tensor, ln1_b + ) + + # Test weight folding + new_wq, new_wk, new_wv = ProcessWeights.fold_layer_norm_weights( + wq_tensor, wk_tensor, wv_tensor, ln1_w + ) + + # Verify shapes are preserved + assert new_bq.shape == bq_tensor.shape + assert new_bk.shape == bk_tensor.shape + assert new_bv.shape == bv_tensor.shape + assert new_wq.shape == wq_tensor.shape + assert new_wk.shape == wk_tensor.shape + assert new_wv.shape == wv_tensor.shape + + # Test weight centering + centered_wq, centered_wk, centered_wv = ProcessWeights.center_attention_weights( + wq_tensor, wk_tensor, wv_tensor + ) + + # Verify shapes are preserved + assert centered_wq.shape == wq_tensor.shape + assert centered_wk.shape == wk_tensor.shape + assert centered_wv.shape == wv_tensor.shape + + def test_consistency_between_formats(self, gpt2_small_model, gpt2_small_adapter): + """Test that the same mathematical operations produce consistent results across formats.""" + model = gpt2_small_model + cfg = model.cfg + layer = 0 + + # Get tensors from HookedTransformer format + state_dict_tl = model.state_dict() + W_Q_key = f"blocks.{layer}.attn.W_Q" + W_K_key = f"blocks.{layer}.attn.W_K" + W_V_key = f"blocks.{layer}.attn.W_V" + b_Q_key = f"blocks.{layer}.attn.b_Q" + b_K_key = f"blocks.{layer}.attn.b_K" + 
b_V_key = f"blocks.{layer}.attn.b_V" + + tensors_tl, _ = ProcessWeights._extract_attention_tensors( + state_dict_tl, cfg, layer, None, W_Q_key, W_K_key, W_V_key, b_Q_key, b_K_key, b_V_key + ) + wq_tl, wk_tl, wv_tl = tensors_tl["weights"] + bq_tl, bk_tl, bv_tl = tensors_tl["biases"] + + # Convert to HuggingFace format and back + adapter = gpt2_small_adapter + + # Convert TL tensors to HF format + wq_hf = ProcessWeights.convert_tensor_to_hf_format( + wq_tl, f"blocks.{layer}.attn.W_Q", adapter, cfg, layer + ) + wk_hf = ProcessWeights.convert_tensor_to_hf_format( + wk_tl, f"blocks.{layer}.attn.W_K", adapter, cfg, layer + ) + wv_hf = ProcessWeights.convert_tensor_to_hf_format( + wv_tl, f"blocks.{layer}.attn.W_V", adapter, cfg, layer + ) + bq_hf = ProcessWeights.convert_tensor_to_hf_format( + bq_tl, f"blocks.{layer}.attn.b_Q", adapter, cfg, layer + ) + bk_hf = ProcessWeights.convert_tensor_to_hf_format( + bk_tl, f"blocks.{layer}.attn.b_K", adapter, cfg, layer + ) + bv_hf = ProcessWeights.convert_tensor_to_hf_format( + bv_tl, f"blocks.{layer}.attn.b_V", adapter, cfg, layer + ) + + # Convert back to TL format + wq_tl_converted = ProcessWeights.convert_tensor_to_tl_format( + f"blocks.{layer}.attn.W_Q", adapter, {"dummy": wq_hf}, cfg, layer + ) + wk_tl_converted = ProcessWeights.convert_tensor_to_tl_format( + f"blocks.{layer}.attn.W_K", adapter, {"dummy": wk_hf}, cfg, layer + ) + wv_tl_converted = ProcessWeights.convert_tensor_to_tl_format( + f"blocks.{layer}.attn.W_V", adapter, {"dummy": wv_hf}, cfg, layer + ) + bq_tl_converted = ProcessWeights.convert_tensor_to_tl_format( + f"blocks.{layer}.attn.b_Q", adapter, {"dummy": bq_hf}, cfg, layer + ) + bk_tl_converted = ProcessWeights.convert_tensor_to_tl_format( + f"blocks.{layer}.attn.b_K", adapter, {"dummy": bk_hf}, cfg, layer + ) + bv_tl_converted = ProcessWeights.convert_tensor_to_tl_format( + f"blocks.{layer}.attn.b_V", adapter, {"dummy": bv_hf}, cfg, layer + ) + + # Test that the math functions produce the same results + ln_bias = torch.randn(cfg.d_model) + ln_weight = torch.randn(cfg.d_model) + + # Apply operations to original TL tensors + new_bq_tl, new_bk_tl, new_bv_tl = ProcessWeights.fold_layer_norm_biases( + wq_tl, wk_tl, wv_tl, bq_tl, bk_tl, bv_tl, ln_bias + ) + new_wq_tl, new_wk_tl, new_wv_tl = ProcessWeights.fold_layer_norm_weights( + wq_tl, wk_tl, wv_tl, ln_weight + ) + centered_wq_tl, centered_wk_tl, centered_wv_tl = ProcessWeights.center_attention_weights( + wq_tl, wk_tl, wv_tl + ) + + # Apply operations to converted TL tensors + new_bq_converted, new_bk_converted, new_bv_converted = ProcessWeights.fold_layer_norm_biases( + wq_tl_converted, wk_tl_converted, wv_tl_converted, bq_tl_converted, bk_tl_converted, bv_tl_converted, ln_bias + ) + new_wq_converted, new_wk_converted, new_wv_converted = ProcessWeights.fold_layer_norm_weights( + wq_tl_converted, wk_tl_converted, wv_tl_converted, ln_weight + ) + centered_wq_converted, centered_wk_converted, centered_wv_converted = ProcessWeights.center_attention_weights( + wq_tl_converted, wk_tl_converted, wv_tl_converted + ) + + # Verify results are consistent (within numerical precision) + torch.testing.assert_close(new_bq_tl, new_bq_converted, atol=1e-6, rtol=1e-6) + torch.testing.assert_close(new_bk_tl, new_bk_converted, atol=1e-6, rtol=1e-6) + torch.testing.assert_close(new_bv_tl, new_bv_converted, atol=1e-6, rtol=1e-6) + torch.testing.assert_close(new_wq_tl, new_wq_converted, atol=1e-6, rtol=1e-6) + torch.testing.assert_close(new_wk_tl, new_wk_converted, atol=1e-6, rtol=1e-6) + 
torch.testing.assert_close(new_wv_tl, new_wv_converted, atol=1e-6, rtol=1e-6) + torch.testing.assert_close(centered_wq_tl, centered_wq_converted, atol=1e-6, rtol=1e-6) + torch.testing.assert_close(centered_wk_tl, centered_wk_converted, atol=1e-6, rtol=1e-6) + torch.testing.assert_close(centered_wv_tl, centered_wv_converted, atol=1e-6, rtol=1e-6) diff --git a/tests/unit/test_bridge_state_dict.py b/tests/unit/test_bridge_state_dict.py new file mode 100644 index 000000000..45a7457b6 --- /dev/null +++ b/tests/unit/test_bridge_state_dict.py @@ -0,0 +1,370 @@ +#!/usr/bin/env python3 +""" +Unit tests for TransformerBridge state_dict functionality. + +This module tests that the bridge properly handles state_dict operations by: +1. Filtering out _original_component references when getting state_dict +2. Mapping clean keys back to _original_component keys when loading state_dict +3. Supporting both original model keys and TransformerLens keys +""" + + +import pytest +import torch +import torch.nn as nn + +from transformer_lens.model_bridge.architecture_adapter import ArchitectureAdapter +from transformer_lens.model_bridge.bridge import TransformerBridge + + +class MockAdapter(ArchitectureAdapter): + """Mock adapter for testing.""" + + def __init__(self): + self.cfg = type( + "Config", (), {"n_layers": 1, "d_model": 10, "n_heads": 2, "d_head": 5, "device": "cpu"} + )() + self.component_mapping = {} + + def get_component_mapping(self): + return {} + + def get_remote_component(self, model, path): + return getattr(model, path) + + def translate_transformer_lens_path(self, path): + return path + + +class MockModelWithOriginalComponent(nn.Module): + """Test model that simulates having _original_component references.""" + + def __init__(self): + super().__init__() + self.linear = nn.Linear(10, 5) + self.embedding = nn.Embedding(100, 10) + # Simulate the bridge adding _original_component references + self.add_module("_original_component", nn.Linear(10, 5)) + + def __getattr__(self, name): + """Allow access to OV and other components through _original_component.""" + if name == "OV": + # Return a mock OV component + return nn.Linear(5, 10) + return super().__getattr__(name) + + +class MockTransformerBridge(TransformerBridge): + """Test bridge that doesn't require full initialization.""" + + def __init__(self, original_model): + # Skip the full initialization to avoid hook setup issues + nn.Module.__init__(self) + self.original_model = original_model + self.adapter = MockAdapter() + self.cfg = self.adapter.cfg + self.tokenizer = None + self.compatibility_mode = False + self._hook_cache = None + self._hook_registry = {} + + +class TestBridgeStateDict: + """Test cases for bridge state_dict functionality.""" + + def test_state_dict_filters_original_component_references(self): + """Test that state_dict() filters out _original_component references but preserves submodules.""" + # Create test model with _original_component references + test_model = MockModelWithOriginalComponent() + bridge = MockTransformerBridge(test_model) + + # Get state dict + state_dict = bridge.state_dict() + + # Verify no direct _original_component references in the keys + has_original_component = any("_original_component" in key for key in state_dict.keys()) + assert ( + not has_original_component + ), f"Found _original_component references: {[k for k in state_dict.keys() if '_original_component' in k]}" + + # Verify we have the expected clean keys + expected_keys = {"linear.weight", "linear.bias", "embedding.weight"} + actual_keys = 
set(state_dict.keys()) + assert actual_keys == expected_keys, f"Expected {expected_keys}, got {actual_keys}" + + # Verify that submodules like OV are still accessible via __getattr__ + # This tests that the _original_component module itself is filtered but its submodules are accessible + try: + ov_component = bridge.OV + assert ov_component is not None, "OV component should be accessible" + except AttributeError: + # This is expected if the mock model doesn't have an OV component + pass + + def test_load_state_dict_with_clean_keys(self): + """Test that load_state_dict() accepts clean keys and maps them correctly.""" + # Create test model with _original_component references + test_model = MockModelWithOriginalComponent() + bridge = MockTransformerBridge(test_model) + + # Get initial state dict + initial_state_dict = bridge.state_dict() + + # Create modified state dict with clean keys + modified_state_dict = {} + for key, tensor in initial_state_dict.items(): + modified_state_dict[key] = tensor + 0.1 + + # Load the modified state dict + missing_keys, unexpected_keys = bridge.load_state_dict(modified_state_dict, strict=False) + + # Verify no unexpected keys (missing keys are expected for _original_component) + assert len(unexpected_keys) == 0, f"Unexpected unexpected keys: {unexpected_keys}" + # Missing keys should only be _original_component keys + expected_missing = {"_original_component.weight", "_original_component.bias"} + actual_missing = set(missing_keys) + assert ( + actual_missing == expected_missing + ), f"Expected missing keys {expected_missing}, got {actual_missing}" + + # Verify weights were actually loaded + new_state_dict = bridge.state_dict() + for key in initial_state_dict.keys(): + expected_weight = modified_state_dict[key] # This is original + 0.1 + new_weight = new_state_dict[key] + assert torch.allclose( + new_weight, expected_weight, atol=1e-6 + ), f"Weight for {key} was not loaded correctly" + + def test_load_state_dict_with_original_component_keys(self): + """Test that load_state_dict() accepts keys with _original_component references.""" + # Create test model with _original_component references + test_model = MockModelWithOriginalComponent() + bridge = MockTransformerBridge(test_model) + + # Get the raw state dict (with _original_component references) + raw_state_dict = test_model.state_dict() + + # Create modified state dict with ALL keys (including _original_component keys) + modified_state_dict = {} + for key, tensor in raw_state_dict.items(): + modified_state_dict[key] = tensor + 0.2 + + # Load the modified state dict + missing_keys, unexpected_keys = bridge.load_state_dict(modified_state_dict, strict=False) + + # Verify no missing or unexpected keys when loading with original keys + assert len(missing_keys) == 0, f"Unexpected missing keys: {missing_keys}" + assert len(unexpected_keys) == 0, f"Unexpected unexpected keys: {unexpected_keys}" + + # Verify weights were loaded correctly + new_state_dict = bridge.state_dict() + for key in modified_state_dict.keys(): + if not key.startswith("_original_component") and key in new_state_dict: + expected_weight = modified_state_dict[key] # This is original + 0.2 + new_weight = new_state_dict[key] + assert torch.allclose( + new_weight, expected_weight, atol=1e-6 + ), f"Weight for {key} was not loaded correctly" + + def test_round_trip_state_dict_operations(self): + """Test round-trip: save -> modify -> load -> save.""" + # Create test model + test_model = MockModelWithOriginalComponent() + bridge = 
MockTransformerBridge(test_model) + + # Get initial weights + initial_weights = bridge.state_dict() + + # Modify weights + modified_weights = {k: v + 0.3 for k, v in initial_weights.items()} + + # Load modified weights + bridge.load_state_dict(modified_weights, strict=False) + + # Verify weights were loaded + final_weights = bridge.state_dict() + for key in initial_weights.keys(): + expected_weight = modified_weights[key] # This is initial + 0.3 + actual_weight = final_weights[key] + assert torch.allclose( + expected_weight, actual_weight, atol=1e-6 + ), f"Round-trip failed for {key}" + + def test_state_dict_with_transformer_lens_keys(self): + """Test state_dict operations with TransformerLens-style keys.""" + + # Create a simple model with TL-style structure + class MockTLModel(nn.Module): + def __init__(self): + super().__init__() + self.embed = nn.Embedding(100, 10) + self.unembed = nn.Linear(10, 100) + self.linear = nn.Linear(10, 10) + + # Create bridge with mock model + mock_model = MockTLModel() + bridge = MockTransformerBridge(mock_model) + + # Test state_dict with TL keys + state_dict = bridge.state_dict() + + # Verify we get clean keys (no _original_component references) + has_original_component = any("_original_component" in key for key in state_dict.keys()) + assert ( + not has_original_component + ), f"Found _original_component references: {[k for k in state_dict.keys() if '_original_component' in k]}" + + # Test loading with TL keys + modified_state_dict = {k: v + 0.1 for k, v in state_dict.items()} + missing_keys, unexpected_keys = bridge.load_state_dict(modified_state_dict, strict=False) + + # Verify successful loading + assert len(missing_keys) == 0, f"Unexpected missing keys: {missing_keys}" + assert len(unexpected_keys) == 0, f"Unexpected unexpected keys: {unexpected_keys}" + + def test_state_dict_preserves_tensor_properties(self): + """Test that state_dict operations preserve tensor properties (device, dtype, etc.).""" + # Create test model on CPU + test_model = MockModelWithOriginalComponent() + bridge = MockTransformerBridge(test_model) + + # Get state dict + state_dict = bridge.state_dict() + + # Verify tensor properties are preserved + for key, tensor in state_dict.items(): + assert isinstance(tensor, torch.Tensor), f"{key} is not a tensor" + assert tensor.device.type == "cpu", f"{key} is not on CPU" + assert tensor.dtype == torch.float32, f"{key} is not float32" + + def test_state_dict_with_different_prefixes(self): + """Test state_dict operations with different prefix scenarios.""" + # Create test model + test_model = MockModelWithOriginalComponent() + bridge = MockTransformerBridge(test_model) + + # Test with prefix + state_dict_with_prefix = bridge.state_dict(prefix="model.") + + # Verify prefix is applied + for key in state_dict_with_prefix.keys(): + assert key.startswith("model."), f"Key {key} does not have prefix 'model.'" + + # Test loading with prefix + modified_with_prefix = {k: v + 0.1 for k, v in state_dict_with_prefix.items()} + missing_keys, unexpected_keys = bridge.load_state_dict(modified_with_prefix, strict=False) + + # Should have missing keys because we're loading with prefix but model expects no prefix + assert len(missing_keys) > 0, "Expected missing keys when loading with prefix" + + def test_state_dict_strict_mode(self): + """Test state_dict loading in strict mode.""" + # Create test model + test_model = MockModelWithOriginalComponent() + bridge = MockTransformerBridge(test_model) + + # Get initial state dict + initial_state_dict = 
bridge.state_dict() + + # Create state dict with extra keys + extra_state_dict = initial_state_dict.copy() + extra_state_dict["nonexistent.weight"] = torch.randn(5, 10) + + # Test strict mode (should fail with unexpected keys) + with pytest.raises(RuntimeError, match="Unexpected key"): + bridge.load_state_dict(extra_state_dict, strict=True) + + # Test non-strict mode (should succeed) + missing_keys, unexpected_keys = bridge.load_state_dict(extra_state_dict, strict=False) + assert "nonexistent.weight" in unexpected_keys, "Extra key should be in unexpected_keys" + + def test_load_state_dict_with_mixed_keys(self): + """Test that load_state_dict() accepts a mix of clean keys and original keys.""" + # Create test model with _original_component references + test_model = MockModelWithOriginalComponent() + bridge = MockTransformerBridge(test_model) + + # Get both clean and raw state dicts + clean_state_dict = bridge.state_dict() + raw_state_dict = test_model.state_dict() + + # Create a mixed state dict with both clean and original keys + mixed_state_dict = {} + # Add some clean keys + for key, tensor in clean_state_dict.items(): + if key == "linear.weight": # Only add one clean key + mixed_state_dict[key] = tensor + 0.3 + break + + # Add some original keys (including _original_component) + for key, tensor in raw_state_dict.items(): + if key == "linear.bias": # Add one original key + mixed_state_dict[key] = tensor + 0.3 + break + + # Load the mixed state dict + missing_keys, unexpected_keys = bridge.load_state_dict(mixed_state_dict, strict=False) + + # Should have missing keys for the keys we didn't include + assert len(unexpected_keys) == 0, f"Unexpected unexpected keys: {unexpected_keys}" + + # Verify the weights we loaded were loaded correctly + new_state_dict = bridge.state_dict() + for key in mixed_state_dict.keys(): + if not key.startswith("_original_component") and key in new_state_dict: + expected_weight = mixed_state_dict[key] + new_weight = new_state_dict[key] + assert torch.allclose( + new_weight, expected_weight, atol=1e-6 + ), f"Weight for {key} was not loaded correctly" + + def test_state_dict_filtering_preserves_submodules(self): + """Test that state_dict filtering preserves submodules while filtering _original_component.""" + # Create a simple test model + test_model = nn.Module() + test_model.linear = nn.Linear(10, 5) + test_model.embedding = nn.Embedding(100, 10) + # Add a mock OV component directly + test_model.OV = nn.Linear(5, 10) + # Simulate the bridge adding _original_component references + test_model.add_module("_original_component", nn.Linear(10, 5)) + + bridge = MockTransformerBridge(test_model) + + # Get state dict (this should filter out _original_component but preserve submodules) + state_dict = bridge.state_dict() + + # Verify no _original_component references in state_dict + has_original_component = any("_original_component" in key for key in state_dict.keys()) + assert ( + not has_original_component + ), f"Found _original_component references: {[k for k in state_dict.keys() if '_original_component' in k]}" + + # Verify that submodules like OV are still in the state_dict + ov_keys = [k for k in state_dict.keys() if "OV" in k] + assert len(ov_keys) > 0, "OV component should be present in state_dict" + + # Verify we have the expected clean keys + expected_keys = {"linear.weight", "linear.bias", "embedding.weight", "OV.weight", "OV.bias"} + actual_keys = set(state_dict.keys()) + assert actual_keys == expected_keys, f"Expected {expected_keys}, got {actual_keys}" + + def 
test_state_dict_with_empty_model(self): + """Test state_dict operations with an empty model.""" + # Create empty model + empty_model = nn.Module() + bridge = MockTransformerBridge(empty_model) + + # Test state_dict + state_dict = bridge.state_dict() + assert len(state_dict) == 0, "Empty model should have empty state_dict" + + # Test load_state_dict + missing_keys, unexpected_keys = bridge.load_state_dict({}, strict=False) + assert len(missing_keys) == 0, "Should have no missing keys for empty model" + assert len(unexpected_keys) == 0, "Should have no unexpected keys for empty model" + + +if __name__ == "__main__": + pytest.main([__file__]) diff --git a/transformer_lens/model_bridge/architecture_adapter.py b/transformer_lens/model_bridge/architecture_adapter.py index 5de366259..19d327d90 100644 --- a/transformer_lens/model_bridge/architecture_adapter.py +++ b/transformer_lens/model_bridge/architecture_adapter.py @@ -183,6 +183,110 @@ def get_component_from_list_module( f"Component {subcomponent_name} not found in {parts[0]} components" ) + def get_generalized_component(self, path: TransformerLensPath) -> GeneralizedComponent: + """Get the generalized component (bridge component) for a given TransformerLens path. + + Args: + path: The TransformerLens path to get the component for + + Returns: + The generalized component that handles this path + + Raises: + ValueError: If component_mapping is not set or if the component is not found + + Examples: + Get the embedding bridge component: + + >>> # adapter.get_generalized_component("embed") + >>> # + + Get the attention bridge component: + + >>> # adapter.get_generalized_component("blocks.0.attn") + >>> # + """ + if self.component_mapping is None: + raise ValueError( + "component_mapping must be set before calling get_generalized_component" + ) + + # Strip parameter suffixes to get the component path + component_path, _ = self._preprocess_parameter_path(path) + parts = component_path.split(".") + if not parts: + raise ValueError("Empty path") + + # Get the top-level component from the mapping + if parts[0] not in self.component_mapping: + raise ValueError(f"Component {parts[0]} not found in component mapping") + + bridge_component = self.component_mapping[parts[0]] + + if len(parts) == 1: + # Simple case: just return the top-level component + return bridge_component + + # For nested paths, navigate through the component hierarchy + current_component = bridge_component + for i in range(1, len(parts)): + part = parts[i] + + # Handle list item indexing (like blocks.0) + if part.isdigit(): + # For list items, we return the bridge component itself + # since the indexing is handled at the model level + continue + + # Navigate to subcomponent + if hasattr(current_component, "submodules") and part in current_component.submodules: + current_component = current_component.submodules[part] + else: + # Check if this is an attention parameter (q, k, v, o) that should map to the attention component + # This handles cases like "blocks.0.attn.W_Q" -> "blocks.0.attn.q" -> return attention component + if ( + hasattr(current_component, "__class__") + and "AttentionBridge" in current_component.__class__.__name__ + and part in ["q", "k", "v", "o"] + ): + # Check if this is a JointQKVAttentionBridge (like GPT-2) or regular AttentionBridge (like Gemma3) + if "JointQKV" in current_component.__class__.__name__: + # For joint QKV attention, return the attention component itself + # since the individual q, k, v, o are handled as attributes, not submodules + continue + else: 
+ # For separate Q, K, V attention (like Gemma3), navigate to the subcomponent + if ( + hasattr(current_component, "submodules") + and part in current_component.submodules + ): + current_component = current_component.submodules[part] + continue + # Check if this is an MLP parameter (in, out, gate) that should map to the MLP component + # This handles cases like "blocks.0.mlp.W_in" -> "blocks.0.mlp.in" -> return MLP component + elif ( + hasattr(current_component, "__class__") + and "MLPBridge" in current_component.__class__.__name__ + and part in ["in", "out", "gate"] + ): + # Check if this MLP has separate subcomponents (like Gemma3) or property aliases (like GPT-2) + if ( + hasattr(current_component, "submodules") + and part in current_component.submodules + ): + # For separate MLP components (like Gemma3), navigate to the subcomponent + current_component = current_component.submodules[part] + continue + else: + # For property alias MLP (like GPT-2), return the MLP component itself + continue + else: + raise ValueError( + f"Component {part} not found in {'.'.join(parts[:i])} components" + ) + + return current_component + def get_component(self, model: RemoteModel, path: TransformerLensPath) -> RemoteComponent: """Get a component from the model using the component_mapping. @@ -662,3 +766,84 @@ def flatten_nested_dict( items[parent_key] = input return items + + def convert_hf_key_to_bridge_key(self, hf_key: str) -> str: + """Convert a HuggingFace-style key to a bridge key with _original_component references. + + Args: + hf_key: The HuggingFace-style key (e.g., "transformer.h.0.attn.c_attn.weight") + + Returns: + The bridge key with _original_component references (e.g., "transformer.h.0._original_component.attn._original_component.c_attn._original_component.weight") + """ + # Handle different key patterns + if "transformer.h." 
in hf_key: + parts = hf_key.split(".") + if len(parts) >= 4 and parts[2].isdigit(): + layer = parts[2] + + # Pattern: transformer.h.X.attn.c_attn.weight -> transformer.h.X._original_component.attn._original_component.c_attn._original_component.weight + if "attn.c_attn" in hf_key: + return f"transformer.h.{layer}._original_component.attn._original_component.c_attn._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.attn.c_proj.weight -> transformer.h.X._original_component.attn._original_component.c_proj._original_component.weight + elif "attn.c_proj" in hf_key: + return f"transformer.h.{layer}._original_component.attn._original_component.c_proj._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.mlp.c_fc.weight -> transformer.h.X._original_component.mlp._original_component.c_fc._original_component.weight + elif "mlp.c_fc" in hf_key: + return f"transformer.h.{layer}._original_component.mlp._original_component.c_fc._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.mlp.c_proj.weight -> transformer.h.X._original_component.mlp._original_component.c_proj._original_component.weight + elif "mlp.c_proj" in hf_key: + return f"transformer.h.{layer}._original_component.mlp._original_component.c_proj._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.attn.qkv.weight -> transformer.h.X._original_component.attn.qkv._original_component.weight + elif "attn.qkv" in hf_key: + return f"transformer.h.{layer}._original_component.attn.qkv._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.attn.o.weight -> transformer.h.X._original_component.attn.o._original_component.weight + elif "attn.o" in hf_key: + return f"transformer.h.{layer}._original_component.attn.o._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.mlp.input.weight -> transformer.h.X._original_component.mlp.input._original_component.weight + elif "mlp.input" in hf_key: + return f"transformer.h.{layer}._original_component.mlp.input._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.mlp.out.weight -> transformer.h.X._original_component.mlp.out._original_component.weight + elif "mlp.out" in hf_key: + return f"transformer.h.{layer}._original_component.mlp.out._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.ln1.weight -> transformer.h.X._original_component.ln1._original_component.weight + elif "ln1" in hf_key: + return f"transformer.h.{layer}._original_component.ln1._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.ln2.weight -> transformer.h.X._original_component.ln2._original_component.weight + elif "ln2" in hf_key: + return f"transformer.h.{layer}._original_component.ln2._original_component.{parts[-1]}" + + # Pattern: transformer.h.X.ln_2.weight -> transformer.h.X._original_component.ln_2._original_component.weight + elif "ln_2" in hf_key: + return f"transformer.h.{layer}._original_component.ln_2._original_component.{parts[-1]}" + + # Pattern: transformer.wte.weight -> transformer.wte._original_component.weight + elif hf_key == "transformer.wte.weight": + return "transformer.wte._original_component.weight" + + # Pattern: transformer.wpe.weight -> transformer.wpe._original_component.weight + elif hf_key == "transformer.wpe.weight": + return "transformer.wpe._original_component.weight" + + # Pattern: lm_head.weight -> lm_head._original_component.weight + elif hf_key == "lm_head.weight": + return "lm_head._original_component.weight" + + # Pattern: transformer.ln_f.bias -> transformer.ln_f._original_component.bias + elif "transformer.ln_f" 
in hf_key: + if "weight" in hf_key: + return "transformer.ln_f._original_component.weight" + elif "bias" in hf_key: + return "transformer.ln_f._original_component.bias" + + # If no pattern matches, return the original key + return hf_key diff --git a/transformer_lens/model_bridge/bridge.py b/transformer_lens/model_bridge/bridge.py index 65d6ccc7c..d324c6412 100644 --- a/transformer_lens/model_bridge/bridge.py +++ b/transformer_lens/model_bridge/bridge.py @@ -98,7 +98,8 @@ def __init__( tokenizer: The tokenizer to use (required) """ super().__init__() - self.original_model: nn.Module = model + # Set original_model directly in __dict__ to avoid any property issues + self.__dict__["original_model"] = model self.adapter = adapter self.cfg = adapter.cfg @@ -121,7 +122,9 @@ def __init__( raise ValueError("Adapter must have a component_mapping attribute") # Set original components on the pre-created bridge components - set_original_components(self, self.adapter, self.original_model) + # Access original_model directly from __dict__ to avoid __getattr__ issues + original_model = self.__dict__["original_model"] + set_original_components(self, self.adapter, original_model) # Initialize hook registry after components are set up self._initialize_hook_registry() @@ -265,9 +268,13 @@ def _add_aliases_to_hooks(self, hooks: Dict[str, HookPoint]) -> None: break continue else: - target_hook = resolve_alias(self, alias_name, {alias_name: target}) - if target_hook is not None: - hooks[alias_name] = target_hook + try: + target_hook = resolve_alias(self, alias_name, {alias_name: target}) + if target_hook is not None: + hooks[alias_name] = target_hook + except AttributeError: + # Skip this alias if it can't be resolved (e.g., during initialization) + continue def _scan_existing_hooks(self, module: nn.Module, prefix: str = "") -> None: """Scan existing modules for hooks and add them to registry.""" @@ -295,10 +302,30 @@ def scan_module(mod: nn.Module, path: str = "") -> None: for attr_name in dir(mod): if attr_name.startswith("_"): continue - if attr_name == "original_component" or "original_model": + if attr_name == "original_component" or attr_name == "original_model": + continue + + # Skip properties that might not be ready during initialization + if attr_name in [ + "OV", + "QK", + "W_V", + "W_O", + "W_Q", + "W_K", + "W_in", + "W_gate", + "W_out", + "b_V", + "b_O", + "b_Q", + "b_K", + "b_in", + "b_out", + ]: continue - attr = getattr(mod, attr_name) + attr = getattr(mod, attr_name) name = f"{path}.{attr_name}" if path else attr_name @@ -454,6 +481,7 @@ def set_hooks_to_cache( def __getattr__(self, name: str) -> Any: """Provide a clear error message for missing attributes.""" + # First check if the attribute is in __dict__ (direct attributes) if name in self.__dict__: return self.__dict__[name] @@ -463,7 +491,22 @@ def __getattr__(self, name: str) -> Any: if resolved_hook is not None: return resolved_hook - return super().__getattr__(name) + # Try to get from original_model if it exists + if "original_model" in self.__dict__ and self.__dict__["original_model"] is not None: + try: + name_split = name.split(".") + if len(name_split) > 1: + current = getattr(self.__dict__["original_model"], name_split[0]) + for part in name_split[1:]: + current = getattr(current, part) + return current + else: + return getattr(self.__dict__["original_model"], name) + except AttributeError: + pass + + # If we get here, the attribute wasn't found anywhere + raise AttributeError(f"'{type(self).__name__}' object has no attribute 
'{name}'") def _get_nested_attr(self, path: str) -> Any: """Get a nested attribute using dot notation.""" @@ -578,6 +621,7 @@ def set_compatibility_mode(component: Any) -> None: center_writing_weights=True, center_unembed=True, fold_value_biases=True, + refactor_factored_attn_matrices=False, # Keep unfactored format to match HuggingFace ) def process_weights( @@ -588,148 +632,73 @@ def process_weights( fold_value_biases: bool = True, refactor_factored_attn_matrices: bool = False, ): - """Apply weight processing transformations directly to HuggingFace tensor formats. + """Apply weight processing transformations using the centralized ProcessWeights class. - Keeps weights in HF format throughout and applies the same mathematical - transformations as ProcessWeights, adapted for HF tensor shapes. + This method extracts weights from the original HuggingFace model and applies weight processing + using the centralized ProcessWeights class with the architecture adapter to handle parameter + name translation from TransformerLens format to HuggingFace format. """ - import torch - - original_state_dict = self.original_model.state_dict() - - state_dict = {} - for key, tensor in original_state_dict.items(): - clean_key = key.replace("._original_component", "") - state_dict[clean_key] = tensor.clone() + # import torch + # import torch.nn as nn + + from transformer_lens.weight_processing import ProcessWeights + + # # Step 1: Extract HuggingFace weights from original model + hf_state_dict = self._extract_hf_weights() + + # # Step 2: Apply centralized weight processing with architecture adapter + # # The adapter will translate TransformerLens parameter names to HuggingFace parameter names + processed_hf_state_dict = ProcessWeights.process_weights( + hf_state_dict, + self.cfg, + fold_ln=fold_ln, + center_writing_weights=center_writing_weights, + center_unembed=center_unembed, + fold_value_biases=fold_value_biases, + refactor_factored_attn_matrices=refactor_factored_attn_matrices, + adapter=self.adapter, + ) + # # Step 3: Replace LayerNorm components with LayerNormPre-like operations if fold_ln is True + # This is equivalent to what HookedTransformer does when it replaces LayerNorm with LayerNormPre if fold_ln: - self._fold_layer_norm_hf_native(state_dict) - - if center_writing_weights: - self._center_writing_weights_hf_native(state_dict) + self._replace_layer_norm_with_identity(self.original_model) - if center_unembed: - self._center_unembed_hf_native(state_dict) + # # Step 4: Load processed weights into the original model using the bridge's load_state_dict method + # This handles the key mapping between clean keys and _original_component keys + # Use strict=False because weight processing may remove some keys (e.g., individual Q,K,V -> combined QKV) + self.load_state_dict(processed_hf_state_dict, strict=False, assign=True) - self._add_identity_layer_norm_params(state_dict) - self._load_processed_hf_weights(state_dict) - - def _fold_layer_norm_hf_native(self, state_dict): - """Fold LayerNorm into subsequent layers using HF tensor formats.""" - import torch + def _extract_hf_weights(self): + """Extract weights from the original HuggingFace model.""" + # Use the bridge's clean state_dict method which automatically filters out _original_component + hf_state_dict = self.state_dict() + # Remove separate Q, K, V weights if combined QKV weights exist + # This prevents the adapter from processing the same combined weight multiple times for layer_idx in range(self.cfg.n_layers): - # Fold LN1 into attention - 
ln1_weight = state_dict[f"transformer.h.{layer_idx}.ln_1.weight"] - ln1_bias = state_dict[f"transformer.h.{layer_idx}.ln_1.bias"] - - c_attn_weight = state_dict[f"transformer.h.{layer_idx}.attn.c_attn.weight"] - c_attn_bias = state_dict[f"transformer.h.{layer_idx}.attn.c_attn.bias"] - - # Split combined QKV for processing - d_model = self.cfg.d_model - q_weight = c_attn_weight[:, :d_model] - k_weight = c_attn_weight[:, d_model : 2 * d_model] - v_weight = c_attn_weight[:, 2 * d_model :] - - q_bias = c_attn_bias[:d_model] - k_bias = c_attn_bias[d_model : 2 * d_model] - v_bias = c_attn_bias[2 * d_model :] - - # Apply LayerNorm folding: fold biases, then weights, then center - q_bias = q_bias + torch.sum(q_weight * ln1_bias[:, None], dim=0) - k_bias = k_bias + torch.sum(k_weight * ln1_bias[:, None], dim=0) - v_bias = v_bias + torch.sum(v_weight * ln1_bias[:, None], dim=0) - - q_weight = q_weight * ln1_weight[:, None] - k_weight = k_weight * ln1_weight[:, None] - v_weight = v_weight * ln1_weight[:, None] - - q_weight = q_weight - torch.mean(q_weight, dim=0, keepdim=True) - k_weight = k_weight - torch.mean(k_weight, dim=0, keepdim=True) - v_weight = v_weight - torch.mean(v_weight, dim=0, keepdim=True) - - # Recombine and store - state_dict[f"transformer.h.{layer_idx}.attn.c_attn.weight"] = torch.cat( - [q_weight, k_weight, v_weight], dim=1 - ) - state_dict[f"transformer.h.{layer_idx}.attn.c_attn.bias"] = torch.cat( - [q_bias, k_bias, v_bias], dim=0 - ) - - del state_dict[f"transformer.h.{layer_idx}.ln_1.weight"] - del state_dict[f"transformer.h.{layer_idx}.ln_1.bias"] - - # Fold LN2 into MLP - ln2_weight = state_dict[f"transformer.h.{layer_idx}.ln_2.weight"] - ln2_bias = state_dict[f"transformer.h.{layer_idx}.ln_2.bias"] - - c_fc_weight = state_dict[f"transformer.h.{layer_idx}.mlp.c_fc.weight"] - c_fc_bias = state_dict[f"transformer.h.{layer_idx}.mlp.c_fc.bias"] - - c_fc_bias = c_fc_bias + torch.sum(c_fc_weight * ln2_bias[:, None], dim=0) - c_fc_weight = c_fc_weight * ln2_weight[:, None] - c_fc_weight = c_fc_weight - torch.mean(c_fc_weight, dim=0, keepdim=True) - - state_dict[f"transformer.h.{layer_idx}.mlp.c_fc.weight"] = c_fc_weight - state_dict[f"transformer.h.{layer_idx}.mlp.c_fc.bias"] = c_fc_bias - - del state_dict[f"transformer.h.{layer_idx}.ln_2.weight"] - del state_dict[f"transformer.h.{layer_idx}.ln_2.bias"] - - # Fold final LayerNorm into unembedding - ln_final_weight = state_dict["transformer.ln_f.weight"] - ln_final_bias = state_dict["transformer.ln_f.bias"] - - lm_head_weight = state_dict["lm_head.weight"] - - if "lm_head.bias" in state_dict: - lm_head_bias = state_dict["lm_head.bias"] - lm_head_bias = lm_head_bias + torch.sum(lm_head_weight * ln_final_bias[None, :], dim=1) - state_dict["lm_head.bias"] = lm_head_bias - - lm_head_weight = lm_head_weight * ln_final_weight[None, :] - state_dict["lm_head.weight"] = lm_head_weight - - del state_dict["transformer.ln_f.weight"] - del state_dict["transformer.ln_f.bias"] - - def _center_writing_weights_hf_native(self, state_dict): - """Center weights that write to the residual stream.""" - import torch - - # Center embedding weights - wte_weight = state_dict["transformer.wte.weight"] - wte_weight = wte_weight - torch.mean(wte_weight, dim=1, keepdim=True) - state_dict["transformer.wte.weight"] = wte_weight - - if "transformer.wpe.weight" in state_dict: - wpe_weight = state_dict["transformer.wpe.weight"] - wpe_weight = wpe_weight - torch.mean(wpe_weight, dim=1, keepdim=True) - state_dict["transformer.wpe.weight"] = wpe_weight - - # Center 
output weights that write to residual stream - for layer_idx in range(self.cfg.n_layers): - c_proj_weight = state_dict[f"transformer.h.{layer_idx}.attn.c_proj.weight"] - c_proj_weight = c_proj_weight - torch.mean(c_proj_weight, dim=1, keepdim=True) - state_dict[f"transformer.h.{layer_idx}.attn.c_proj.weight"] = c_proj_weight - - mlp_c_proj_weight = state_dict[f"transformer.h.{layer_idx}.mlp.c_proj.weight"] - mlp_c_proj_weight = mlp_c_proj_weight - torch.mean( - mlp_c_proj_weight, dim=1, keepdim=True - ) - state_dict[f"transformer.h.{layer_idx}.mlp.c_proj.weight"] = mlp_c_proj_weight - - def _center_unembed_hf_native(self, state_dict): - """Center unembedding weights.""" - import torch - - lm_head_weight = state_dict["lm_head.weight"] - lm_head_weight = lm_head_weight - torch.mean(lm_head_weight, dim=1, keepdim=True) - state_dict["lm_head.weight"] = lm_head_weight + combined_qkv_key = f"transformer.h.{layer_idx}.attn.c_attn.weight" + + if combined_qkv_key in hf_state_dict: + # Remove separate Q, K, V weights since we have combined QKV + separate_keys_to_remove = [ + f"transformer.h.{layer_idx}.attn.q.weight", + f"transformer.h.{layer_idx}.attn.q.bias", + f"transformer.h.{layer_idx}.attn.k.weight", + f"transformer.h.{layer_idx}.attn.k.bias", + f"transformer.h.{layer_idx}.attn.v.weight", + f"transformer.h.{layer_idx}.attn.v.bias", + ] + + for key_to_remove in separate_keys_to_remove: + if key_to_remove in hf_state_dict: + del hf_state_dict[key_to_remove] + + return hf_state_dict def _add_identity_layer_norm_params(self, processed_hf_state_dict): - """Add missing LayerNorm parameters as identity values. + """Add identity LayerNorm parameters after folding. After folding LayerNorm into other layers, HuggingFace models still expect LayerNorm parameters to exist. Set them to identity (weight=1, bias=0). 
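# --- Editor's illustrative sketch (hedged, not part of the diff above): why setting the
# leftover LayerNorm parameters to weight=1 / bias=0 is safe after folding. With identity
# parameters, nn.LayerNorm reduces to the pure centering-and-scaling that LayerNormPre
# applies, so the HuggingFace model keeps the parameter keys it expects without changing
# the computation. All names below are local to this sketch.
import torch
import torch.nn as nn

d_model = 8
x = torch.randn(2, 4, d_model)

ln = nn.LayerNorm(d_model, eps=1e-5)
with torch.no_grad():
    ln.weight.fill_(1.0)  # identity scale
    ln.bias.zero_()  # identity shift

# LayerNormPre-style normalization: center, then divide by the (biased) std.
mean = x.mean(dim=-1, keepdim=True)
var = (x - mean).pow(2).mean(dim=-1, keepdim=True)
normalized = (x - mean) / torch.sqrt(var + 1e-5)

assert torch.allclose(ln(x), normalized, atol=1e-6)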
@@ -742,274 +711,57 @@ def _add_identity_layer_norm_params(self, processed_hf_state_dict): ln2_weight_key = f"transformer.h.{layer_idx}.ln_2.weight" ln2_bias_key = f"transformer.h.{layer_idx}.ln_2.bias" - if ln1_weight_key not in processed_hf_state_dict: - processed_hf_state_dict[ln1_weight_key] = torch.ones(self.cfg.d_model) - if ln1_bias_key not in processed_hf_state_dict: - processed_hf_state_dict[ln1_bias_key] = torch.zeros(self.cfg.d_model) - if ln2_weight_key not in processed_hf_state_dict: - processed_hf_state_dict[ln2_weight_key] = torch.ones(self.cfg.d_model) - if ln2_bias_key not in processed_hf_state_dict: - processed_hf_state_dict[ln2_bias_key] = torch.zeros(self.cfg.d_model) + # Always add identity LayerNorm parameters (they were deleted by ProcessWeights.fold_layer_norm) + processed_hf_state_dict[ln1_weight_key] = torch.ones(self.cfg.d_model) + processed_hf_state_dict[ln1_bias_key] = torch.zeros(self.cfg.d_model) + processed_hf_state_dict[ln2_weight_key] = torch.ones(self.cfg.d_model) + processed_hf_state_dict[ln2_bias_key] = torch.zeros(self.cfg.d_model) ln_final_weight_key = "transformer.ln_f.weight" ln_final_bias_key = "transformer.ln_f.bias" - if ln_final_weight_key not in processed_hf_state_dict: - processed_hf_state_dict[ln_final_weight_key] = torch.ones(self.cfg.d_model) - if ln_final_bias_key not in processed_hf_state_dict: - processed_hf_state_dict[ln_final_bias_key] = torch.zeros(self.cfg.d_model) - - def _load_processed_hf_weights(self, processed_hf_state_dict): - """Load processed HuggingFace weights back into the original model.""" - # Get the original model's state dict with _original_component suffixes - original_state_dict = self.original_model.state_dict() + # Always add identity final LayerNorm parameters (they were deleted by ProcessWeights.fold_layer_norm) + processed_hf_state_dict[ln_final_weight_key] = torch.ones(self.cfg.d_model) + processed_hf_state_dict[ln_final_bias_key] = torch.zeros(self.cfg.d_model) - # Load processed weights into the original model components - for processed_key, processed_tensor in processed_hf_state_dict.items(): - # Find the corresponding key with _original_component suffix - for orig_key in original_state_dict.keys(): - if orig_key.replace("._original_component", "") == processed_key: - original_state_dict[orig_key].data.copy_(processed_tensor) - break + def _replace_layer_norm_with_identity(self, model): + """Replace LayerNorm components with LayerNormPre-like operations to maintain mathematical equivalence. - def _load_processed_weights_from_hf_dict(self, processed_hf_dict): - """Load processed weights (in HF format) back into the TransformerBridge. 
- - Args: - processed_hf_dict: Dictionary of processed weights in HuggingFace format - """ - # Load the processed weights back into the original model components - # This preserves the HF format without conversion - original_state_dict = self.original_model.state_dict() - - for key, processed_tensor in processed_hf_dict.items(): - # Find the corresponding key in the original model (with _original_component) - original_key = None - for orig_key in original_state_dict.keys(): - if orig_key.replace("._original_component", "") == key: - original_key = orig_key - break - - if original_key and original_key in original_state_dict: - # Load the processed tensor back into the original model - original_state_dict[original_key].data.copy_(processed_tensor) - - def _apply_weight_processing_inplace( - self, - fold_ln: bool = True, - center_writing_weights: bool = True, - center_unembed: bool = True, - fold_value_biases: bool = True, - refactor_factored_attn_matrices: bool = False, - ): - """Apply weight processing transformations directly to bridge components in HuggingFace format. - - This method applies the same transformations as ProcessWeights but works directly on the - bridge's components without converting tensor formats. + After folding LayerNorm into other layers, we need to replace the LayerNorm components + with operations that only apply normalization (centering and scaling) without learnable parameters. + This is equivalent to what HookedTransformer does when it replaces LayerNorm with LayerNormPre components. """ + import torch.nn as nn - # Step 1: Fold LayerNorm if requested (DISABLED for debugging) - if fold_ln: - # self._fold_layer_norm_inplace() - pass - - # Step 2: Center writing weights if requested - if center_writing_weights: - self._center_writing_weights_inplace() - - # Step 3: Center unembedding if requested (DISABLED for debugging) - if center_unembed: - # self._center_unembed_inplace() - pass - - # Step 4: Fold value biases if requested (DISABLED for debugging) - if fold_value_biases: - # self._fold_value_biases_inplace() - pass - - # Step 5: Refactor attention matrices if requested - if refactor_factored_attn_matrices: - self._refactor_factored_attn_matrices_inplace() - - def _fold_layer_norm_inplace(self): - """Fold LayerNorm weights into subsequent layers in-place.""" - # For now, implement a simple version - we can expand this later - # TODO: Implement LayerNorm folding logic for HF format - pass - - def _center_writing_weights_inplace(self): - """Center weights that write to the residual stream in-place.""" - - # Center embedding weights (W_E) - if hasattr(self, "embed") and hasattr(self.embed, "weight"): - embed_weight = self.embed.weight.data # HF format: [vocab_size, d_model] - # Subtract mean along d_model dimension (last dim = -1) - embed_mean = embed_weight.mean(dim=-1, keepdim=True) - self.embed.weight.data = embed_weight - embed_mean - - # Center positional embedding weights (W_pos) - if hasattr(self, "pos_embed") and hasattr(self.pos_embed, "weight"): - if getattr(self.cfg, "positional_embedding_type", "standard") != "rotary": - pos_weight = self.pos_embed.weight.data # HF format: [seq_len, d_model] - # Subtract mean along d_model dimension (last dim = -1) - pos_mean = pos_weight.mean(dim=-1, keepdim=True) - self.pos_embed.weight.data = pos_weight - pos_mean - - # Center attention output weights and biases (W_O, b_O) - for layer_idx in range(self.cfg.n_layers): - if layer_idx >= len(self.blocks): - continue - block = self.blocks[layer_idx] - - # Center attention 
output weights - if hasattr(block.attn, "o") and hasattr(block.attn.o, "weight"): - o_weight = block.attn.o.weight.data # HF format: [d_model, d_model] - # For writing weights, center along the last dimension (same as ProcessWeights) - o_mean = o_weight.mean(dim=-1, keepdim=True) - block.attn.o.weight.data = o_weight - o_mean - - # Center attention output biases - if ( - hasattr(block.attn, "o") - and hasattr(block.attn.o, "bias") - and block.attn.o.bias is not None - ): - o_bias = block.attn.o.bias.data - o_bias_mean = o_bias.mean() - block.attn.o.bias.data = o_bias - o_bias_mean - - # Center MLP output weights and biases (W_out, b_out) - if hasattr(block, "mlp") and not getattr(self.cfg, "attn_only", False): - # Handle different MLP component names (out vs output) - mlp_out_attr = ( - "out" - if hasattr(block.mlp, "out") - else "output" - if hasattr(block.mlp, "output") - else None - ) + # Import the proper LayerNormPre from HookedTransformer + from transformer_lens.components.layer_norm_pre import LayerNormPre + from transformer_lens.config.HookedTransformerConfig import ( + HookedTransformerConfig, + ) - if mlp_out_attr: - mlp_out = getattr(block.mlp, mlp_out_attr) - - # Center MLP output weights - if hasattr(mlp_out, "weight"): - mlp_weight = mlp_out.weight.data # HF format: [d_mlp, d_model] - # Subtract mean along the last dimension (d_model) - mlp_mean = mlp_weight.mean(dim=-1, keepdim=True) - mlp_out.weight.data = mlp_weight - mlp_mean - - # Center MLP output biases - if hasattr(mlp_out, "bias") and mlp_out.bias is not None: - mlp_bias = mlp_out.bias.data - mlp_bias_mean = mlp_bias.mean() - mlp_out.bias.data = mlp_bias - mlp_bias_mean - - def _center_unembed_inplace(self): - """Center unembedding weights in-place.""" - if hasattr(self, "unembed") and hasattr(self.unembed, "weight"): - # Center the unembedding weights (HF format: [vocab_size, d_model]) - unembed_weight = self.unembed.weight.data - # Subtract the mean along the d_model dimension (dim=1) - unembed_mean = unembed_weight.mean(dim=1, keepdim=True) - self.unembed.weight.data = unembed_weight - unembed_mean - - def _fold_value_biases_inplace(self): - """Fold value biases into output bias in-place.""" + # Create a compatible HookedTransformerConfig from the bridge config + hooked_config = HookedTransformerConfig( + d_model=self.cfg.d_model, + d_vocab=self.cfg.d_vocab, + n_layers=self.cfg.n_layers, + n_heads=self.cfg.n_heads, + d_head=self.cfg.d_head, + d_mlp=self.cfg.d_mlp, + eps=self.cfg.eps, + n_ctx=1024, # Default context length + device=self.cfg.device, + act_fn="gelu_new", # GPT-2 uses GELU; the value is unused by LayerNormPre but required by the config + attn_only=getattr(self.cfg, "attn_only", False), + ) + # Replace LayerNorm components in each layer for layer_idx in range(self.cfg.n_layers): - if layer_idx >= len(self.blocks): - continue - block = self.blocks[layer_idx] - - # Get value biases and output weights/biases - v_bias = None - w_o = None - b_o = None + # Replace ln_1 and ln_2 with LayerNormPre using proper constructor + model.transformer.h[layer_idx].ln_1 = LayerNormPre(hooked_config) + model.transformer.h[layer_idx].ln_2 = LayerNormPre(hooked_config) - # Find value biases - need to use the original HuggingFace structure - # In GPT-2, the original transformer uses combined qkv, so extract V bias from there - if ( - hasattr(block.attn, "qkv") - and hasattr(block.attn.qkv, "bias") - and block.attn.qkv.bias is not None - ): - # For combined qkv, extract the V portion - qkv_bias = block.attn.qkv.bias.data - d_head = self.cfg.d_head - n_heads = self.cfg.n_heads - # 
Split into Q, K, V portions (each is n_heads * d_head) - if qkv_bias.shape[0] == 3 * n_heads * d_head: - v_bias = qkv_bias[2 * n_heads * d_head :] # V is the last third - elif ( - hasattr(block.attn, "v") - and hasattr(block.attn.v, "bias") - and block.attn.v.bias is not None - ): - v_bias = block.attn.v.bias.data # HF format: [n_heads * d_head] or similar - - # Find output weights and biases - if hasattr(block.attn, "o"): - if hasattr(block.attn.o, "weight"): - w_o = block.attn.o.weight.data # HF format: [d_model, n_heads * d_head] - if hasattr(block.attn.o, "bias") and block.attn.o.bias is not None: - b_o = block.attn.o.bias.data # HF format: [d_model] - - # Apply the folding transformation if we have all components - if v_bias is not None and w_o is not None and b_o is not None: - try: - # Reshape v_bias to [n_heads, d_head] if needed - if v_bias.dim() == 1: - expected_size = self.cfg.n_heads * self.cfg.d_head - if v_bias.shape[0] != expected_size: - continue - v_bias = v_bias.view(self.cfg.n_heads, self.cfg.d_head) - - # Reshape w_o from HF format [d_model, n_heads * d_head] to [d_model, n_heads, d_head] - if w_o.dim() == 2: - expected_size = self.cfg.n_heads * self.cfg.d_head - if w_o.shape[1] != expected_size: - continue - w_o = w_o.view(w_o.shape[0], self.cfg.n_heads, self.cfg.d_head) - - # Compute the folded bias: b_O_new = b_O_original + sum_head(b_V_head @ W_O_head) - # v_bias: [n_heads, d_head], w_o: [d_model, n_heads, d_head] - # We want to compute sum over heads of (v_bias[h, :] @ w_o[:, h, :].T) for each head h - folded_contribution = torch.zeros_like(b_o) - for h in range(self.cfg.n_heads): - # v_bias[h]: [d_head], w_o[:, h]: [d_model, d_head] - # Compute v_bias[h] @ w_o[:, h].T = [d_model] - head_contribution = torch.matmul(w_o[:, h], v_bias[h]) - folded_contribution += head_contribution - - # Update the output bias - block.attn.o.bias.data = b_o + folded_contribution - - except Exception as e: - continue - - # Zero out the value biases (same logic as extraction) - if ( - hasattr(block.attn, "qkv") - and hasattr(block.attn.qkv, "bias") - and block.attn.qkv.bias is not None - ): - # Zero out only the V portion of the combined qkv bias - d_head = self.cfg.d_head - n_heads = self.cfg.n_heads - if block.attn.qkv.bias.shape[0] == 3 * n_heads * d_head: - block.attn.qkv.bias.data[2 * n_heads * d_head :].zero_() - elif ( - hasattr(block.attn, "v") - and hasattr(block.attn.v, "bias") - and block.attn.v.bias is not None - ): - block.attn.v.bias.data.zero_() - - def _refactor_factored_attn_matrices_inplace(self): - """Refactor factored attention matrices in-place.""" - # TODO: Implement attention matrix refactoring for HF format - pass + # Replace final LayerNorm with LayerNormPre + model.transformer.ln_f = LayerNormPre(hooked_config) def _load_processed_weights(self, processed_state_dict): """Load processed weights back into the TransformerBridge. 
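# --- Editor's illustrative sketch (hedged, not part of the diff above): the identity behind
# fold_value_biases, which the centralized ProcessWeights call now performs instead of the
# removed in-place helper. Because attention patterns sum to 1 over keys, a per-head value
# bias b_V[h] contributes the constant b_V[h] @ W_O[h] to the output, so it can be absorbed
# into b_O and then zeroed. Shapes follow TransformerLens conventions; every tensor here is
# a random stand-in local to this sketch.
import torch

n_heads, d_head, d_model, seq = 4, 8, 32, 5
W_O = torch.randn(n_heads, d_head, d_model)
b_V = torch.randn(n_heads, d_head)
b_O = torch.randn(d_model)
v = torch.randn(n_heads, seq, d_head)  # value vectors before the bias is added
pattern = torch.softmax(torch.randn(n_heads, seq, seq), dim=-1)  # rows sum to 1

# Original computation: bias added to every value vector, then mixed and projected.
z = pattern @ (v + b_V[:, None, :])
out_original = torch.einsum("hqd,hdm->qm", z, W_O) + b_O

# Folded computation: value bias dropped, b_O absorbs sum_h b_V[h] @ W_O[h].
b_O_folded = b_O + torch.einsum("hd,hdm->m", b_V, W_O)
out_folded = torch.einsum("hqd,hdm->qm", pattern @ v, W_O) + b_O_folded

assert torch.allclose(out_original, out_folded, atol=1e-5)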
@@ -1884,6 +1636,9 @@ def stop_hook(tensor: torch.Tensor, *, hook: Any) -> torch.Tensor: except StopAtLayerException as e: # Return the intermediate output from the specified layer output = e.layer_output + except Exception as e: + # Re-raise any other exceptions + raise e finally: for hp, _ in hooks: hp.remove_hooks() diff --git a/transformer_lens/model_bridge/generalized_components/base.py b/transformer_lens/model_bridge/generalized_components/base.py index 3afb404b3..22a852003 100644 --- a/transformer_lens/model_bridge/generalized_components/base.py +++ b/transformer_lens/model_bridge/generalized_components/base.py @@ -282,6 +282,24 @@ def __setattr__(self, name: str, value: Any) -> None: # Fall back to normal attribute setting super().__setattr__(name, value) + def load_state_dict(self, state_dict, strict=True, assign=False): + """Load state dict into the component, forwarding to the original component. + + Args: + state_dict: Dictionary containing a whole state of the module + strict: Whether to strictly enforce that the keys in state_dict match the keys returned by this module's state_dict() function + assign: Whether to assign items in the state dictionary to their corresponding keys in the module instead of copying them + + Returns: + NamedTuple with missing_keys and unexpected_keys fields + """ + if self.original_component is None: + raise RuntimeError( + f"Original component not set for {self.name}. Call set_original_component() first." + ) + # Forward the load_state_dict call to the original component + return self.original_component.load_state_dict(state_dict, strict=strict, assign=assign) + def has_bias(self) -> bool: """Check if the linear layer has a bias.""" if self.original_component is None: diff --git a/transformer_lens/model_bridge/generalized_components/embedding.py b/transformer_lens/model_bridge/generalized_components/embedding.py index f19873dba..c1e0fe8ce 100644 --- a/transformer_lens/model_bridge/generalized_components/embedding.py +++ b/transformer_lens/model_bridge/generalized_components/embedding.py @@ -52,6 +52,11 @@ def W_E(self) -> torch.Tensor: assert isinstance(weight, torch.Tensor), f"Weight is not a tensor for {self.name}" return weight + @property + def weight(self) -> torch.Tensor: + """Return the embedding weight matrix (alias for W_E).""" + return self.W_E + def forward( self, input_ids: torch.Tensor, diff --git a/transformer_lens/model_bridge/generalized_components/unembedding.py b/transformer_lens/model_bridge/generalized_components/unembedding.py index 75b9fd58e..e640d4a97 100644 --- a/transformer_lens/model_bridge/generalized_components/unembedding.py +++ b/transformer_lens/model_bridge/generalized_components/unembedding.py @@ -50,6 +50,11 @@ def W_U(self) -> torch.Tensor: assert isinstance(weight, torch.Tensor), f"Weight is not a tensor for {self.name}" return weight.T + @property + def weight(self) -> torch.Tensor: + """Return the unembedding weight matrix (alias for W_U).""" + return self.W_U + def forward( self, hidden_states: torch.Tensor, diff --git a/transformer_lens/model_bridge/supported_architectures/gpt2.py b/transformer_lens/model_bridge/supported_architectures/gpt2.py index b549b04e1..ed1dc4567 100644 --- a/transformer_lens/model_bridge/supported_architectures/gpt2.py +++ b/transformer_lens/model_bridge/supported_architectures/gpt2.py @@ -5,6 +5,7 @@ import torch from transformer_lens.conversion_utils.conversion_steps import ( + BaseHookConversion, HookConversionSet, RearrangeHookConversion, ) @@ -20,6 +21,94 @@ ) +class 
QKVSplitRearrangeConversion(BaseHookConversion): + """Custom conversion that splits QKV tensor and then rearranges.""" + + def __init__(self, qkv_index: int, rearrange_pattern: str, **axes_lengths): + """Initialize the conversion. + + Args: + qkv_index: Index of Q (0), K (1), or V (2) in the QKV tensor + rearrange_pattern: Einops pattern for rearrangement + **axes_lengths: Additional axes lengths for einops + """ + super().__init__() + self.qkv_index = qkv_index + self.rearrange_pattern = rearrange_pattern + self.axes_lengths = axes_lengths + + def handle_conversion(self, input_value: torch.Tensor, *full_context) -> torch.Tensor: + """Split QKV tensor and rearrange the selected part.""" + # Determine the split dimension based on tensor shape + if len(input_value.shape) == 2: + # Weight tensor: [d_model, 3*d_model] -> split along dim=1 + split_dim = 1 + elif len(input_value.shape) == 1: + # Bias tensor: [3*n_heads*d_head] -> split along dim=0 + split_dim = 0 + else: + raise ValueError(f"Unexpected tensor shape: {input_value.shape}") + + # Split the QKV tensor + qkv_parts = torch.chunk(input_value, 3, dim=split_dim) + selected_part = qkv_parts[self.qkv_index] + + # Apply rearrangement + import einops + + return einops.rearrange(selected_part, self.rearrange_pattern, **self.axes_lengths) + + def revert(self, input_value: torch.Tensor, *full_context) -> torch.Tensor: + """Revert the conversion (not fully implemented for QKV case).""" + # This is complex for QKV case since we need to reconstruct the full tensor + # For now, just return the input + return input_value + + def __repr__(self): + return f'QKVSplitRearrangeConversion(qkv_index={self.qkv_index}, pattern="{self.rearrange_pattern}")' + + +class QKVBiasConversion(BaseHookConversion): + """Custom conversion for QKV biases that matches the original GPT-2 logic.""" + + def __init__(self, qkv_index: int, n_heads: int, d_head: int): + """Initialize the conversion. 
+ + Args: + qkv_index: Index of Q (0), K (1), or V (2) in the QKV tensor + n_heads: Number of attention heads + d_head: Dimension of each head + """ + super().__init__() + self.qkv_index = qkv_index + self.n_heads = n_heads + self.d_head = d_head + + def handle_conversion(self, input_value: torch.Tensor, *full_context) -> torch.Tensor: + """Convert QKV bias following the original GPT-2 logic.""" + import einops + + # Original logic: rearrange the entire bias tensor first, then split by QKV + qkv_bias = einops.rearrange( + input_value, + "(qkv index head)->qkv index head", + qkv=3, + index=self.n_heads, + head=self.d_head, + ) + # Return the selected QKV part + return qkv_bias[self.qkv_index] + + def revert(self, input_value: torch.Tensor, *full_context) -> torch.Tensor: + """Revert the conversion (not fully implemented for QKV case).""" + # This is complex for QKV case since we need to reconstruct the full tensor + # For now, just return the input + return input_value + + def __repr__(self): + return f"QKVBiasConversion(qkv_index={self.qkv_index}, n_heads={self.n_heads}, d_head={self.d_head})" + + class GPT2ArchitectureAdapter(ArchitectureAdapter): """Architecture adapter for GPT2 models.""" @@ -33,53 +122,139 @@ def __init__(self, cfg: Any) -> None: "uses_split_attention": True, # GPT-2 uses combined QKV attention that needs splitting } + # GPT-2 uses combined QKV weights in HuggingFace format + self.uses_combined_qkv = True + + # Set config variable to indicate that attention weights are split (use TransformerLens format processing) + self.cfg.split_attention_weights = True + self.conversion_rules = HookConversionSet( { + # Original parameter names (for compatibility) "pos_embed.pos": "transformer.wpe.weight", "embed.e": "transformer.wte.weight", - "blocks.{i}.ln1.w": "transformer.h.{i}.ln_1.weight", - "blocks.{i}.ln1.b": "transformer.h.{i}.ln_1.bias", - "blocks.{i}.attn.q": ( + "blocks.{i}.ln1.weight": "transformer.h.{i}.ln_1.weight", + "blocks.{i}.ln1.bias": "transformer.h.{i}.ln_1.bias", + "blocks.{i}.attn.q.weight": ( "transformer.h.{i}.attn.c_attn.weight", RearrangeHookConversion( - "m (three n h) -> three n m h", - three=3, + "(n h) m-> n m h", n=self.cfg.n_heads, ), ), - "blocks.{i}.attn.k": ( + "blocks.{i}.attn.k.weight": ( "transformer.h.{i}.attn.c_attn.weight", RearrangeHookConversion( - "m (three n h) -> three n m h", - three=3, + "(n h) m-> n m h", n=self.cfg.n_heads, ), ), - "blocks.{i}.attn.v": ( + "blocks.{i}.attn.v.weight": ( "transformer.h.{i}.attn.c_attn.weight", RearrangeHookConversion( - "m (three n h) -> three n m h", - three=3, + "(n h) m-> n m h", n=self.cfg.n_heads, ), ), - "blocks.{i}.attn.o": ( + "blocks.{i}.attn.o.weight": ( "transformer.h.{i}.attn.c_proj.weight", RearrangeHookConversion("(n h) m -> n h m", n=self.cfg.n_heads), ), - "blocks.{i}.attn.b_Q": "transformer.h.{i}.attn.c_attn.bias", - "blocks.{i}.attn.b_K": "transformer.h.{i}.attn.c_attn.bias", - "blocks.{i}.attn.b_V": "transformer.h.{i}.attn.c_attn.bias", + "blocks.{i}.attn.q.bias": ( + "transformer.h.{i}.attn.c_attn.bias", + RearrangeHookConversion("(n d_head) -> n d_head", n=self.cfg.n_heads), + ), + "blocks.{i}.attn.k.bias": ( + "transformer.h.{i}.attn.c_attn.bias", + RearrangeHookConversion("(n d_head) -> n d_head", n=self.cfg.n_heads), + ), + "blocks.{i}.attn.v.bias": ( + "transformer.h.{i}.attn.c_attn.bias", + RearrangeHookConversion("(n d_head) -> n d_head", n=self.cfg.n_heads), + ), + "blocks.{i}.attn.o.bias": "transformer.h.{i}.attn.c_proj.bias", + "blocks.{i}.ln2.weight": 
"transformer.h.{i}.ln_2.weight", + "blocks.{i}.ln2.bias": "transformer.h.{i}.ln_2.bias", + "blocks.{i}.mlp.input.weight": "transformer.h.{i}.mlp.c_fc.weight", + "blocks.{i}.mlp.input.bias": "transformer.h.{i}.mlp.c_fc.bias", + "blocks.{i}.mlp.out": "transformer.h.{i}.mlp.c_proj.weight", + "blocks.{i}.mlp.b_out": "transformer.h.{i}.mlp.c_proj.bias", + "ln_final.weight": "transformer.ln_f.weight", + "ln_final.bias": "transformer.ln_f.bias", + "unembed.weight": ( + "lm_head.weight", + RearrangeHookConversion("d_model d_vocab -> d_vocab d_model"), + ), + "unembed.bias": "lm_head.bias", + # TransformerLens parameter names (for weight processing functions) + "blocks.{i}.attn.W_Q": ( + "transformer.h.{i}.attn.c_attn.weight", + QKVSplitRearrangeConversion( + qkv_index=0, # Q is the first part + rearrange_pattern="m (i h) -> i m h", + i=self.cfg.n_heads, + ), + ), + "blocks.{i}.attn.W_K": ( + "transformer.h.{i}.attn.c_attn.weight", + QKVSplitRearrangeConversion( + qkv_index=1, # K is the second part + rearrange_pattern="m (i h) -> i m h", + i=self.cfg.n_heads, + ), + ), + "blocks.{i}.attn.W_V": ( + "transformer.h.{i}.attn.c_attn.weight", + QKVSplitRearrangeConversion( + qkv_index=2, # V is the third part + rearrange_pattern="m (i h) -> i m h", + i=self.cfg.n_heads, + ), + ), + "blocks.{i}.attn.W_O": ( + "transformer.h.{i}.attn.c_proj.weight", + RearrangeHookConversion("(i h) m -> i h m", i=self.cfg.n_heads), + ), + "blocks.{i}.attn.b_Q": ( + "transformer.h.{i}.attn.c_attn.bias", + QKVBiasConversion( + qkv_index=0, # Q bias is the first part + n_heads=self.cfg.n_heads, + d_head=self.cfg.d_head, + ), + ), + "blocks.{i}.attn.b_K": ( + "transformer.h.{i}.attn.c_attn.bias", + QKVBiasConversion( + qkv_index=1, # K bias is the second part + n_heads=self.cfg.n_heads, + d_head=self.cfg.d_head, + ), + ), + "blocks.{i}.attn.b_V": ( + "transformer.h.{i}.attn.c_attn.bias", + QKVBiasConversion( + qkv_index=2, # V bias is the third part + n_heads=self.cfg.n_heads, + d_head=self.cfg.d_head, + ), + ), "blocks.{i}.attn.b_O": "transformer.h.{i}.attn.c_proj.bias", + "blocks.{i}.ln1.w": "transformer.h.{i}.ln_1.weight", + "blocks.{i}.ln1.b": "transformer.h.{i}.ln_1.bias", "blocks.{i}.ln2.w": "transformer.h.{i}.ln_2.weight", "blocks.{i}.ln2.b": "transformer.h.{i}.ln_2.bias", - "blocks.{i}.mlp.in": "transformer.h.{i}.mlp.c_fc.weight", + "blocks.{i}.mlp.W_in": "transformer.h.{i}.mlp.c_fc.weight", + "blocks.{i}.mlp.W_out": "transformer.h.{i}.mlp.c_proj.weight", "blocks.{i}.mlp.b_in": "transformer.h.{i}.mlp.c_fc.bias", - "blocks.{i}.mlp.out": "transformer.h.{i}.mlp.c_proj.weight", "blocks.{i}.mlp.b_out": "transformer.h.{i}.mlp.c_proj.bias", "ln_final.w": "transformer.ln_f.weight", "ln_final.b": "transformer.ln_f.bias", - "unembed.u": "lm_head.weight", + "unembed.W_U": ( + "lm_head.weight", + RearrangeHookConversion("d_model d_vocab -> d_vocab d_model"), + ), + "unembed.b_U": "lm_head.bias", } ) @@ -103,7 +278,7 @@ def __init__(self, cfg: Any) -> None: "mlp": MLPBridge( name="mlp", submodules={ - "in": LinearBridge(name="c_fc"), + "input": LinearBridge(name="c_fc"), "out": LinearBridge(name="c_proj"), }, ),