Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
29 commits
Select commit Hold shift + click to select a range
f47dbb9
updating loading in stable lm demo to use transformer bridge
degenfabian Aug 19, 2025
8a7f3a6
add stable_lm demo to CI
degenfabian Aug 19, 2025
f44faa6
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Aug 20, 2025
a99dfb6
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Aug 22, 2025
06c0732
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Aug 26, 2025
ebc1feb
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 4, 2025
1a0f780
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 5, 2025
2fdd6e0
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 6, 2025
59f7fe2
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 7, 2025
e53db49
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 10, 2025
69f9e7c
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 10, 2025
e8516b4
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 12, 2025
e0914a1
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 12, 2025
b069985
Merge remote-tracking branch 'origin/dev-3.x' into stable_lm_demo_tra…
bryce13950 Sep 12, 2025
1904dce
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 10, 2025
17f27e8
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 13, 2025
d1d7af3
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 14, 2025
49a1695
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 14, 2025
4854ab6
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 15, 2025
6a3de9f
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 15, 2025
18c7177
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 15, 2025
de0f324
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 16, 2025
bf93d3b
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 16, 2025
2be7624
fixed booting
bryce13950 Oct 16, 2025
7057314
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 16, 2025
15a1e48
added dtype selction
bryce13950 Oct 16, 2025
824e3d3
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 16, 2025
a2fc9a5
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 16, 2025
7de0ec2
Merge remote-tracking branch 'origin/dev-3.x-folding' into stable_lm_…
bryce13950 Oct 17, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .github/workflows/checks.yml
Original file line number Diff line number Diff line change
Expand Up @@ -237,6 +237,7 @@ jobs:
# - "No_Position_Experiment"
- "Othello_GPT"
- "Patchscopes_Generation_Demo"
- "stable_lm"
# - "T5"
steps:
- uses: actions/checkout@v3
Expand Down
12 changes: 7 additions & 5 deletions demos/stable_lm.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -60,21 +60,22 @@
},
{
"cell_type": "code",
"execution_count": 2,
"execution_count": null,
"metadata": {
"id": "PXB6xkimoH2h"
},
"outputs": [],
"source": [
"import torch\n",
"from transformer_lens import HookedTransformer\n",
"from transformer_lens.model_bridge import TransformerBridge\n",
"\n",
"device = \"cuda\" if torch.cuda.is_available() else \"cpu\""
"device = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
"dtype = torch.bfloat16 if torch.cuda.is_available() else torch.float32"
]
},
{
"cell_type": "code",
"execution_count": 3,
"execution_count": null,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
Expand Down Expand Up @@ -355,7 +356,8 @@
"source": [
"# Load the 3 billion parameters version in 16 bits\n",
"# You can increase the precision or the size if you have enough GPU RAM available\n",
"model = HookedTransformer.from_pretrained(\"stabilityai/stablelm-tuned-alpha-3b\", torch_dtype=torch.bfloat16, device=device)"
"model = TransformerBridge.boot_transformers(\"stabilityai/stablelm-tuned-alpha-3b\", dtype=dtype, device=device)\n",
"model.enable_compatibility_mode()"
]
},
{
Expand Down
Loading