Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
21 commits
Select commit Hold shift + click to select a range
805e37d
updating loading in qwen demo to use transformer bridge
degenfabian Aug 19, 2025
abcd7c1
add qwen demo to CI
degenfabian Aug 19, 2025
3884f30
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Aug 20, 2025
70497be
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Aug 22, 2025
16ed10b
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Aug 26, 2025
2212cbe
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 4, 2025
a749b16
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 5, 2025
c88f831
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 6, 2025
3cd158c
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 7, 2025
b20294d
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 10, 2025
d576791
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 10, 2025
9a2d414
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 12, 2025
05db7d6
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 12, 2025
0858bf8
Merge remote-tracking branch 'origin/dev-3.x' into qwen_demo_transfor…
bryce13950 Sep 12, 2025
64a10bd
Merge remote-tracking branch 'origin/dev-3.x-folding' into qwen_demo_…
bryce13950 Oct 15, 2025
30ea8f6
Merge remote-tracking branch 'origin/dev-3.x-folding' into qwen_demo_…
bryce13950 Oct 16, 2025
36eccb9
Merge remote-tracking branch 'origin/dev-3.x-folding' into qwen_demo_…
bryce13950 Oct 16, 2025
a28f5ba
Merge remote-tracking branch 'origin/dev-3.x-folding' into qwen_demo_…
bryce13950 Oct 16, 2025
d482eef
Merge remote-tracking branch 'origin/dev-3.x-folding' into qwen_demo_…
bryce13950 Oct 16, 2025
e84409b
Merge remote-tracking branch 'origin/dev-3.x-folding' into qwen_demo_…
bryce13950 Oct 17, 2025
cc1ccfb
Merge remote-tracking branch 'origin/dev-3.x-folding' into qwen_demo_…
bryce13950 Nov 12, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .github/workflows/checks.yml
Original file line number Diff line number Diff line change
Expand Up @@ -238,6 +238,7 @@ jobs:
# - "No_Position_Experiment"
- "Othello_GPT"
- "Patchscopes_Generation_Demo"
- "Qwen"
# - "T5"
steps:
- uses: actions/checkout@v3
Expand Down
14 changes: 8 additions & 6 deletions demos/Qwen.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -154,7 +154,7 @@
},
{
"cell_type": "code",
"execution_count": 4,
"execution_count": null,
"metadata": {},
"outputs": [
{
Expand All @@ -171,7 +171,7 @@
"torch.set_grad_enabled(False)\n",
"\n",
"from transformers import AutoTokenizer\n",
"from transformer_lens import HookedTransformer\n",
"from transformer_lens.model_bridge import TransformerBridge\n",
"from transformers import AutoModelForCausalLM, AutoTokenizer\n",
"from transformers.generation import GenerationConfig\n",
"\n",
Expand Down Expand Up @@ -208,7 +208,7 @@
},
{
"cell_type": "code",
"execution_count": 6,
"execution_count": null,
"metadata": {},
"outputs": [
{
Expand Down Expand Up @@ -283,12 +283,13 @@
" trust_remote_code = True\n",
").eval()\n",
"\n",
"tl_model = HookedTransformer.from_pretrained_no_processing(\n",
"tl_model = TransformerBridge.boot_transformers(\n",
" model_path,\n",
" device=device,\n",
" fp32=True,\n",
" dtype=torch.float32,\n",
").to(device)\n",
"tl_model.enable_compatibility_mode()\n",
"\n",
"assert_hf_and_tl_model_are_close(hf_model, tl_model, tokenizer)"
]
Expand All @@ -302,7 +303,7 @@
},
{
"cell_type": "code",
"execution_count": 7,
"execution_count": null,
"metadata": {},
"outputs": [
{
Expand Down Expand Up @@ -335,11 +336,12 @@
" device_map=device,\n",
").eval()\n",
"\n",
"tl_model = HookedTransformer.from_pretrained_no_processing(\n",
"tl_model = TransformerBridge.boot_transformers(\n",
" model_path,\n",
" device=device,\n",
" dtype=torch.float32,\n",
").to(device)\n",
"tl_model.enable_compatibility_mode()\n",
"\n",
"assert_hf_and_tl_model_are_close(hf_model, tl_model, tokenizer)"
]
Expand Down
Loading