Coverage for transformer_lens/model_bridge/supported_architectures/__init__.py: 100%
55 statements
« prev ^ index » next coverage.py v7.10.1, created at 2026-04-30 01:33 +0000
« prev ^ index » next coverage.py v7.10.1, created at 2026-04-30 01:33 +0000
"""Supported architecture adapters.

This package re-exports the architecture adapter class for each supported model architecture.
"""
6from transformer_lens.model_bridge.supported_architectures.apertus import (
7 ApertusArchitectureAdapter,
8)
9from transformer_lens.model_bridge.supported_architectures.baichuan import (
10 BaichuanArchitectureAdapter,
11)
12from transformer_lens.model_bridge.supported_architectures.bert import (
13 BertArchitectureAdapter,
14)
15from transformer_lens.model_bridge.supported_architectures.bloom import (
16 BloomArchitectureAdapter,
17)
18from transformer_lens.model_bridge.supported_architectures.codegen import (
19 CodeGenArchitectureAdapter,
20)
21from transformer_lens.model_bridge.supported_architectures.cohere import (
22 CohereArchitectureAdapter,
23)
24from transformer_lens.model_bridge.supported_architectures.deepseek_v3 import (
25 DeepSeekV3ArchitectureAdapter,
26)
27from transformer_lens.model_bridge.supported_architectures.falcon import (
28 FalconArchitectureAdapter,
29)
30from transformer_lens.model_bridge.supported_architectures.gemma1 import (
31 Gemma1ArchitectureAdapter,
32)
33from transformer_lens.model_bridge.supported_architectures.gemma2 import (
34 Gemma2ArchitectureAdapter,
35)
36from transformer_lens.model_bridge.supported_architectures.gemma3 import (
37 Gemma3ArchitectureAdapter,
38)
39from transformer_lens.model_bridge.supported_architectures.gemma3_multimodal import (
40 Gemma3MultimodalArchitectureAdapter,
41)
42from transformer_lens.model_bridge.supported_architectures.gpt2 import (
43 GPT2ArchitectureAdapter,
44)
45from transformer_lens.model_bridge.supported_architectures.gpt_bigcode import (
46 GPTBigCodeArchitectureAdapter,
47)
48from transformer_lens.model_bridge.supported_architectures.gpt2_lm_head_custom import (
49 Gpt2LmHeadCustomArchitectureAdapter,
50)
51from transformer_lens.model_bridge.supported_architectures.gpt_oss import (
52 GPTOSSArchitectureAdapter,
53)
54from transformer_lens.model_bridge.supported_architectures.gptj import (
55 GptjArchitectureAdapter,
56)
57from transformer_lens.model_bridge.supported_architectures.granite import (
58 GraniteArchitectureAdapter,
59)
60from transformer_lens.model_bridge.supported_architectures.granite_moe import (
61 GraniteMoeArchitectureAdapter,
62)
63from transformer_lens.model_bridge.supported_architectures.granite_moe_hybrid import (
64 GraniteMoeHybridArchitectureAdapter,
65)
66from transformer_lens.model_bridge.supported_architectures.hubert import (
67 HubertArchitectureAdapter,
68)
69from transformer_lens.model_bridge.supported_architectures.internlm2 import (
70 InternLM2ArchitectureAdapter,
71)
72from transformer_lens.model_bridge.supported_architectures.llama import (
73 LlamaArchitectureAdapter,
74)
75from transformer_lens.model_bridge.supported_architectures.llava import (
76 LlavaArchitectureAdapter,
77)
78from transformer_lens.model_bridge.supported_architectures.llava_next import (
79 LlavaNextArchitectureAdapter,
80)
81from transformer_lens.model_bridge.supported_architectures.llava_onevision import (
82 LlavaOnevisionArchitectureAdapter,
83)
84from transformer_lens.model_bridge.supported_architectures.mamba import (
85 MambaArchitectureAdapter,
86)
87from transformer_lens.model_bridge.supported_architectures.mamba2 import (
88 Mamba2ArchitectureAdapter,
89)
90from transformer_lens.model_bridge.supported_architectures.mingpt import (
91 MingptArchitectureAdapter,
92)
93from transformer_lens.model_bridge.supported_architectures.mistral import (
94 MistralArchitectureAdapter,
95)
96from transformer_lens.model_bridge.supported_architectures.mixtral import (
97 MixtralArchitectureAdapter,
98)
99from transformer_lens.model_bridge.supported_architectures.mpt import (
100 MPTArchitectureAdapter,
101)
102from transformer_lens.model_bridge.supported_architectures.nanogpt import (
103 NanogptArchitectureAdapter,
104)
105from transformer_lens.model_bridge.supported_architectures.neel_solu_old import (
106 NeelSoluOldArchitectureAdapter,
107)
108from transformer_lens.model_bridge.supported_architectures.neo import (
109 NeoArchitectureAdapter,
110)
111from transformer_lens.model_bridge.supported_architectures.neox import (
112 NeoxArchitectureAdapter,
113)
114from transformer_lens.model_bridge.supported_architectures.olmo import (
115 OlmoArchitectureAdapter,
116)
117from transformer_lens.model_bridge.supported_architectures.olmo2 import (
118 Olmo2ArchitectureAdapter,
119)
120from transformer_lens.model_bridge.supported_architectures.olmo3 import (
121 Olmo3ArchitectureAdapter,
122)
123from transformer_lens.model_bridge.supported_architectures.olmoe import (
124 OlmoeArchitectureAdapter,
125)
126from transformer_lens.model_bridge.supported_architectures.openelm import (
127 OpenElmArchitectureAdapter,
128)
129from transformer_lens.model_bridge.supported_architectures.opt import (
130 OptArchitectureAdapter,
131)
132from transformer_lens.model_bridge.supported_architectures.phi import (
133 PhiArchitectureAdapter,
134)
135from transformer_lens.model_bridge.supported_architectures.phi3 import (
136 Phi3ArchitectureAdapter,
137)
138from transformer_lens.model_bridge.supported_architectures.pythia import (
139 PythiaArchitectureAdapter,
140)
141from transformer_lens.model_bridge.supported_architectures.qwen import (
142 QwenArchitectureAdapter,
143)
144from transformer_lens.model_bridge.supported_architectures.qwen2 import (
145 Qwen2ArchitectureAdapter,
146)
147from transformer_lens.model_bridge.supported_architectures.qwen3 import (
148 Qwen3ArchitectureAdapter,
149)
150from transformer_lens.model_bridge.supported_architectures.qwen3_moe import (
151 Qwen3MoeArchitectureAdapter,
152)
153from transformer_lens.model_bridge.supported_architectures.qwen3_next import (
154 Qwen3NextArchitectureAdapter,
155)
156from transformer_lens.model_bridge.supported_architectures.qwen3_5 import (
157 Qwen3_5ArchitectureAdapter,
158)
159from transformer_lens.model_bridge.supported_architectures.stablelm import (
160 StableLmArchitectureAdapter,
161)
162from transformer_lens.model_bridge.supported_architectures.t5 import (
163 T5ArchitectureAdapter,
164)
165from transformer_lens.model_bridge.supported_architectures.xglm import (
166 XGLMArchitectureAdapter,
167)
# Public API of this package: one adapter class name per supported
# architecture. Each entry corresponds to a class imported at the top of this
# module, and the list determines what `from <package> import *` exposes.
# Entry order is kept exactly as in the original listing.
__all__ = [
    "ApertusArchitectureAdapter",
    "BaichuanArchitectureAdapter",
    "BertArchitectureAdapter",
    "BloomArchitectureAdapter",
    "CodeGenArchitectureAdapter",
    "CohereArchitectureAdapter",
    "DeepSeekV3ArchitectureAdapter",
    "FalconArchitectureAdapter",
    "Gemma1ArchitectureAdapter",
    "Gemma2ArchitectureAdapter",
    "Gemma3ArchitectureAdapter",
    "Gemma3MultimodalArchitectureAdapter",
    "GraniteArchitectureAdapter",
    "GraniteMoeArchitectureAdapter",
    "GraniteMoeHybridArchitectureAdapter",
    "GPT2ArchitectureAdapter",
    "GPTBigCodeArchitectureAdapter",
    "GPTOSSArchitectureAdapter",
    "Gpt2LmHeadCustomArchitectureAdapter",
    "GptjArchitectureAdapter",
    "HubertArchitectureAdapter",
    "InternLM2ArchitectureAdapter",
    "LlamaArchitectureAdapter",
    "LlavaArchitectureAdapter",
    "LlavaNextArchitectureAdapter",
    "LlavaOnevisionArchitectureAdapter",
    "MambaArchitectureAdapter",
    "Mamba2ArchitectureAdapter",
    "MingptArchitectureAdapter",
    "MistralArchitectureAdapter",
    "MixtralArchitectureAdapter",
    "MPTArchitectureAdapter",
    "NanogptArchitectureAdapter",
    "NeelSoluOldArchitectureAdapter",
    "NeoArchitectureAdapter",
    "NeoxArchitectureAdapter",
    "OpenElmArchitectureAdapter",
    "OlmoArchitectureAdapter",
    "Olmo2ArchitectureAdapter",
    "Olmo3ArchitectureAdapter",
    "OlmoeArchitectureAdapter",
    "OptArchitectureAdapter",
    "PhiArchitectureAdapter",
    "Phi3ArchitectureAdapter",
    "PythiaArchitectureAdapter",
    "QwenArchitectureAdapter",
    "Qwen2ArchitectureAdapter",
    "Qwen3ArchitectureAdapter",
    "Qwen3MoeArchitectureAdapter",
    "Qwen3NextArchitectureAdapter",
    "Qwen3_5ArchitectureAdapter",
    "StableLmArchitectureAdapter",
    "T5ArchitectureAdapter",
    "XGLMArchitectureAdapter",
]