| transformer_lens/ActivationCache.py |
313 |
12 |
0 |
170 |
13 |
93% |
| transformer_lens/BertNextSentencePrediction.py |
59 |
1 |
38 |
14 |
2 |
96% |
| transformer_lens/FactoredMatrix.py |
126 |
3 |
34 |
32 |
3 |
95% |
| transformer_lens/HookedAudioEncoder.py |
232 |
63 |
12 |
90 |
20 |
62% |
| transformer_lens/HookedEncoder.py |
191 |
62 |
40 |
44 |
5 |
60% |
| transformer_lens/HookedEncoderDecoder.py |
273 |
171 |
32 |
100 |
0 |
27% |
| transformer_lens/HookedTransformer.py |
721 |
167 |
80 |
350 |
57 |
71% |
| transformer_lens/SVDInterpreter.py |
55 |
1 |
0 |
14 |
1 |
97% |
| transformer_lens/__init__.py |
19 |
2 |
0 |
0 |
0 |
89% |
| transformer_lens/benchmarks/__init__.py |
11 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/benchmarks/activation_cache.py |
69 |
15 |
0 |
36 |
14 |
72% |
| transformer_lens/benchmarks/audio.py |
160 |
160 |
0 |
66 |
0 |
0% |
| transformer_lens/benchmarks/backward_gradients.py |
199 |
41 |
0 |
110 |
33 |
72% |
| transformer_lens/benchmarks/component_benchmark.py |
34 |
20 |
0 |
18 |
3 |
33% |
| transformer_lens/benchmarks/component_outputs.py |
400 |
179 |
0 |
182 |
35 |
52% |
| transformer_lens/benchmarks/forward_pass.py |
103 |
59 |
0 |
48 |
11 |
36% |
| transformer_lens/benchmarks/generation.py |
43 |
10 |
0 |
16 |
7 |
71% |
| transformer_lens/benchmarks/granular_weight_processing.py |
161 |
161 |
0 |
84 |
0 |
0% |
| transformer_lens/benchmarks/hook_registration.py |
238 |
66 |
0 |
122 |
36 |
68% |
| transformer_lens/benchmarks/hook_structure.py |
152 |
141 |
0 |
88 |
0 |
5% |
| transformer_lens/benchmarks/main_benchmark.py |
971 |
585 |
0 |
552 |
140 |
35% |
| transformer_lens/benchmarks/multimodal.py |
89 |
89 |
0 |
38 |
0 |
0% |
| transformer_lens/benchmarks/text_quality.py |
110 |
17 |
0 |
38 |
14 |
78% |
| transformer_lens/benchmarks/utils.py |
155 |
63 |
0 |
58 |
10 |
56% |
| transformer_lens/benchmarks/weight_processing.py |
322 |
136 |
0 |
152 |
44 |
52% |
| transformer_lens/cache/__init__.py |
1 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/cache/key_value_cache.py |
37 |
4 |
2 |
10 |
1 |
85% |
| transformer_lens/cache/key_value_cache_entry.py |
21 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/components/__init__.py |
22 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/components/abstract_attention.py |
341 |
116 |
0 |
122 |
38 |
62% |
| transformer_lens/components/attention.py |
20 |
4 |
0 |
4 |
2 |
75% |
| transformer_lens/components/bert_block.py |
45 |
4 |
0 |
2 |
1 |
89% |
| transformer_lens/components/bert_embed.py |
30 |
9 |
0 |
2 |
0 |
66% |
| transformer_lens/components/bert_mlm_head.py |
19 |
3 |
0 |
0 |
0 |
84% |
| transformer_lens/components/bert_nsp_head.py |
16 |
1 |
0 |
0 |
0 |
94% |
| transformer_lens/components/bert_pooler.py |
19 |
3 |
0 |
0 |
0 |
84% |
| transformer_lens/components/embed.py |
17 |
1 |
0 |
4 |
2 |
86% |
| transformer_lens/components/grouped_query_attention.py |
66 |
7 |
0 |
6 |
1 |
89% |
| transformer_lens/components/layer_norm.py |
25 |
1 |
0 |
4 |
1 |
93% |
| transformer_lens/components/layer_norm_pre.py |
19 |
1 |
0 |
2 |
1 |
90% |
| transformer_lens/components/mlps/can_be_used_as_mlp.py |
31 |
1 |
0 |
6 |
1 |
95% |
| transformer_lens/components/mlps/gated_mlp.py |
33 |
4 |
0 |
6 |
3 |
82% |
| transformer_lens/components/mlps/gated_mlp_4bit.py |
32 |
18 |
0 |
4 |
1 |
42% |
| transformer_lens/components/mlps/gpt_oss_moe.py |
62 |
1 |
0 |
4 |
1 |
97% |
| transformer_lens/components/mlps/mlp.py |
25 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/components/mlps/moe.py |
60 |
2 |
0 |
6 |
2 |
94% |
| transformer_lens/components/pos_embed.py |
23 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/components/rms_norm.py |
26 |
14 |
0 |
6 |
0 |
38% |
| transformer_lens/components/rms_norm_pre.py |
18 |
7 |
0 |
2 |
0 |
55% |
| transformer_lens/components/t5_attention.py |
50 |
34 |
0 |
10 |
0 |
27% |
| transformer_lens/components/t5_block.py |
64 |
49 |
0 |
12 |
0 |
20% |
| transformer_lens/components/token_typed_embed.py |
12 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/components/transformer_block.py |
110 |
24 |
0 |
56 |
12 |
71% |
| transformer_lens/components/unembed.py |
19 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/config/HookedTransformerConfig.py |
134 |
7 |
0 |
32 |
5 |
93% |
| transformer_lens/config/TransformerBridgeConfig.py |
84 |
1 |
0 |
4 |
2 |
97% |
| transformer_lens/config/TransformerLensConfig.py |
62 |
3 |
0 |
12 |
2 |
93% |
| transformer_lens/config/__init__.py |
4 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/__init__.py |
2 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/conversion_steps/__init__.py |
13 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/conversion_steps/arithmetic_tensor_conversion.py |
39 |
11 |
0 |
16 |
1 |
64% |
| transformer_lens/conversion_utils/conversion_steps/attention_auto_conversion.py |
51 |
25 |
0 |
22 |
2 |
38% |
| transformer_lens/conversion_utils/conversion_steps/base_tensor_conversion.py |
14 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/conversion_steps/callable_tensor_conversion.py |
10 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/conversion_steps/chain_tensor_conversion.py |
15 |
4 |
0 |
4 |
0 |
58% |
| transformer_lens/conversion_utils/conversion_steps/rearrange_tensor_conversion.py |
18 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/conversion_steps/repeat_tensor_conversion.py |
14 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/conversion_steps/split_tensor_conversion.py |
12 |
1 |
0 |
0 |
0 |
92% |
| transformer_lens/conversion_utils/conversion_steps/tensor_conversion_set.py |
53 |
17 |
0 |
18 |
1 |
61% |
| transformer_lens/conversion_utils/conversion_steps/ternary_tensor_conversion.py |
37 |
0 |
0 |
14 |
1 |
98% |
| transformer_lens/conversion_utils/conversion_steps/transpose_tensor_conversion.py |
17 |
4 |
0 |
8 |
4 |
68% |
| transformer_lens/conversion_utils/conversion_steps/zeros_like_conversion.py |
7 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/helpers/__init__.py |
3 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/conversion_utils/helpers/find_property.py |
7 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/conversion_utils/helpers/merge_quantiziation_fields.py |
17 |
1 |
0 |
10 |
1 |
93% |
| transformer_lens/conversion_utils/hook_conversion_utils.py |
23 |
7 |
0 |
10 |
1 |
70% |
| transformer_lens/conversion_utils/param_processing_conversion.py |
22 |
1 |
0 |
4 |
2 |
88% |
| transformer_lens/evals.py |
222 |
59 |
0 |
54 |
6 |
72% |
| transformer_lens/factories/__init__.py |
0 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/factories/activation_function_factory.py |
14 |
2 |
0 |
6 |
2 |
80% |
| transformer_lens/factories/architecture_adapter_factory.py |
13 |
0 |
0 |
4 |
1 |
94% |
| transformer_lens/factories/mlp_factory.py |
17 |
0 |
0 |
6 |
0 |
100% |
| transformer_lens/head_detector.py |
84 |
2 |
0 |
28 |
2 |
96% |
| transformer_lens/hook_points.py |
323 |
61 |
5 |
146 |
22 |
76% |
| transformer_lens/lit/__init__.py |
61 |
36 |
0 |
24 |
1 |
31% |
| transformer_lens/lit/constants.py |
80 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/lit/dataset.py |
187 |
82 |
3 |
26 |
2 |
50% |
| transformer_lens/lit/model.py |
227 |
162 |
3 |
66 |
3 |
23% |
| transformer_lens/lit/utils.py |
122 |
50 |
0 |
54 |
6 |
55% |
| transformer_lens/loading_from_pretrained.py |
459 |
205 |
0 |
314 |
69 |
51% |
| transformer_lens/model_bridge/__init__.py |
7 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/architecture_adapter.py |
397 |
117 |
0 |
226 |
51 |
68% |
| transformer_lens/model_bridge/bridge.py |
1567 |
387 |
3 |
836 |
146 |
71% |
| transformer_lens/model_bridge/compat.py |
22 |
20 |
0 |
10 |
0 |
6% |
| transformer_lens/model_bridge/component_setup.py |
101 |
11 |
2 |
46 |
7 |
86% |
| transformer_lens/model_bridge/composition_scores.py |
49 |
7 |
0 |
6 |
3 |
82% |
| transformer_lens/model_bridge/exceptions.py |
6 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/generalized_components/__init__.py |
38 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/generalized_components/alibi_joint_qkv_attention.py |
69 |
6 |
0 |
20 |
7 |
83% |
| transformer_lens/model_bridge/generalized_components/alibi_utils.py |
19 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/model_bridge/generalized_components/attention.py |
331 |
38 |
0 |
152 |
32 |
83% |
| transformer_lens/model_bridge/generalized_components/audio_feature_extractor.py |
16 |
7 |
0 |
4 |
0 |
45% |
| transformer_lens/model_bridge/generalized_components/base.py |
209 |
42 |
0 |
110 |
17 |
76% |
| transformer_lens/model_bridge/generalized_components/block.py |
100 |
10 |
0 |
44 |
12 |
82% |
| transformer_lens/model_bridge/generalized_components/bloom_attention.py |
100 |
53 |
0 |
26 |
4 |
44% |
| transformer_lens/model_bridge/generalized_components/bloom_block.py |
42 |
28 |
0 |
16 |
0 |
24% |
| transformer_lens/model_bridge/generalized_components/bloom_mlp.py |
18 |
9 |
0 |
6 |
0 |
38% |
| transformer_lens/model_bridge/generalized_components/clip_vision_encoder.py |
39 |
17 |
0 |
12 |
1 |
45% |
| transformer_lens/model_bridge/generalized_components/codegen_attention.py |
85 |
17 |
0 |
18 |
6 |
72% |
| transformer_lens/model_bridge/generalized_components/conv1d.py |
20 |
12 |
0 |
4 |
0 |
33% |
| transformer_lens/model_bridge/generalized_components/conv_pos_embed.py |
16 |
7 |
0 |
4 |
0 |
45% |
| transformer_lens/model_bridge/generalized_components/depthwise_conv1d.py |
22 |
10 |
0 |
4 |
1 |
50% |
| transformer_lens/model_bridge/generalized_components/embedding.py |
44 |
12 |
0 |
16 |
7 |
65% |
| transformer_lens/model_bridge/generalized_components/gated_delta_net.py |
126 |
87 |
2 |
32 |
5 |
28% |
| transformer_lens/model_bridge/generalized_components/gated_mlp.py |
102 |
34 |
0 |
48 |
12 |
61% |
| transformer_lens/model_bridge/generalized_components/gated_rms_norm.py |
16 |
1 |
0 |
4 |
2 |
85% |
| transformer_lens/model_bridge/generalized_components/joint_gate_up_mlp.py |
73 |
23 |
0 |
20 |
1 |
61% |
| transformer_lens/model_bridge/generalized_components/joint_qkv_attention.py |
225 |
16 |
0 |
70 |
25 |
86% |
| transformer_lens/model_bridge/generalized_components/joint_qkv_position_embeddings_attention.py |
76 |
23 |
0 |
12 |
2 |
65% |
| transformer_lens/model_bridge/generalized_components/linear.py |
47 |
13 |
0 |
22 |
8 |
64% |
| transformer_lens/model_bridge/generalized_components/mla_attention.py |
141 |
36 |
0 |
34 |
4 |
68% |
| transformer_lens/model_bridge/generalized_components/mlp.py |
23 |
1 |
0 |
6 |
3 |
86% |
| transformer_lens/model_bridge/generalized_components/moe.py |
45 |
13 |
0 |
18 |
4 |
60% |
| transformer_lens/model_bridge/generalized_components/mpt_alibi_attention.py |
69 |
15 |
0 |
16 |
6 |
71% |
| transformer_lens/model_bridge/generalized_components/normalization.py |
65 |
9 |
0 |
26 |
9 |
80% |
| transformer_lens/model_bridge/generalized_components/pos_embed.py |
29 |
2 |
0 |
10 |
3 |
87% |
| transformer_lens/model_bridge/generalized_components/position_embedding_hooks_mixin.py |
17 |
0 |
0 |
2 |
1 |
95% |
| transformer_lens/model_bridge/generalized_components/position_embeddings_attention.py |
243 |
59 |
0 |
90 |
15 |
71% |
| transformer_lens/model_bridge/generalized_components/rms_normalization.py |
9 |
0 |
2 |
2 |
1 |
91% |
| transformer_lens/model_bridge/generalized_components/rotary_embedding.py |
50 |
24 |
0 |
22 |
4 |
42% |
| transformer_lens/model_bridge/generalized_components/siglip_vision_encoder.py |
39 |
17 |
0 |
12 |
1 |
45% |
| transformer_lens/model_bridge/generalized_components/ssm2_mixer.py |
70 |
8 |
0 |
18 |
5 |
81% |
| transformer_lens/model_bridge/generalized_components/ssm_block.py |
53 |
13 |
0 |
24 |
7 |
66% |
| transformer_lens/model_bridge/generalized_components/ssm_mixer.py |
22 |
7 |
0 |
12 |
4 |
56% |
| transformer_lens/model_bridge/generalized_components/symbolic.py |
8 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/generalized_components/t5_block.py |
92 |
21 |
0 |
36 |
12 |
68% |
| transformer_lens/model_bridge/generalized_components/unembedding.py |
59 |
17 |
0 |
20 |
8 |
63% |
| transformer_lens/model_bridge/generalized_components/vision_projection.py |
18 |
7 |
0 |
4 |
0 |
50% |
| transformer_lens/model_bridge/get_params_util.py |
118 |
1 |
0 |
30 |
3 |
97% |
| transformer_lens/model_bridge/sources/__init__.py |
2 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/sources/transformers.py |
335 |
108 |
0 |
190 |
50 |
67% |
| transformer_lens/model_bridge/supported_architectures/__init__.py |
54 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/apertus.py |
79 |
52 |
0 |
20 |
0 |
27% |
| transformer_lens/model_bridge/supported_architectures/bert.py |
22 |
3 |
0 |
2 |
0 |
79% |
| transformer_lens/model_bridge/supported_architectures/bloom.py |
39 |
20 |
0 |
0 |
0 |
49% |
| transformer_lens/model_bridge/supported_architectures/codegen.py |
33 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/cohere.py |
44 |
7 |
0 |
16 |
2 |
75% |
| transformer_lens/model_bridge/supported_architectures/deepseek_v3.py |
22 |
6 |
0 |
6 |
0 |
57% |
| transformer_lens/model_bridge/supported_architectures/falcon.py |
109 |
33 |
0 |
42 |
10 |
64% |
| transformer_lens/model_bridge/supported_architectures/gemma1.py |
46 |
23 |
0 |
16 |
0 |
37% |
| transformer_lens/model_bridge/supported_architectures/gemma2.py |
40 |
16 |
2 |
20 |
2 |
43% |
| transformer_lens/model_bridge/supported_architectures/gemma3.py |
40 |
18 |
0 |
20 |
0 |
37% |
| transformer_lens/model_bridge/supported_architectures/gemma3_multimodal.py |
49 |
24 |
0 |
24 |
1 |
36% |
| transformer_lens/model_bridge/supported_architectures/gpt2.py |
52 |
12 |
0 |
14 |
3 |
65% |
| transformer_lens/model_bridge/supported_architectures/gpt2_lm_head_custom.py |
10 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/gpt_bigcode.py |
63 |
0 |
0 |
10 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/gpt_oss.py |
26 |
1 |
0 |
8 |
3 |
88% |
| transformer_lens/model_bridge/supported_architectures/gptj.py |
16 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/granite.py |
41 |
11 |
0 |
10 |
1 |
61% |
| transformer_lens/model_bridge/supported_architectures/granite_moe.py |
5 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/granite_moe_hybrid.py |
26 |
2 |
0 |
6 |
3 |
84% |
| transformer_lens/model_bridge/supported_architectures/hubert.py |
39 |
9 |
0 |
4 |
0 |
70% |
| transformer_lens/model_bridge/supported_architectures/internlm2.py |
160 |
39 |
0 |
46 |
5 |
69% |
| transformer_lens/model_bridge/supported_architectures/llama.py |
27 |
6 |
0 |
8 |
1 |
63% |
| transformer_lens/model_bridge/supported_architectures/llava.py |
49 |
19 |
0 |
22 |
2 |
48% |
| transformer_lens/model_bridge/supported_architectures/llava_next.py |
3 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/llava_onevision.py |
16 |
11 |
0 |
10 |
0 |
19% |
| transformer_lens/model_bridge/supported_architectures/mamba.py |
20 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/mamba2.py |
46 |
2 |
0 |
8 |
2 |
93% |
| transformer_lens/model_bridge/supported_architectures/mingpt.py |
10 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/mistral.py |
15 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/mixtral.py |
31 |
12 |
0 |
14 |
0 |
42% |
| transformer_lens/model_bridge/supported_architectures/mpt.py |
26 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/nanogpt.py |
18 |
5 |
0 |
4 |
0 |
59% |
| transformer_lens/model_bridge/supported_architectures/neel_solu_old.py |
27 |
14 |
0 |
12 |
0 |
33% |
| transformer_lens/model_bridge/supported_architectures/neo.py |
34 |
8 |
0 |
4 |
0 |
68% |
| transformer_lens/model_bridge/supported_architectures/neox.py |
53 |
4 |
0 |
6 |
0 |
83% |
| transformer_lens/model_bridge/supported_architectures/olmo.py |
66 |
37 |
0 |
26 |
1 |
33% |
| transformer_lens/model_bridge/supported_architectures/olmo2.py |
34 |
12 |
0 |
16 |
1 |
46% |
| transformer_lens/model_bridge/supported_architectures/olmo3.py |
3 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/olmoe.py |
39 |
13 |
0 |
16 |
1 |
49% |
| transformer_lens/model_bridge/supported_architectures/openelm.py |
85 |
55 |
0 |
30 |
1 |
27% |
| transformer_lens/model_bridge/supported_architectures/opt.py |
26 |
3 |
0 |
6 |
3 |
81% |
| transformer_lens/model_bridge/supported_architectures/phi.py |
35 |
15 |
0 |
14 |
0 |
41% |
| transformer_lens/model_bridge/supported_architectures/phi3.py |
130 |
86 |
0 |
48 |
0 |
25% |
| transformer_lens/model_bridge/supported_architectures/pythia.py |
51 |
37 |
0 |
6 |
0 |
25% |
| transformer_lens/model_bridge/supported_architectures/qwen.py |
48 |
30 |
0 |
8 |
0 |
32% |
| transformer_lens/model_bridge/supported_architectures/qwen2.py |
23 |
6 |
0 |
6 |
0 |
59% |
| transformer_lens/model_bridge/supported_architectures/qwen3.py |
65 |
18 |
0 |
24 |
1 |
61% |
| transformer_lens/model_bridge/supported_architectures/qwen3_5.py |
17 |
3 |
0 |
4 |
1 |
71% |
| transformer_lens/model_bridge/supported_architectures/qwen3_moe.py |
32 |
12 |
0 |
16 |
1 |
44% |
| transformer_lens/model_bridge/supported_architectures/qwen3_next.py |
12 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/model_bridge/supported_architectures/stablelm.py |
73 |
39 |
0 |
28 |
2 |
36% |
| transformer_lens/model_bridge/supported_architectures/t5.py |
20 |
2 |
0 |
2 |
1 |
86% |
| transformer_lens/model_bridge/supported_architectures/xglm.py |
27 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/model_bridge/types.py |
11 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/patching.py |
142 |
36 |
34 |
14 |
6 |
73% |
| transformer_lens/pretrained/__init__.py |
0 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/pretrained/weight_conversions/__init__.py |
28 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/pretrained/weight_conversions/apertus.py |
70 |
7 |
0 |
14 |
4 |
87% |
| transformer_lens/pretrained/weight_conversions/bert.py |
37 |
33 |
0 |
2 |
0 |
10% |
| transformer_lens/pretrained/weight_conversions/bloom.py |
40 |
36 |
0 |
2 |
0 |
10% |
| transformer_lens/pretrained/weight_conversions/coder.py |
43 |
38 |
0 |
2 |
0 |
11% |
| transformer_lens/pretrained/weight_conversions/gemma.py |
54 |
2 |
0 |
14 |
3 |
93% |
| transformer_lens/pretrained/weight_conversions/gpt2.py |
43 |
1 |
0 |
4 |
1 |
96% |
| transformer_lens/pretrained/weight_conversions/gptj.py |
36 |
31 |
0 |
2 |
0 |
13% |
| transformer_lens/pretrained/weight_conversions/hubert.py |
69 |
11 |
0 |
36 |
12 |
78% |
| transformer_lens/pretrained/weight_conversions/llama.py |
45 |
39 |
0 |
8 |
0 |
11% |
| transformer_lens/pretrained/weight_conversions/mingpt.py |
40 |
36 |
0 |
2 |
0 |
10% |
| transformer_lens/pretrained/weight_conversions/mistral.py |
36 |
31 |
0 |
2 |
0 |
13% |
| transformer_lens/pretrained/weight_conversions/mixtral.py |
37 |
32 |
0 |
4 |
0 |
12% |
| transformer_lens/pretrained/weight_conversions/nanogpt.py |
52 |
47 |
0 |
10 |
0 |
8% |
| transformer_lens/pretrained/weight_conversions/neel_solu_old.py |
17 |
14 |
0 |
12 |
0 |
10% |
| transformer_lens/pretrained/weight_conversions/neo.py |
40 |
0 |
0 |
4 |
0 |
100% |
| transformer_lens/pretrained/weight_conversions/neox.py |
34 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/pretrained/weight_conversions/olmo.py |
36 |
31 |
0 |
2 |
0 |
13% |
| transformer_lens/pretrained/weight_conversions/olmo2.py |
40 |
34 |
0 |
2 |
0 |
14% |
| transformer_lens/pretrained/weight_conversions/olmo3.py |
42 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/pretrained/weight_conversions/olmoe.py |
43 |
38 |
0 |
4 |
0 |
11% |
| transformer_lens/pretrained/weight_conversions/openai.py |
49 |
4 |
0 |
8 |
2 |
89% |
| transformer_lens/pretrained/weight_conversions/opt.py |
40 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/pretrained/weight_conversions/phi.py |
41 |
37 |
0 |
2 |
0 |
9% |
| transformer_lens/pretrained/weight_conversions/phi3.py |
41 |
35 |
0 |
2 |
0 |
14% |
| transformer_lens/pretrained/weight_conversions/qwen.py |
38 |
33 |
0 |
2 |
0 |
12% |
| transformer_lens/pretrained/weight_conversions/qwen2.py |
41 |
36 |
0 |
2 |
0 |
12% |
| transformer_lens/pretrained/weight_conversions/qwen3.py |
43 |
37 |
0 |
4 |
0 |
13% |
| transformer_lens/pretrained/weight_conversions/t5.py |
33 |
29 |
0 |
4 |
0 |
11% |
| transformer_lens/supported_models.py |
5 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/tools/__init__.py |
2 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/tools/model_registry/__init__.py |
5 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/tools/model_registry/alias_drift.py |
61 |
26 |
0 |
20 |
2 |
48% |
| transformer_lens/tools/model_registry/api.py |
142 |
43 |
0 |
52 |
9 |
62% |
| transformer_lens/tools/model_registry/discover_architectures.py |
100 |
100 |
0 |
30 |
0 |
0% |
| transformer_lens/tools/model_registry/exceptions.py |
36 |
18 |
0 |
10 |
1 |
41% |
| transformer_lens/tools/model_registry/generate_report.py |
107 |
107 |
0 |
30 |
0 |
0% |
| transformer_lens/tools/model_registry/hf_scraper.py |
243 |
243 |
0 |
80 |
0 |
0% |
| transformer_lens/tools/model_registry/registry_io.py |
90 |
7 |
0 |
32 |
4 |
88% |
| transformer_lens/tools/model_registry/relevancy.py |
40 |
0 |
0 |
18 |
0 |
100% |
| transformer_lens/tools/model_registry/schemas.py |
123 |
2 |
0 |
16 |
4 |
96% |
| transformer_lens/tools/model_registry/validate.py |
236 |
79 |
0 |
138 |
36 |
58% |
| transformer_lens/tools/model_registry/verification.py |
48 |
0 |
0 |
8 |
1 |
98% |
| transformer_lens/tools/model_registry/verify_models.py |
638 |
555 |
0 |
310 |
1 |
9% |
| transformer_lens/train.py |
75 |
45 |
0 |
32 |
0 |
28% |
| transformer_lens/utilities/__init__.py |
17 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/utilities/activation_functions.py |
35 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/utilities/addmm.py |
10 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/utilities/aliases.py |
59 |
8 |
0 |
36 |
2 |
87% |
| transformer_lens/utilities/architectures.py |
49 |
8 |
0 |
20 |
9 |
75% |
| transformer_lens/utilities/attention.py |
15 |
2 |
0 |
4 |
2 |
79% |
| transformer_lens/utilities/attribute_utils.py |
11 |
0 |
0 |
4 |
0 |
100% |
| transformer_lens/utilities/bridge_components.py |
41 |
5 |
0 |
24 |
6 |
83% |
| transformer_lens/utilities/cache.py |
6 |
0 |
0 |
2 |
0 |
100% |
| transformer_lens/utilities/components_utils.py |
29 |
3 |
0 |
18 |
3 |
87% |
| transformer_lens/utilities/defaults_utils.py |
34 |
0 |
0 |
10 |
0 |
100% |
| transformer_lens/utilities/devices.py |
57 |
0 |
5 |
34 |
3 |
97% |
| transformer_lens/utilities/exploratory_utils.py |
48 |
4 |
0 |
16 |
5 |
86% |
| transformer_lens/utilities/gpu_utils.py |
5 |
1 |
0 |
0 |
0 |
80% |
| transformer_lens/utilities/hf_utils.py |
73 |
34 |
0 |
30 |
6 |
48% |
| transformer_lens/utilities/initialization_utils.py |
41 |
0 |
0 |
8 |
0 |
100% |
| transformer_lens/utilities/library_utils.py |
4 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/utilities/lm_utils.py |
22 |
5 |
0 |
6 |
1 |
71% |
| transformer_lens/utilities/logits_utils.py |
40 |
19 |
0 |
16 |
4 |
52% |
| transformer_lens/utilities/matrix.py |
23 |
1 |
0 |
6 |
1 |
93% |
| transformer_lens/utilities/multi_gpu.py |
40 |
6 |
2 |
10 |
1 |
82% |
| transformer_lens/utilities/slice.py |
46 |
2 |
0 |
18 |
2 |
94% |
| transformer_lens/utilities/tensors.py |
84 |
37 |
0 |
40 |
2 |
48% |
| transformer_lens/utilities/tokenize_utils.py |
110 |
3 |
0 |
38 |
6 |
94% |
| transformer_lens/utils.py |
4 |
0 |
0 |
0 |
0 |
100% |
| transformer_lens/weight_processing.py |
822 |
183 |
46 |
396 |
102 |
73% |