From 201edaae83959bb9b11ee670061d533c76a90ae7 Mon Sep 17 00:00:00 2001 From: bryce13950 Date: Tue, 31 Dec 2024 02:22:15 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Transfor?= =?UTF-8?q?merLensOrg/TransformerLens@f103debd1084cd79969164ac98ed9059a863?= =?UTF-8?q?54bc=20=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../generated/model_properties_table.md.txt | 9 +- ...7285d613390727b_can_be_used_as_mlp_py.html | 4 +- .../d_37285d613390727b_gated_mlp_4bit_py.html | 4 +- .../d_37285d613390727b_gated_mlp_py.html | 4 +- .../coverage/d_37285d613390727b_mlp_py.html | 4 +- .../coverage/d_37285d613390727b_moe_py.html | 4 +- ...bfb219_activation_function_factory_py.html | 4 +- .../d_65d4430f90bfb219_mlp_factory_py.html | 4 +- .../d_712808f24eb400fe___init___py.html | 4 +- ...d_af97b5493da09a14_ActivationCache_py.html | 4 +- .../d_af97b5493da09a14_FactoredMatrix_py.html | 4 +- ...7b5493da09a14_HookedEncoderDecoder_py.html | 4 +- .../d_af97b5493da09a14_HookedEncoder_py.html | 4 +- ...493da09a14_HookedTransformerConfig_py.html | 12 +- ...af97b5493da09a14_HookedTransformer_py.html | 1105 +++--- .../d_af97b5493da09a14_SVDInterpreter_py.html | 4 +- .../d_af97b5493da09a14___init___py.html | 4 +- .../coverage/d_af97b5493da09a14_evals_py.html | 4 +- .../d_af97b5493da09a14_head_detector_py.html | 4 +- .../d_af97b5493da09a14_hook_points_py.html | 4 +- ...493da09a14_loading_from_pretrained_py.html | 3503 +++++++++-------- ...5493da09a14_past_key_value_caching_py.html | 4 +- .../d_af97b5493da09a14_patching_py.html | 4 +- .../coverage/d_af97b5493da09a14_train_py.html | 4 +- .../coverage/d_af97b5493da09a14_utils_py.html | 4 +- .../d_b2114f845e0399b7___init___py.html | 4 +- ...14f845e0399b7_activation_functions_py.html | 4 +- .../coverage/d_b2114f845e0399b7_addmm_py.html | 4 +- .../d_b2114f845e0399b7_attention_py.html | 4 +- .../d_b2114f845e0399b7_devices_py.html | 4 +- .../d_c1ea89878f9b2ac7___init___py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_bert_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_bloom_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_coder_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_gemma_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_gpt2_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_gptj_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_llama_py.html | 4 +- .../d_c1ea89878f9b2ac7_mingpt_py.html | 4 +- .../d_c1ea89878f9b2ac7_mistral_py.html | 4 +- .../d_c1ea89878f9b2ac7_mixtral_py.html | 4 +- .../d_c1ea89878f9b2ac7_nanogpt_py.html | 4 +- .../d_c1ea89878f9b2ac7_neel_solu_old_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_neo_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_neox_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_opt_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_phi3_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_phi_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_qwen2_py.html | 84 +- .../coverage/d_c1ea89878f9b2ac7_qwen_py.html | 4 +- .../coverage/d_c1ea89878f9b2ac7_t5_py.html | 4 +- .../d_db46118ef83ad831___init___py.html | 4 +- ...b46118ef83ad831_abstract_attention_py.html | 4 +- .../d_db46118ef83ad831_attention_py.html | 4 +- .../d_db46118ef83ad831_bert_block_py.html | 4 +- .../d_db46118ef83ad831_bert_embed_py.html | 4 +- .../d_db46118ef83ad831_bert_mlm_head_py.html | 4 +- .../coverage/d_db46118ef83ad831_embed_py.html | 4 +- ...8ef83ad831_grouped_query_attention_py.html | 4 +- .../d_db46118ef83ad831_layer_norm_pre_py.html | 4 +- .../d_db46118ef83ad831_layer_norm_py.html | 4 +- .../d_db46118ef83ad831_pos_embed_py.html | 4 +- .../d_db46118ef83ad831_rms_norm_pre_py.html | 4 +- .../d_db46118ef83ad831_rms_norm_py.html | 4 +- .../d_db46118ef83ad831_t5_attention_py.html | 4 +- .../d_db46118ef83ad831_t5_block_py.html | 4 +- ...db46118ef83ad831_token_typed_embed_py.html | 4 +- ...db46118ef83ad831_transformer_block_py.html | 18 +- .../d_db46118ef83ad831_unembed_py.html | 4 +- _static/coverage/index.html | 48 +- _static/coverage/status.json | 2 +- ...nsformer_lens.loading_from_pretrained.html | 2 +- .../demos/Exploratory_Analysis_Demo.html | 102 +- .../demos/Exploratory_Analysis_Demo.ipynb | 1814 ++++----- generated/demos/Main_Demo.html | 107 +- generated/demos/Main_Demo.ipynb | 2447 ++++++------ generated/model_properties_table.html | 264 +- searchindex.js | 2 +- 78 files changed, 4893 insertions(+), 4878 deletions(-) diff --git a/_sources/generated/model_properties_table.md.txt b/_sources/generated/model_properties_table.md.txt index b653ccf5a..66e6ebe90 100644 --- a/_sources/generated/model_properties_table.md.txt +++ b/_sources/generated/model_properties_table.md.txt @@ -109,14 +109,15 @@ | meta-llama/Meta-Llama-3-8B-Instruct | 7.8B | 32 | 4096 | 32 | silu | 8192 | 128256 | 128 | 14336 | 8 | | meta-llama/Meta-Llama-3-70B | 78B | 80 | 8192 | 64 | silu | 8192 | 128256 | 128 | 28672 | 8 | | meta-llama/Meta-Llama-3-70B-Instruct | 78B | 80 | 8192 | 64 | silu | 8192 | 128256 | 128 | 28672 | 8 | -| meta-llama/Llama-3.2-1B | 1.1B | 16 | 2048 | 32 | silu | 2048 | 128256 | 64 | 8192 | 8 | -| meta-llama/Llama-3.2-3B | 3.2B | 28 | 3072 | 24 | silu | 2048 | 128256 | 128 | 8192 | 8 | -| meta-llama/Llama-3.2-1B-Instruct | 1.1B | 16 | 2048 | 32 | silu | 2048 | 128256 | 64 | 8192 | 8 | -| meta-llama/Llama-3.2-3B-Instruct | 3.2B | 28 | 3072 | 24 | silu | 2048 | 128256 | 128 | 8192 | 8 | | meta-llama/Llama-3.1-70B | 78B | 80 | 8192 | 64 | silu | 2048 | 128256 | 128 | 28672 | 8 | | meta-llama/Llama-3.1-8B | 7.8B | 32 | 4096 | 32 | silu | 2048 | 128256 | 128 | 14336 | 8 | | meta-llama/Llama-3.1-8B-Instruct | 7.8B | 32 | 4096 | 32 | silu | 2048 | 128256 | 128 | 14336 | 8 | | meta-llama/Llama-3.1-70B-Instruct | 78B | 80 | 8192 | 64 | silu | 2048 | 128256 | 128 | 28672 | 8 | +| meta-llama/Llama-3.2-1B | 1.1B | 16 | 2048 | 32 | silu | 2048 | 128256 | 64 | 8192 | 8 | +| meta-llama/Llama-3.2-3B | 3.2B | 28 | 3072 | 24 | silu | 2048 | 128256 | 128 | 8192 | 8 | +| meta-llama/Llama-3.2-1B-Instruct | 1.1B | 16 | 2048 | 32 | silu | 2048 | 128256 | 64 | 8192 | 8 | +| meta-llama/Llama-3.2-3B-Instruct | 3.2B | 28 | 3072 | 24 | silu | 2048 | 128256 | 128 | 8192 | 8 | +| meta-llama/Llama-3.3-70B-Instruct | 78B | 80 | 8192 | 64 | silu | 2048 | 128256 | 128 | 28672 | 8 | | othello-gpt | 25M | 8 | 512 | 8 | gelu | 59 | 61 | 64 | 2048 | | | bert-base-cased | 85M | 12 | 768 | 12 | gelu | 512 | 28996 | 64 | 3072 | | | tiny-stories-1M | 393K | 8 | 64 | 16 | gelu | 2048 | 50257 | 4 | 256 | | diff --git a/_static/coverage/d_37285d613390727b_can_be_used_as_mlp_py.html b/_static/coverage/d_37285d613390727b_can_be_used_as_mlp_py.html index bfe5dd961..fa8b40624 100644 --- a/_static/coverage/d_37285d613390727b_can_be_used_as_mlp_py.html +++ b/_static/coverage/d_37285d613390727b_can_be_used_as_mlp_py.html @@ -67,7 +67,7 @@ » next coverage.py v7.4.4, - created at 2024-12-14 00:54 +0000 + created at 2024-12-31 02:13 +0000