From f582d274a55b44361a13d7b7db3e5dc58f658fcb Mon Sep 17 00:00:00 2001 From: JadenFiottoKaufman Date: Mon, 2 Sep 2024 01:42:17 -0400 Subject: [PATCH] Attribution patching fixes --- public/_modules/index.html | 4 ++-- .../_modules/nnsight/contexts/Conditional/index.html | 4 ++-- .../nnsight/contexts/GraphBasedContext/index.html | 4 ++-- public/_modules/nnsight/contexts/Invoker/index.html | 4 ++-- public/_modules/nnsight/contexts/Tracer/index.html | 4 ++-- public/_modules/nnsight/contexts/index.html | 4 ++-- .../nnsight/contexts/session/Iterator/index.html | 4 ++-- .../nnsight/contexts/session/Session/index.html | 4 ++-- public/_modules/nnsight/envoy/index.html | 4 ++-- public/_modules/nnsight/intervention/index.html | 4 ++-- .../_modules/nnsight/models/LanguageModel/index.html | 4 ++-- .../_modules/nnsight/models/NNsightModel/index.html | 4 ++-- .../nnsight/models/UnifiedTransformer/index.html | 4 ++-- public/_modules/nnsight/patching/index.html | 4 ++-- public/_modules/nnsight/schema/Config/index.html | 4 ++-- public/_modules/nnsight/schema/Response/index.html | 4 ++-- .../_modules/nnsight/schema/format/types/index.html | 4 ++-- public/_modules/nnsight/tracing/Bridge/index.html | 4 ++-- public/_modules/nnsight/tracing/Graph/index.html | 4 ++-- public/_modules/nnsight/tracing/Node/index.html | 4 ++-- public/_modules/nnsight/tracing/Proxy/index.html | 4 ++-- public/_modules/nnsight/tracing/protocols/index.html | 4 ++-- public/_modules/nnsight/util/index.html | 4 ++-- .../tutorials/attribution_patching.ipynb.txt | 9 ++++----- public/about/index.html | 4 ++-- public/documentation/contexts/index.html | 4 ++-- public/documentation/envoy/index.html | 4 ++-- public/documentation/index.html | 4 ++-- public/documentation/intervention/index.html | 4 ++-- public/documentation/models/index.html | 4 ++-- public/documentation/patching/index.html | 4 ++-- public/documentation/schema/index.html | 4 ++-- public/documentation/tracing/index.html | 4 ++-- public/documentation/util/index.html | 4 ++-- public/features/index.html | 4 ++-- public/genindex/index.html | 4 ++-- public/index.html | 4 ++-- public/notebooks/features/conditionals/index.html | 4 ++-- public/notebooks/features/cross_prompt/index.html | 4 ++-- public/notebooks/features/custom_functions/index.html | 4 ++-- public/notebooks/features/early_stopping/index.html | 4 ++-- public/notebooks/features/getting/index.html | 4 ++-- public/notebooks/features/gradients/index.html | 4 ++-- public/notebooks/features/iterator/index.html | 4 ++-- public/notebooks/features/lora_training/index.html | 4 ++-- public/notebooks/features/model_editing/index.html | 4 ++-- public/notebooks/features/modules/index.html | 4 ++-- public/notebooks/features/multiple_token/index.html | 4 ++-- public/notebooks/features/operations/index.html | 4 ++-- public/notebooks/features/remote_execution/index.html | 4 ++-- public/notebooks/features/scan_validate/index.html | 4 ++-- public/notebooks/features/sessions/index.html | 4 ++-- public/notebooks/features/setting/index.html | 4 ++-- .../tutorials/activation_patching/index.html | 4 ++-- public/notebooks/tutorials/attribution_patching.ipynb | 9 ++++----- .../tutorials/attribution_patching/index.html | 11 +++++------ public/notebooks/tutorials/boundless_DAS/index.html | 4 ++-- public/notebooks/tutorials/dict_learning/index.html | 4 ++-- public/notebooks/tutorials/logit_lens/index.html | 4 ++-- public/notebooks/tutorials/walkthrough/index.html | 4 ++-- public/py-modindex/index.html | 4 ++-- public/search/index.html | 4 ++-- public/searchindex.js | 2 +- public/start/index.html | 4 ++-- public/status/index.html | 4 ++-- public/tutorials/index.html | 4 ++-- 66 files changed, 138 insertions(+), 141 deletions(-) diff --git a/public/_modules/index.html b/public/_modules/index.html index 5047cc6..91f7354 100644 --- a/public/_modules/index.html +++ b/public/_modules/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/contexts/Conditional/index.html b/public/_modules/nnsight/contexts/Conditional/index.html index 4025e9b..57517d0 100644 --- a/public/_modules/nnsight/contexts/Conditional/index.html +++ b/public/_modules/nnsight/contexts/Conditional/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/contexts/GraphBasedContext/index.html b/public/_modules/nnsight/contexts/GraphBasedContext/index.html index b56a4f8..878741c 100644 --- a/public/_modules/nnsight/contexts/GraphBasedContext/index.html +++ b/public/_modules/nnsight/contexts/GraphBasedContext/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/contexts/Invoker/index.html b/public/_modules/nnsight/contexts/Invoker/index.html index 6150c96..4355e0b 100644 --- a/public/_modules/nnsight/contexts/Invoker/index.html +++ b/public/_modules/nnsight/contexts/Invoker/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/contexts/Tracer/index.html b/public/_modules/nnsight/contexts/Tracer/index.html index 0f876e7..898b4a6 100644 --- a/public/_modules/nnsight/contexts/Tracer/index.html +++ b/public/_modules/nnsight/contexts/Tracer/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/contexts/index.html b/public/_modules/nnsight/contexts/index.html index dbd26a5..17d303f 100644 --- a/public/_modules/nnsight/contexts/index.html +++ b/public/_modules/nnsight/contexts/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/contexts/session/Iterator/index.html b/public/_modules/nnsight/contexts/session/Iterator/index.html index b93cd8e..1f770ea 100644 --- a/public/_modules/nnsight/contexts/session/Iterator/index.html +++ b/public/_modules/nnsight/contexts/session/Iterator/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/contexts/session/Session/index.html b/public/_modules/nnsight/contexts/session/Session/index.html index 6d1cf46..222ad79 100644 --- a/public/_modules/nnsight/contexts/session/Session/index.html +++ b/public/_modules/nnsight/contexts/session/Session/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/envoy/index.html b/public/_modules/nnsight/envoy/index.html index 15dedce..f6acb7b 100644 --- a/public/_modules/nnsight/envoy/index.html +++ b/public/_modules/nnsight/envoy/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/intervention/index.html b/public/_modules/nnsight/intervention/index.html index c862bca..a4ca111 100644 --- a/public/_modules/nnsight/intervention/index.html +++ b/public/_modules/nnsight/intervention/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/models/LanguageModel/index.html b/public/_modules/nnsight/models/LanguageModel/index.html index 39d4e72..3234c9d 100644 --- a/public/_modules/nnsight/models/LanguageModel/index.html +++ b/public/_modules/nnsight/models/LanguageModel/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/models/NNsightModel/index.html b/public/_modules/nnsight/models/NNsightModel/index.html index d39cf4b..5311066 100644 --- a/public/_modules/nnsight/models/NNsightModel/index.html +++ b/public/_modules/nnsight/models/NNsightModel/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/models/UnifiedTransformer/index.html b/public/_modules/nnsight/models/UnifiedTransformer/index.html index e9bf6f1..be0c87a 100644 --- a/public/_modules/nnsight/models/UnifiedTransformer/index.html +++ b/public/_modules/nnsight/models/UnifiedTransformer/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/patching/index.html b/public/_modules/nnsight/patching/index.html index 8119197..e024997 100644 --- a/public/_modules/nnsight/patching/index.html +++ b/public/_modules/nnsight/patching/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/schema/Config/index.html b/public/_modules/nnsight/schema/Config/index.html index de59675..a5b7a33 100644 --- a/public/_modules/nnsight/schema/Config/index.html +++ b/public/_modules/nnsight/schema/Config/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/schema/Response/index.html b/public/_modules/nnsight/schema/Response/index.html index 2e2dfcf..b81e02c 100644 --- a/public/_modules/nnsight/schema/Response/index.html +++ b/public/_modules/nnsight/schema/Response/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/schema/format/types/index.html b/public/_modules/nnsight/schema/format/types/index.html index f0a4155..440a6ac 100644 --- a/public/_modules/nnsight/schema/format/types/index.html +++ b/public/_modules/nnsight/schema/format/types/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/tracing/Bridge/index.html b/public/_modules/nnsight/tracing/Bridge/index.html index 217ceb4..70413b1 100644 --- a/public/_modules/nnsight/tracing/Bridge/index.html +++ b/public/_modules/nnsight/tracing/Bridge/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/tracing/Graph/index.html b/public/_modules/nnsight/tracing/Graph/index.html index 829bdf9..73e063c 100644 --- a/public/_modules/nnsight/tracing/Graph/index.html +++ b/public/_modules/nnsight/tracing/Graph/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/tracing/Node/index.html b/public/_modules/nnsight/tracing/Node/index.html index 150a35f..059502c 100644 --- a/public/_modules/nnsight/tracing/Node/index.html +++ b/public/_modules/nnsight/tracing/Node/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/tracing/Proxy/index.html b/public/_modules/nnsight/tracing/Proxy/index.html index 7169544..9193b20 100644 --- a/public/_modules/nnsight/tracing/Proxy/index.html +++ b/public/_modules/nnsight/tracing/Proxy/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/tracing/protocols/index.html b/public/_modules/nnsight/tracing/protocols/index.html index e61937a..ed1abae 100644 --- a/public/_modules/nnsight/tracing/protocols/index.html +++ b/public/_modules/nnsight/tracing/protocols/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_modules/nnsight/util/index.html b/public/_modules/nnsight/util/index.html index cb98e49..27fdb71 100644 --- a/public/_modules/nnsight/util/index.html +++ b/public/_modules/nnsight/util/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/_sources/notebooks/tutorials/attribution_patching.ipynb.txt b/public/_sources/notebooks/tutorials/attribution_patching.ipynb.txt index ae5f775..ad416a2 100644 --- a/public/_sources/notebooks/tutorials/attribution_patching.ipynb.txt +++ b/public/_sources/notebooks/tutorials/attribution_patching.ipynb.txt @@ -128,8 +128,7 @@ ], "source": [ "def get_logit_diff(logits, answer_token_indices=answer_token_indices):\n", - " if len(logits.shape) == 3:\n", - " logits = logits[:, -1, :]\n", + " logits = logits[:, -1, :]\n", " correct_logits = logits.gather(1, answer_token_indices[:, 0].unsqueeze(1))\n", " incorrect_logits = logits.gather(1, answer_token_indices[:, 1].unsqueeze(1))\n", " return (correct_logits - incorrect_logits).mean()\n", @@ -222,13 +221,13 @@ " with tracer.invoke(clean_tokens) as invoker_clean:\n", "\n", " for layer in model.transformer.h:\n", - " attn_out = layer.attn.c_proj.input[0][0]\n", + " attn_out = layer.attn.c_proj.input\n", " clean_out.append(attn_out.save())\n", "\n", " with tracer.invoke(corrupted_tokens) as invoker_corrupted:\n", "\n", " for layer in model.transformer.h:\n", - " attn_out = layer.attn.c_proj.input[0][0]\n", + " attn_out = layer.attn.c_proj.input\n", " corrupted_out.append(attn_out.save())\n", " corrupted_grads.append(attn_out.grad.save())\n", "\n", @@ -2648,7 +2647,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.1.0" + "version": "3.10.13" } }, "nbformat": 4, diff --git a/public/about/index.html b/public/about/index.html index 9ea1e8b..08be5dc 100644 --- a/public/about/index.html +++ b/public/about/index.html @@ -56,8 +56,8 @@ - - + + diff --git a/public/documentation/contexts/index.html b/public/documentation/contexts/index.html index 80f7081..ded2dca 100644 --- a/public/documentation/contexts/index.html +++ b/public/documentation/contexts/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/documentation/envoy/index.html b/public/documentation/envoy/index.html index c9934c1..c3ce30d 100644 --- a/public/documentation/envoy/index.html +++ b/public/documentation/envoy/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/documentation/index.html b/public/documentation/index.html index 0325940..9100302 100644 --- a/public/documentation/index.html +++ b/public/documentation/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/documentation/intervention/index.html b/public/documentation/intervention/index.html index ee8974a..7c9463e 100644 --- a/public/documentation/intervention/index.html +++ b/public/documentation/intervention/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/documentation/models/index.html b/public/documentation/models/index.html index fbcfe95..043fc86 100644 --- a/public/documentation/models/index.html +++ b/public/documentation/models/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/documentation/patching/index.html b/public/documentation/patching/index.html index 6ff5e29..fbdda7f 100644 --- a/public/documentation/patching/index.html +++ b/public/documentation/patching/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/documentation/schema/index.html b/public/documentation/schema/index.html index 67cfffb..0e366d3 100644 --- a/public/documentation/schema/index.html +++ b/public/documentation/schema/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/documentation/tracing/index.html b/public/documentation/tracing/index.html index 5b6f9cb..b10b7c4 100644 --- a/public/documentation/tracing/index.html +++ b/public/documentation/tracing/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/documentation/util/index.html b/public/documentation/util/index.html index 6c86e68..0e747a4 100644 --- a/public/documentation/util/index.html +++ b/public/documentation/util/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/features/index.html b/public/features/index.html index 56079f0..58e7da3 100644 --- a/public/features/index.html +++ b/public/features/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/genindex/index.html b/public/genindex/index.html index b42d082..204c2ed 100644 --- a/public/genindex/index.html +++ b/public/genindex/index.html @@ -54,8 +54,8 @@ - - + + diff --git a/public/index.html b/public/index.html index 517c2ed..a0ba255 100644 --- a/public/index.html +++ b/public/index.html @@ -56,8 +56,8 @@ - - + + diff --git a/public/notebooks/features/conditionals/index.html b/public/notebooks/features/conditionals/index.html index b4be316..b6aaa7e 100644 --- a/public/notebooks/features/conditionals/index.html +++ b/public/notebooks/features/conditionals/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/cross_prompt/index.html b/public/notebooks/features/cross_prompt/index.html index 2f03c86..0447809 100644 --- a/public/notebooks/features/cross_prompt/index.html +++ b/public/notebooks/features/cross_prompt/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/custom_functions/index.html b/public/notebooks/features/custom_functions/index.html index 0a6ceb0..e5ff9bd 100644 --- a/public/notebooks/features/custom_functions/index.html +++ b/public/notebooks/features/custom_functions/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/early_stopping/index.html b/public/notebooks/features/early_stopping/index.html index c9c7ed4..84180a3 100644 --- a/public/notebooks/features/early_stopping/index.html +++ b/public/notebooks/features/early_stopping/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/getting/index.html b/public/notebooks/features/getting/index.html index 90d1c4b..24f278d 100644 --- a/public/notebooks/features/getting/index.html +++ b/public/notebooks/features/getting/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/gradients/index.html b/public/notebooks/features/gradients/index.html index 34988d1..7289414 100644 --- a/public/notebooks/features/gradients/index.html +++ b/public/notebooks/features/gradients/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/iterator/index.html b/public/notebooks/features/iterator/index.html index 31466b3..b272674 100644 --- a/public/notebooks/features/iterator/index.html +++ b/public/notebooks/features/iterator/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/lora_training/index.html b/public/notebooks/features/lora_training/index.html index 3a570a3..f4b5142 100644 --- a/public/notebooks/features/lora_training/index.html +++ b/public/notebooks/features/lora_training/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/model_editing/index.html b/public/notebooks/features/model_editing/index.html index f765cd8..2d5a3ca 100644 --- a/public/notebooks/features/model_editing/index.html +++ b/public/notebooks/features/model_editing/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/modules/index.html b/public/notebooks/features/modules/index.html index e9e120f..cf8f580 100644 --- a/public/notebooks/features/modules/index.html +++ b/public/notebooks/features/modules/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/multiple_token/index.html b/public/notebooks/features/multiple_token/index.html index 274ea64..e8f22b0 100644 --- a/public/notebooks/features/multiple_token/index.html +++ b/public/notebooks/features/multiple_token/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/operations/index.html b/public/notebooks/features/operations/index.html index 2e08c0a..da44ee5 100644 --- a/public/notebooks/features/operations/index.html +++ b/public/notebooks/features/operations/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/remote_execution/index.html b/public/notebooks/features/remote_execution/index.html index 3ec5937..f956be4 100644 --- a/public/notebooks/features/remote_execution/index.html +++ b/public/notebooks/features/remote_execution/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/scan_validate/index.html b/public/notebooks/features/scan_validate/index.html index 1a55ba4..7f6af18 100644 --- a/public/notebooks/features/scan_validate/index.html +++ b/public/notebooks/features/scan_validate/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/sessions/index.html b/public/notebooks/features/sessions/index.html index 6d06d63..75223d2 100644 --- a/public/notebooks/features/sessions/index.html +++ b/public/notebooks/features/sessions/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/features/setting/index.html b/public/notebooks/features/setting/index.html index eb11820..d9b57a7 100644 --- a/public/notebooks/features/setting/index.html +++ b/public/notebooks/features/setting/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/tutorials/activation_patching/index.html b/public/notebooks/tutorials/activation_patching/index.html index c4a74de..6c9be69 100644 --- a/public/notebooks/tutorials/activation_patching/index.html +++ b/public/notebooks/tutorials/activation_patching/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/tutorials/attribution_patching.ipynb b/public/notebooks/tutorials/attribution_patching.ipynb index 6fc071b..27c1bb7 100644 --- a/public/notebooks/tutorials/attribution_patching.ipynb +++ b/public/notebooks/tutorials/attribution_patching.ipynb @@ -128,8 +128,7 @@ ], "source": [ "def get_logit_diff(logits, answer_token_indices=answer_token_indices):\n", - " if len(logits.shape) == 3:\n", - " logits = logits[:, -1, :]\n", + " logits = logits[:, -1, :]\n", " correct_logits = logits.gather(1, answer_token_indices[:, 0].unsqueeze(1))\n", " incorrect_logits = logits.gather(1, answer_token_indices[:, 1].unsqueeze(1))\n", " return (correct_logits - incorrect_logits).mean()\n", @@ -222,13 +221,13 @@ " with tracer.invoke(clean_tokens) as invoker_clean:\n", "\n", " for layer in model.transformer.h:\n", - " attn_out = layer.attn.c_proj.input[0][0]\n", + " attn_out = layer.attn.c_proj.input\n", " clean_out.append(attn_out.save())\n", "\n", " with tracer.invoke(corrupted_tokens) as invoker_corrupted:\n", "\n", " for layer in model.transformer.h:\n", - " attn_out = layer.attn.c_proj.input[0][0]\n", + " attn_out = layer.attn.c_proj.input\n", " corrupted_out.append(attn_out.save())\n", " corrupted_grads.append(attn_out.grad.save())\n", "\n", @@ -2648,7 +2647,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.1.0" + "version": "3.10.13" } }, "nbformat": 4, diff --git a/public/notebooks/tutorials/attribution_patching/index.html b/public/notebooks/tutorials/attribution_patching/index.html index d494eb6..97e694d 100644 --- a/public/notebooks/tutorials/attribution_patching/index.html +++ b/public/notebooks/tutorials/attribution_patching/index.html @@ -60,8 +60,8 @@ - - + + @@ -639,8 +639,7 @@

1️⃣ IOI Patching Setup

def get_logit_diff(logits, answer_token_indices=answer_token_indices):
-    if len(logits.shape) == 3:
-        logits = logits[:, -1, :]
+    logits = logits[:, -1, :]
     correct_logits = logits.gather(1, answer_token_indices[:, 0].unsqueeze(1))
     incorrect_logits = logits.gather(1, answer_token_indices[:, 1].unsqueeze(1))
     return (correct_logits - incorrect_logits).mean()
@@ -721,13 +720,13 @@ 

2️⃣ Attribution Patching Over Components

with tracer.invoke(clean_tokens) as invoker_clean: for layer in model.transformer.h: - attn_out = layer.attn.c_proj.input[0][0] + attn_out = layer.attn.c_proj.input clean_out.append(attn_out.save()) with tracer.invoke(corrupted_tokens) as invoker_corrupted: for layer in model.transformer.h: - attn_out = layer.attn.c_proj.input[0][0] + attn_out = layer.attn.c_proj.input corrupted_out.append(attn_out.save()) corrupted_grads.append(attn_out.grad.save()) diff --git a/public/notebooks/tutorials/boundless_DAS/index.html b/public/notebooks/tutorials/boundless_DAS/index.html index edb0260..7cd5514 100644 --- a/public/notebooks/tutorials/boundless_DAS/index.html +++ b/public/notebooks/tutorials/boundless_DAS/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/tutorials/dict_learning/index.html b/public/notebooks/tutorials/dict_learning/index.html index ec6de37..9ec05de 100644 --- a/public/notebooks/tutorials/dict_learning/index.html +++ b/public/notebooks/tutorials/dict_learning/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/tutorials/logit_lens/index.html b/public/notebooks/tutorials/logit_lens/index.html index aee07f7..1efac0d 100644 --- a/public/notebooks/tutorials/logit_lens/index.html +++ b/public/notebooks/tutorials/logit_lens/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/notebooks/tutorials/walkthrough/index.html b/public/notebooks/tutorials/walkthrough/index.html index 7e87643..b0295d7 100644 --- a/public/notebooks/tutorials/walkthrough/index.html +++ b/public/notebooks/tutorials/walkthrough/index.html @@ -60,8 +60,8 @@ - - + + diff --git a/public/py-modindex/index.html b/public/py-modindex/index.html index 262716f..9d83679 100644 --- a/public/py-modindex/index.html +++ b/public/py-modindex/index.html @@ -55,8 +55,8 @@ - - + + diff --git a/public/search/index.html b/public/search/index.html index 9c2fa68..6898a78 100644 --- a/public/search/index.html +++ b/public/search/index.html @@ -56,8 +56,8 @@ - - + + diff --git a/public/searchindex.js b/public/searchindex.js index 8083de8..b0afee4 100644 --- a/public/searchindex.js +++ b/public/searchindex.js @@ -1 +1 @@ -Search.setIndex({"docnames": ["about", "documentation", "documentation/contexts", "documentation/envoy", "documentation/intervention", "documentation/models", "documentation/patching", "documentation/schema", "documentation/tracing", "documentation/util", "features", "index", "notebooks/features/conditionals", "notebooks/features/cross_prompt", "notebooks/features/custom_functions", "notebooks/features/early_stopping", "notebooks/features/getting", "notebooks/features/gradients", "notebooks/features/iterator", "notebooks/features/lora_training", "notebooks/features/model_editing", "notebooks/features/modules", "notebooks/features/multiple_token", "notebooks/features/operations", "notebooks/features/remote_execution", "notebooks/features/scan_validate", "notebooks/features/sessions", "notebooks/features/setting", "notebooks/tutorials/activation_patching", "notebooks/tutorials/attribution_patching", "notebooks/tutorials/boundless_DAS", "notebooks/tutorials/dict_learning", "notebooks/tutorials/logit_lens", "notebooks/tutorials/walkthrough", "start", "status", "tutorials"], "filenames": ["about.rst", "documentation.rst", "documentation/contexts.rst", "documentation/envoy.rst", "documentation/intervention.rst", "documentation/models.rst", "documentation/patching.rst", "documentation/schema.rst", "documentation/tracing.rst", "documentation/util.rst", "features.rst", "index.rst", "notebooks/features/conditionals.ipynb", "notebooks/features/cross_prompt.ipynb", "notebooks/features/custom_functions.ipynb", "notebooks/features/early_stopping.ipynb", "notebooks/features/getting.ipynb", "notebooks/features/gradients.ipynb", "notebooks/features/iterator.ipynb", "notebooks/features/lora_training.ipynb", "notebooks/features/model_editing.ipynb", "notebooks/features/modules.ipynb", "notebooks/features/multiple_token.ipynb", "notebooks/features/operations.ipynb", "notebooks/features/remote_execution.ipynb", "notebooks/features/scan_validate.ipynb", "notebooks/features/sessions.ipynb", "notebooks/features/setting.ipynb", "notebooks/tutorials/activation_patching.ipynb", "notebooks/tutorials/attribution_patching.ipynb", "notebooks/tutorials/boundless_DAS.ipynb", "notebooks/tutorials/dict_learning.ipynb", "notebooks/tutorials/logit_lens.ipynb", "notebooks/tutorials/walkthrough.ipynb", "start.rst", "status.rst", "tutorials.rst"], "titles": ["About NNsight", "Documentation", "nnsight.contexts", "nnsight.envoy", "nnsight.intervention", "nnsight.models", "nnsight.patching", "nnsight.schema", "nnsight.tracing", "nnsight.util", "Features", "nnsight", "Conditional Interventions", "Cross-Prompt Intervention", "Custom Functions", "Early Stopping", "Getting Values", "Gradients", "Iterative Interventions", "LoRA", "Model Editing", "Modules", "Multiple Token Generation", "Operations", "Remote Execution", "Scan and Validate", "Sessions", "Setting Values", "Activation Patching", "Attribution Patching", "Boundless DAS", "Dictionary Learning", "Logit Lens", "Walkthrough", "Getting Started", "Status", "Tutorials"], "terms": {"can": [0, 2, 3, 5, 8, 12, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35], "you": [0, 2, 5, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36], "studi": 0, "intern": [0, 11, 33, 34], "deep": [0, 33, 34], "network": [0, 11, 28, 30, 33], "too": 0, "larg": [0, 29, 33], "run": [0, 2, 4, 5, 8, 9, 15, 18, 19, 24, 25, 26, 28, 29, 33, 35], "In": [0, 2, 5, 12, 13, 15, 17, 20, 23, 24, 25, 26, 27, 29, 30, 33], "thi": [0, 2, 3, 4, 5, 7, 8, 9, 12, 13, 14, 15, 17, 18, 19, 20, 23, 24, 25, 26, 27, 29, 30, 32, 33], "era": [0, 33], "scale": [0, 18, 33], "learn": [0, 30, 33, 34, 36], "most": [0, 2, 3, 5, 15, 23, 25, 29, 33], "interest": [0, 15, 26, 28, 29, 31, 33], "model": [0, 1, 2, 3, 4, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 34, 35, 36], "ar": [0, 2, 3, 5, 8, 9, 14, 15, 16, 17, 19, 20, 23, 25, 26, 30, 32, 33, 35], "massiv": [0, 33], "hard": [0, 33], "ordinari": [0, 33], "commerci": [0, 33], "infer": [0, 19, 33], "servic": [0, 2, 33], "let": [0, 5, 8, 19, 20, 24, 25, 26, 28, 29, 36], "interact": [0, 2, 4, 5, 8, 17, 33], "huge": [0, 36], "thei": [0, 2, 3, 8, 15, 19, 25, 33], "see": [0, 2, 5, 8, 12, 13, 14, 17, 18, 19, 20, 23, 25, 26, 27, 29, 31, 33, 34], "The": [0, 2, 4, 5, 6, 8, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 32, 33, 35], "librari": [0, 8, 14, 25, 33, 35], "differ": [0, 2, 8, 26, 28, 29, 32, 33], "give": [0, 5, 9, 33, 34], "full": [0, 33, 34], "access": [0, 2, 3, 4, 5, 8, 10, 11, 15, 16, 17, 24, 26, 32, 33], "all": [0, 2, 3, 4, 5, 8, 9, 14, 17, 18, 19, 20, 24, 25, 26, 28, 29, 30, 32, 33, 35], "neural": [0, 11, 30, 33], "when": [0, 2, 3, 4, 5, 8, 13, 19, 20, 22, 24, 25, 29, 33], "togeth": [0, 2, 26, 33], "remot": [0, 2, 5, 10, 19, 26, 30, 35], "like": [0, 4, 5, 12, 17, 19, 21, 25, 29, 33], "nation": [0, 33], "fabric": [0, 33], "ndif": [0, 7, 13, 15, 24, 25, 26, 33, 34, 35], "experi": [0, 26, 28, 33, 35], "open": [0, 2, 5, 13, 19, 22, 24, 33, 34], "easili": [0, 5, 11, 33], "also": [0, 2, 5, 6, 12, 13, 14, 17, 18, 19, 21, 25, 26, 30, 33], "terrif": 0, "smaller": 0, "local": [0, 2, 5, 24, 26, 29, 32, 33, 35], "overview": 0, "pipelin": 0, "research": [0, 33], "write": [0, 30], "simpl": [0, 5, 8, 9, 14, 18, 19, 20, 24, 33], "python": [0, 8, 18, 33], "code": [0, 25, 30, 32, 33], "along": [0, 3, 4, 24, 33], "unlik": [0, 8, 20, 32, 33], "read": [0, 30, 32, 33, 34], "ani": [0, 2, 4, 5, 6, 7, 8, 9, 11, 14, 15, 21, 25, 33], "state": [0, 2, 5, 11, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 33], "being": [0, 4, 22, 26, 33], "creat": [0, 2, 3, 4, 5, 8, 18, 19, 20, 25, 27, 30, 32, 33], "comput": [0, 2, 4, 5, 8, 9, 10, 15, 21, 23, 25, 27, 29, 32, 33], "graph": [0, 2, 3, 4, 5, 7, 8, 10, 14, 18, 19, 23, 25, 33], "sent": [0, 19, 33], "interleav": [0, 4, 5, 33], "execut": [0, 2, 4, 5, 8, 10, 12, 14, 15, 17, 18, 19, 25, 26], "built": [0, 3, 8, 18, 33], "pytorch": [0, 5, 11, 14, 25, 33], "veri": [0, 19, 25, 33], "similar": [0, 30], "your": [0, 5, 20, 24, 25, 26, 32, 33], "own": [0, 19, 25, 26, 33], "workstat": 0, "fact": [0, 33], "same": [0, 2, 8, 9, 13, 24, 25, 26, 29, 32, 33], "small": [0, 29, 36], "just": [0, 5, 8, 12, 17, 19, 24, 25, 26, 28, 29, 33], "chang": [0, 19, 20, 23, 25, 27, 29, 33], "few": [0, 5, 33], "argument": [0, 2, 3, 5, 8, 9, 14, 33], "between": [0, 2, 8, 13, 20, 26, 28, 29, 30, 33], "normal": [0, 8, 17, 19, 25, 28, 32, 33], "treat": 0, "opaqu": 0, "instead": [0, 5, 9, 15, 29, 33], "set": [0, 2, 3, 4, 5, 8, 10, 12, 13, 14, 15, 17, 18, 19, 20, 22, 24, 25, 26, 29, 30, 32], "up": [0, 5, 8, 24, 28, 29, 31, 33], "context": [0, 1, 3, 4, 5, 6, 8, 12, 14, 15, 16, 17, 18, 19, 20, 24, 25, 26, 28, 30], "enabl": [0, 2, 4, 5, 8, 11, 20, 25, 26, 30, 33], "get": [0, 2, 3, 4, 5, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 36], "direct": [0, 5, 8, 33], "while": [0, 2, 9, 22, 29, 32, 33], "here": [0, 2, 5, 13, 18, 19, 21, 22, 25, 28, 29, 30, 32, 33], "look": [0, 5, 21, 26, 28, 33], "from": [0, 2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "import": [0, 5, 8, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "languagemodel": [0, 2, 5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32], "meta": [0, 2, 3, 5, 24, 25, 26, 33], "llama": [0, 24, 26, 33], "2": [0, 2, 5, 8, 12, 13, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 36], "70b": [0, 24, 26, 33], "hf": 0, "trace": [0, 1, 2, 4, 5, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 32], "eiffel": [0, 4, 5, 11, 12, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 32, 33], "tower": [0, 4, 5, 11, 12, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 32, 33], "citi": [0, 4, 5, 11, 12, 13, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 32, 33], "true": [0, 2, 5, 7, 8, 12, 13, 14, 17, 18, 19, 20, 24, 25, 26, 29, 30, 31, 32, 33], "hidden_st": [0, 4, 16, 17, 21, 23, 24, 33], "layer": [0, 15, 17, 19, 21, 22, 24, 26, 28, 29, 30, 31, 33], "10": [0, 5, 12, 13, 19, 22, 24, 25, 30, 32, 33], "input": [0, 2, 3, 4, 5, 8, 9, 11, 16, 17, 19, 25, 28, 29, 30, 32, 33], "0": [0, 3, 5, 8, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "save": [0, 2, 4, 5, 8, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "one": [0, 2, 3, 4, 5, 8, 9, 10, 12, 15, 19, 22, 24, 25, 26, 28, 29, 30, 33], "hidden": [0, 5, 11, 16, 17, 19, 20, 21, 22, 23, 25, 26, 27, 28, 33], "11": [0, 5, 17, 20, 22, 24, 25, 26, 27, 30, 32, 33], "mlp": [0, 3, 5, 11, 19, 29, 31, 32, 33], "output": [0, 2, 3, 4, 5, 8, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "modul": [0, 2, 3, 4, 5, 6, 8, 9, 10, 11, 15, 16, 19, 22, 25, 33], "print": [0, 2, 4, 5, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33], "predict": [0, 19, 20, 26, 28, 32, 33], "wa": [0, 5, 8, 12, 14, 15, 18, 19, 20, 22, 24, 25, 26, 29, 33], "easi": [0, 2, 33], "huggingfac": [0, 5, 12, 14, 18, 19, 20, 24, 25, 26, 29, 32, 33], "load": [0, 5, 24, 28, 30, 31, 32, 33], "object": [0, 2, 3, 4, 5, 6, 8, 9, 11, 14, 16, 18, 19, 26, 28, 29, 32, 33], "line": [0, 15, 25, 33], "notic": [0, 33], "we": [0, 3, 4, 5, 8, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33], "70": [0, 21], "billion": 0, "paramet": [0, 2, 3, 4, 5, 6, 8, 9, 19, 24, 30, 33], "which": [0, 2, 3, 5, 8, 9, 18, 19, 20, 21, 29, 30, 33, 35], "ordinarili": 0, "pretti": [0, 33], "difficult": 0, "regular": 0, "sinc": [0, 9, 15, 26, 29, 33], "would": [0, 5, 8, 14, 15, 17, 19, 31, 33], "take": [0, 2, 5, 9, 20, 26, 29, 33], "140": 0, "280": 0, "gigabyt": 0, "gpu": [0, 5, 33], "ram": 0, "store": [0, 2, 4, 8, 15, 26, 28, 33], "trick": [0, 33], "u": [0, 5, 17, 18, 21, 24, 25, 27, 31, 32, 33], "work": [0, 2, 13, 15, 17, 23, 24, 25, 32, 33], "3": [0, 5, 13, 15, 16, 17, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36], "flag": [0, 18, 25, 33], "indic": [0, 4, 5, 31, 33], "want": [0, 2, 8, 12, 13, 17, 18, 25, 27, 29, 33], "actual": [0, 2, 8, 19, 21, 24, 28, 33], "By": [0, 8, 23, 32, 33], "default": [0, 2, 3, 4, 5, 7, 8, 12, 14, 17, 18, 19, 20, 24, 25, 33], "If": [0, 2, 3, 4, 5, 8, 9, 10, 12, 13, 15, 17, 20, 25, 29, 33], "quickli": 0, "could": [0, 5, 13, 15, 19, 29, 32, 33], "leav": [0, 25, 30, 33], "fals": [0, 2, 3, 5, 7, 8, 9, 12, 14, 18, 19, 20, 24, 25, 26, 29, 30, 31, 32, 33], "Then": [0, 19, 25, 29, 33], "invok": [0, 2, 5, 11, 13, 25, 28, 29, 30, 31, 32, 33], "call": [0, 2, 3, 4, 5, 6, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33], "function": [0, 2, 3, 4, 5, 6, 7, 8, 9, 10, 18, 19, 29, 32, 34], "manag": [0, 2, 4, 5, 6, 35], "reason": [0, 23], "doe": [0, 2, 8, 14, 32, 33], "provid": [0, 2, 4, 5, 17, 25, 30, 32, 33, 34], "4": [0, 16, 19, 23, 24, 25, 27, 28, 30, 31, 32, 33], "6": [0, 16, 19, 23, 24, 25, 27, 30, 32, 33], "On": [0, 2, 33], "grab": [0, 8, 13, 28, 33], "5": [0, 5, 12, 15, 16, 17, 19, 23, 24, 25, 26, 27, 30, 31, 32, 33], "insid": [0, 12, 18, 33], "transform": [0, 3, 5, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 32, 33], "block": [0, 5, 13, 33], "through": [0, 2, 4, 5, 9, 25, 28, 32, 33, 34], "calcul": [0, 28], "complet": [0, 4, 8, 24, 26, 29, 30, 33], "defin": [0, 2, 7, 8, 9, 14, 15, 18, 19, 20, 26, 28, 30, 33], "server": [0, 10, 19, 26, 33, 35], "": [0, 2, 3, 4, 5, 8, 9, 15, 16, 17, 19, 20, 21, 24, 25, 26, 28, 29, 30, 31, 32, 36], "done": [0, 5, 8, 15, 29, 33], "result": [0, 2, 4, 8, 15, 18, 22, 24, 26, 27, 32, 33], "shown": [0, 13], "7": [0, 16, 19, 22, 23, 24, 25, 27, 28, 30, 33], "8": [0, 12, 16, 19, 22, 23, 24, 25, 27, 28, 30, 31, 32, 33], "help": [0, 20, 25, 33], "understand": [0, 32, 33], "oper": [0, 2, 5, 8, 10, 13, 14, 17, 18, 19, 25, 27, 29, 35], "immedi": [0, 5, 33], "add": [0, 2, 3, 4, 6, 8, 10, 14, 23, 25, 27, 28, 33], "intervent": [0, 1, 2, 3, 5, 8, 10, 11, 14, 15, 19, 20, 22, 25, 26, 28, 30, 36], "alongsid": [0, 33], "upon": [0, 2, 4, 33], "exit": [0, 2, 4, 16, 18, 26, 33], "exampl": [0, 2, 4, 5, 8, 12, 15, 17, 23, 25, 26, 27, 30, 33], "seen": 0, "below": [0, 15, 29, 30, 33], "node": [0, 2, 4, 5, 7, 8, 15, 25, 30, 33], "depend": [0, 2, 4, 5, 8, 12, 25, 33], "well": [0, 2, 5, 8, 14, 25, 33], "other": [0, 8, 14, 26, 33], "chosen": 0, "request": [0, 3, 4, 10, 25, 26, 30, 33], "inject": [0, 4, 8, 33], "basic": [0, 5, 23, 33, 34, 36], "lot": [0, 33], "insight": [0, 32, 33], "go": [0, 19, 24, 33], "For": [0, 2, 5, 9, 12, 14, 18, 19, 20, 22, 25, 29, 33], "logit": [0, 4, 5, 17, 19, 24, 28, 29, 30, 33, 36], "len": [0, 25, 28, 29, 30, 36], "text": [0, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "And": [0, 26, 33], "causal": [0, 30, 36], "path": [0, 3, 4, 5, 8, 9], "patch": [0, 1, 36], "circuit": [0, 29], "discoveri": [0, 29], "method": [0, 2, 4, 5, 8, 9, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32], "locat": [0, 13, 20, 33], "compon": [0, 29, 33], "within": [0, 2, 3, 8, 9, 12, 13, 14, 15, 17, 18, 20, 26, 28, 32, 33], "plai": 0, "decis": 0, "role": 0, "make": [0, 2, 4, 5, 10, 19, 20, 25, 28, 29, 33], "gradient": [0, 5, 8, 10, 29], "optim": [0, 19, 26, 30, 33], "out": [0, 2, 5, 6, 8, 14, 17, 18, 19, 21, 22, 25, 29, 33, 34], "order": [0, 2, 3, 4, 5, 8, 15, 21, 26, 33], "applic": [0, 14, 33], "cross": [0, 10, 19, 33], "prompt": [0, 2, 5, 10, 19, 22, 28, 29, 30, 31, 32, 33], "mani": [0, 2, 4, 8, 10, 18], "more": [0, 3, 5, 8, 12, 14, 18, 19, 20, 22, 25, 29, 30, 32, 33], "featur": [0, 20, 25, 31, 33, 34], "start": [0, 7, 11, 24, 26, 30, 36], "page": [0, 33], "inform": [0, 2, 4, 8, 25, 27, 29, 33], "project": [0, 15, 25, 29, 33, 34], "current": [0, 2, 3, 4, 8, 24, 25, 26, 33], "alpha": [0, 19, 33], "pre": [0, 2, 8, 13, 33], "releas": [0, 8, 30], "earli": [0, 8, 10, 18, 26], "user": [0, 3, 4, 5, 8, 13, 19, 25, 26, 33], "contributor": 0, "contribut": [0, 29, 33], "feedback": [0, 33], "join": [0, 33], "discord": [0, 33], "updat": [0, 2, 4, 8, 9, 12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 30, 31, 32, 33], "bug": 0, "report": 0, "opportun": 0, "effort": 0, "nnsight": [1, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34], "envoi": [1, 2, 5, 8, 19, 33], "schema": 1, "util": [1, 19, 25, 28, 30, 32, 33], "contain": [2, 4, 5, 8, 19, 30, 33], "logic": [2, 4, 8, 33], "primari": [2, 4, 5], "two": [2, 8, 12, 13, 17, 28, 29, 30, 33], "class": [2, 3, 4, 5, 6, 7, 8, 9, 11, 19, 33], "involv": [2, 4, 8, 36], "tracer": [2, 3, 5, 7, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 32, 33], "around": [2, 5, 33], "underli": [2, 3, 5, 8, 15, 33], "an": [2, 3, 4, 5, 6, 7, 8, 9, 15, 17, 18, 19, 20, 24, 25, 26, 29, 30, 31, 33, 35], "track": [2, 4, 5, 8], "perform": [2, 5, 9, 17], "said": [2, 8, 36], "expos": [2, 11, 16, 18, 33], "attribut": [2, 3, 4, 5, 6, 8, 9, 16, 17, 32, 33, 36], "To": [2, 24, 26, 30, 32, 33, 34, 35], "do": [2, 3, 5, 10, 14, 15, 17, 19, 21, 24, 25, 28, 29, 33], "need": [2, 4, 5, 9, 10, 14, 19, 20, 24, 25, 28, 29, 30, 33], "know": [2, 19, 33], "about": [2, 4, 7, 11, 30, 31, 32, 33], "so": [2, 3, 4, 5, 8, 16, 19, 24, 25, 29, 33], "each": [2, 5, 8, 18, 22, 26, 29, 30, 32, 33], "i": [2, 3, 4, 5, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 36], "keep": [2, 4, 25, 33], "batch_siz": [2, 4, 19, 30, 33], "recent": [2, 3, 15, 25, 33], "gener": [2, 3, 4, 5, 8, 10, 13, 19, 32, 33, 35], "index": [2, 4, 5, 8, 19, 25, 28, 32, 33], "multi": [2, 33], "iter": [2, 3, 4, 7, 10, 19, 28, 33], "made": [2, 12, 20, 33], "dure": [2, 8, 15, 17, 21, 27, 33], "its": [2, 5, 8, 14, 16, 20, 24, 25, 26, 29, 33], "batched_input": 2, "ad": [2, 4, 5, 8, 18, 19, 23, 33], "should": [2, 3, 4, 5, 7, 8, 9, 19, 22, 25, 33], "format": [2, 7, 30, 33], "where": [2, 5, 8, 15, 17, 25, 28, 29, 30, 33], "batch": [2, 4, 5, 19, 28, 29, 30], "allow": [2, 4, 5, 8, 18, 20, 21, 25, 33, 35], "thing": [2, 10, 17, 21, 33], "consist": 2, "valid": [2, 5, 8, 10, 24, 30, 33], "both": [2, 4, 5, 19, 33], "becom": 2, "case": [2, 5, 8, 13, 19, 29, 33], "regardless": 2, "whether": [2, 8, 30], "string": [2, 3, 5, 9, 32, 33], "process": [2, 5, 8, 17, 24, 26, 32, 33], "dictionari": [2, 4, 7, 8, 33, 36], "id": [2, 5, 7, 8, 19, 32, 33], "onli": [2, 3, 4, 5, 8, 9, 12, 15, 19, 22, 24, 25, 27, 30, 33], "us": [2, 4, 5, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35], "carri": [2, 6, 8], "what": [2, 5, 19, 25, 27, 28, 32, 33], "accept": 2, "parent": [2, 5, 6, 8], "appropri": [2, 5, 8, 30, 33], "respect": [2, 3, 29, 33], "enter": [2, 5, 13, 28, 33], "some": [2, 5, 8, 9, 19, 25, 31, 33], "leverag": [2, 5, 33], "prepar": [2, 5, 8, 33], "version": [2, 5, 8, 13, 20, 26, 29, 32, 33], "size": [2, 4, 12, 22, 25, 33], "It": [2, 12, 14, 18, 19, 20, 24, 25, 26, 31, 33], "meta_model": [2, 5], "dtype": [2, 4, 7, 24, 33], "base": [2, 4, 5, 8, 18, 20, 30, 33], "characterist": 2, "come": [2, 13, 33], "extens": 2, "remotetrac": 2, "check_for_depend": 2, "data": [2, 4, 7, 9, 19, 25, 26, 30, 33], "tupl": [2, 3, 4, 5, 7, 28, 30, 33], "bool": [2, 3, 5, 7, 8, 9, 33], "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 24, 30, 33, 34], "check": [2, 3, 4, 8, 12, 14, 18, 19, 20, 25, 29, 33, 34], "proxi": [2, 3, 4, 5, 8, 14, 15, 17, 23, 25, 28, 33], "convert": [2, 8], "them": [2, 4, 5, 8, 9, 13, 14, 23, 25, 28, 30, 33], "bridg": [2, 8], "lock": [2, 8], "later": [2, 26, 33], "valu": [2, 4, 5, 7, 8, 10, 13, 15, 17, 19, 23, 25, 26, 28, 29, 30, 31, 32, 33], "return": [2, 3, 4, 5, 8, 9, 14, 15, 19, 22, 25, 29, 30, 33], "replac": [2, 6, 7, 8, 13, 19, 25, 26, 33], "were": [2, 5, 8, 15, 28, 33], "type": [2, 3, 4, 5, 6, 7, 8, 9, 15, 25, 32, 33], "resolve_depend": [2, 33], "turn": [2, 25, 33], "find": [2, 28, 29, 30, 31, 32, 33], "resolv": 2, "backend": [2, 5, 25, 33], "none": [2, 3, 4, 5, 6, 7, 8, 19, 25, 30, 33], "return_context": [2, 5, 18, 19, 33], "kwarg": [2, 3, 4, 5, 7, 8, 9, 25, 33], "_model": [2, 5, 33], "nnsightmodel": [2, 5, 33], "th": 2, "_graph": 2, "_arg": [2, 5], "posit": [2, 3, 5, 8, 12, 19, 28, 29, 30, 32, 33], "pass": [2, 3, 4, 5, 8, 9, 10, 15, 17, 18, 20, 28, 29, 33], "list": [2, 3, 4, 5, 6, 7, 8, 9, 18, 30, 32, 33], "_kwarg": [2, 5, 33], "keyword": [2, 5, 8, 33], "dict": [2, 4, 5, 7, 8, 9, 33], "str": [2, 3, 4, 5, 6, 7, 8, 9, 15, 25, 33], "_invoker_input": 2, "invoc": [2, 13, 28], "_invok": 2, "edit_backend_execut": 2, "handl": [2, 4, 5, 6, 8, 26, 33], "editmixin": 2, "edit": [2, 4, 5, 10, 11, 27], "dor": 2, "given": [2, 4, 8, 9, 11, 25, 28, 29, 32, 33], "rais": [2, 5, 8, 15, 25, 30, 33], "except": [2, 7, 8, 33], "alreadi": [2, 3, 4, 5, 8, 24, 26, 33], "local_backend_execut": [2, 33], "remotemixin": 2, "next": [2, 8, 20, 22, 32], "increment": [2, 4, 8, 33], "int": [2, 3, 4, 5, 7, 8, 12, 19, 30, 33], "1": [2, 5, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36], "call_it": [2, 4], "how": [2, 4, 8, 19, 20, 22, 23, 25, 29, 30, 31, 32, 33], "onc": [2, 3, 16, 24, 25, 33], "remote_backend_get_model_kei": 2, "model_kei": 2, "specifi": [2, 8, 12, 14, 24, 32, 33], "kei": [2, 4, 5, 6, 24, 25, 29, 33, 35], "remote_backend_handle_result_valu": 2, "postprocess": 2, "remote_backend_postprocess_result": 2, "local_result": 2, "move": [2, 8, 26, 29, 33], "tensor": [2, 3, 4, 5, 7, 8, 10, 12, 13, 14, 16, 17, 19, 21, 22, 23, 24, 25, 27, 29, 30, 33], "cpu": [2, 29, 30, 31, 33], "detach": [2, 29, 30, 32], "etc": [2, 8, 26, 33], "post": [2, 29, 32, 33], "scan": [2, 5, 10, 19, 30, 33], "meant": 2, "tandem": 2, "initi": [2, 3, 5, 22, 33], "_prepare_input": [2, 5], "faketensor": [2, 8], "potenti": [2, 4, 19, 30, 33], "correctli": [2, 25, 33], "free": [2, 8, 30, 35], "wise": 2, "mai": [2, 33], "loop": [2, 10, 18, 19, 25], "shape": [2, 3, 4, 5, 8, 10, 17, 19, 22, 25, 27, 29, 30, 33], "error": [2, 8, 25, 33], "have": [2, 4, 5, 8, 12, 13, 19, 25, 26, 29, 31, 33], "first": [2, 3, 4, 5, 9, 13, 15, 17, 19, 28, 36], "graphbasedcontext": [2, 25, 33], "globaltracingcontext": [2, 25, 33], "global": 2, "without": [2, 19, 20, 26, 33, 35], "refer": [2, 3, 4, 7, 8, 26, 33], "There": [2, 5, 8, 17, 33], "global_tracing_context": [2, 25, 33], "torch_handl": 2, "torch": [2, 3, 4, 5, 8, 9, 11, 12, 14, 17, 19, 21, 22, 23, 24, 27, 29, 30, 31, 32, 33], "globaltracingexit": [2, 25, 33], "globaltracingtorchhandl": [2, 25, 33], "static": 2, "deregist": 2, "graph_based_context": 2, "regist": [2, 4, 9, 35], "try_deregist": 2, "attempt": [2, 4, 8, 25, 33], "Will": 2, "w": 2, "success": [2, 33], "otherwis": [2, 3, 4, 5, 8, 25, 30, 33], "try_regist": 2, "appli": [2, 4, 5, 8, 9, 10, 14, 19, 20, 21, 22, 25, 28, 29, 32, 33], "target": [2, 7, 8, 9, 25, 33], "callabl": [2, 3, 4, 5, 8, 9, 32], "arg": [2, 3, 4, 5, 7, 8, 9, 19, 25, 33], "interventionproxi": [2, 3, 4, 5, 8], "helper": [2, 5], "directli": [2, 5, 8, 20, 25, 33], "try": [2, 8, 25, 33], "fakemod": 2, "test": [2, 5, 13, 30], "traceabl": [2, 8, 33], "bridge_backend_handl": 2, "self": [2, 5, 15, 19, 25, 33], "capac": 2, "bytearrai": [2, 33], "byte": [2, 33], "complex": [2, 8, 11, 33], "number": [2, 5, 8, 30, 31, 33], "cond": [2, 12, 18, 33], "condit": [2, 7, 8, 10], "entrypoint": [2, 5], "act": [2, 3, 5, 32, 33], "evalu": [2, 8, 30], "boolean": [2, 8, 30, 33], "bodi": [2, 18, 33], "union": [2, 4, 5, 7, 8, 25, 33], "setup": [2, 8, 36], "ex": [2, 4, 8], "sequenti": [2, 5, 7, 8, 11, 19, 26, 33], "earlystopprotocol": [2, 8, 33], "float": [2, 7, 19, 33], "log": [2, 7, 8, 12, 18, 19, 26, 33], "via": [2, 4, 5, 8, 17, 18, 24, 33], "vi": [2, 8], "visual": [2, 4, 8], "A": [2, 8, 18, 22, 25, 29, 33], "conting": 2, "_condit": 2, "conditionalmanag": [2, 8], "attach": [2, 4, 5, 8, 15, 25, 33], "_conditional_dict": 2, "map": [2, 4, 7, 8, 30], "conditionalprotocol": [2, 8], "name": [2, 3, 4, 5, 7, 8, 14, 15, 25, 29, 33], "_conditioned_nodes_dict": 2, "condition": 2, "_conditional_stack": 2, "stack": [2, 8, 31], "visit": [2, 8], "conditonalprotocol": 2, "add_conditioned_nod": [2, 8], "conditon": [2, 8], "latest": [2, 8], "is_node_condit": [2, 8], "peek": 2, "lastest": 2, "non": [2, 33], "empti": 2, "option": [2, 3, 4, 5, 8, 19, 20, 32, 33], "pop": [2, 8], "push": 2, "conditional_nod": 2, "session": [2, 5, 7, 10, 18, 19, 32], "root": [2, 3, 4, 8, 9, 33], "collect": [2, 3, 4, 5, 8, 9, 25, 30, 33], "new": [2, 4, 5, 8, 12, 13, 17, 19, 20, 25, 27, 33], "subsequ": [2, 4, 22, 33], "referenc": 2, "item": [2, 14, 18, 28, 29, 30, 31, 33], "over": [2, 5, 18, 19, 29, 33], "module_path": [3, 4, 8, 33], "tree": [3, 21], "repres": [3, 5, 6, 8, 28, 30], "rel": [3, 4, 8], "separ": [3, 8, 9, 14, 29, 33], "e": [3, 9, 26, 33], "x": [3, 5, 8, 9, 28, 30, 32, 33], "h": [3, 5, 9, 11, 14, 15, 16, 17, 19, 20, 21, 22, 23, 25, 27, 28, 29, 32, 33], "_fake_output": 3, "_scan": 3, "multipl": [3, 5, 8, 10, 20, 26, 28, 33], "than": [3, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33], "_fake_input": 3, "reset": [3, 5, 8], "forward": [3, 5, 8, 9, 15, 19, 20, 28, 29, 30, 33], "_call_it": 3, "integ": [3, 12, 33], "_tracer": 3, "must": [3, 8, 14, 33], "manual": [3, 33], "properti": [3, 4, 5, 8, 15, 33], "denot": [3, 4, 22], "wish": [3, 4, 5, 20, 33], "therefor": [3, 4, 8, 14, 15, 33], "time": [3, 4, 5, 8, 10, 12, 19, 31, 33], "include_fn": 3, "ran": [3, 33], "against": 3, "includ": [3, 17, 33], "final": [3, 5, 33], "itself": [3, 5, 8, 19, 33], "named_modul": 3, "overrid": [3, 5], "nn": [3, 4, 5, 8, 11, 19, 30, 31, 32, 33], "extend": [4, 18, 33], "easier": 4, "interven": [4, 10, 13, 27, 33], "entri": 4, "hook": [4, 5, 8, 9, 29, 33], "hookmodel": 4, "remov": [4, 5, 8, 13, 20, 33], "hookhandl": [4, 5, 33], "module_kei": 4, "input_hook": [4, 33], "output_hook": [4, 33], "__enter__": [4, 6, 25, 33], "__exit__": [4, 6, 25, 33], "design": [4, 33], "signatur": 4, "removablehandl": 4, "interventionhandl": [4, 5, 33], "batch_group": [4, 33], "interventionprotocol": [4, 33], "total": [4, 14, 33], "counter": 4, "ha": [4, 5, 8, 9, 24, 26, 30, 33], "been": [4, 5, 8, 9, 15, 19, 24, 26, 33], "count": [4, 8], "tri": [4, 33], "protocol": [4, 8, 33], "overal": 4, "classmethod": [4, 8], "proxy_valu": [4, 8, 15, 25, 33], "module1": [4, 8], "module2": [4, 8], "_description_": [4, 5], "get_intervent": [4, 33], "interventionnod": 4, "activ": [4, 5, 26, 29, 31, 32, 33, 36], "intervention_handl": [4, 33], "form": [4, 5, 8, 14, 33], "exist": [4, 5, 8, 32], "batch_start": 4, "readi": [4, 8], "yet": [4, 5, 32, 33], "continu": [4, 30, 33], "narrow": [4, 33], "select": 4, "relev": [4, 8, 33], "view": [4, 8, 25, 30, 33], "oppos": 4, "copi": [4, 5, 8, 30], "downstream": [4, 5], "origin": [4, 5, 6, 8, 11, 13, 20, 25, 26, 30, 33], "prevent": [4, 31], "effect": [4, 11, 20, 29, 33], "bath": 4, "outsid": [4, 8, 33], "preview": 4, "either": [4, 5, 24, 26, 33], "handler": 4, "modifi": [4, 20, 25, 26, 33], "style": [4, 8], "sub": [4, 5, 8, 33], "addit": [4, 19, 26, 33], "delet": [4, 16, 33], "listen": [4, 8, 33], "lm_head": [4, 5, 11, 19, 20, 21, 26, 28, 29, 32, 33], "devic": [4, 5, 8, 14, 16, 17, 21, 22, 23, 25, 27, 30, 33], "retriev": [4, 9, 19, 33], "real": [4, 5, 25, 30, 33], "grad": [4, 8, 17, 29, 33], "stop": [4, 7, 8, 10, 26], "after": [4, 5, 9, 16, 17, 19, 22, 24, 26, 28, 29, 32, 33], "creation": 4, "updateprotocol": [4, 8], "main": [5, 33], "wrap": [5, 8, 9, 11, 14, 33], "gpt2": [5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 33, 36], "repo": 5, "device_map": [5, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33], "cuda": [5, 16, 17, 21, 22, 23, 27, 28, 30, 31], "declar": 5, "entail": 5, "automodelforcausallm": [5, 33], "unus": [5, 30], "acceler": 5, "packag": [5, 9, 11, 12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 32, 33, 34], "encompass": 5, "displai": [5, 8, 32, 33], "structur": 5, "abil": [5, 29], "gpt2lmheadmodel": [5, 32, 33], "gpt2model": [5, 32, 33], "wte": [5, 13, 32, 33], "embed": [5, 13, 32, 33], "50257": [5, 32, 33], "768": [5, 19, 22, 25, 32, 33], "wpe": [5, 32, 33], "1024": [5, 19, 32, 33], "drop": [5, 32, 33], "dropout": [5, 32, 33], "p": [5, 32, 33], "inplac": [5, 9, 20, 32, 33], "modulelist": [5, 32, 33], "12": [5, 12, 14, 18, 19, 20, 21, 25, 26, 29, 30, 32, 33], "gpt2block": [5, 32, 33], "ln_1": [5, 32, 33], "layernorm": [5, 32, 33], "ep": [5, 32, 33], "1e": [5, 30, 32, 33], "05": [5, 32, 33], "elementwise_affin": [5, 32, 33], "attn": [5, 29, 32, 33], "gpt2attentionalt": 5, "c_attn": [5, 32, 33], "conv1d": [5, 32, 33], "c_proj": [5, 29, 32, 33], "attn_dropout": [5, 32, 33], "resid_dropout": [5, 32, 33], "queri": 5, "wrappermodul": [5, 9, 32, 33], "ln_2": [5, 32, 33], "gpt2mlp": [5, 32, 33], "c_fc": [5, 32, 33], "newgeluactiv": [5, 32, 33], "ln_f": [5, 21, 32, 33], "linear": [5, 11, 29, 31, 32, 33], "in_featur": [5, 31, 32, 33], "out_featur": [5, 31, 32, 33], "bia": [5, 31, 32, 33], "explicit": [5, 33], "control": [5, 33], "level": [5, 9, 15, 30, 33], "specif": [5, 29, 33], "spawn": 5, "runner": [5, 24, 33], "metadispatch": 5, "_dispatch_kei": 5, "becaus": [5, 28], "evil": 5, "ty": 5, "caden": [5, 17, 27, 31], "implement": [5, 8, 34], "wrapper": [5, 9, 33], "gain": [5, 32], "proxy_class": [5, 8, 25, 33], "_model_kei": 5, "kind": [5, 9, 18, 33], "usual": [5, 12, 21, 33], "hug": [5, 32], "face": [5, 32], "checkpoint": [5, 31], "custom": [5, 10], "_dispatch": 5, "_custom_model": 5, "repoid_path_model": 5, "_envoi": [5, 25, 33], "_session": 5, "clear_edit": [5, 20, 33], "dispatch_model": 5, "dispatch": [5, 29, 30, 32, 33], "_load": 5, "futur": 5, "place": [5, 17, 19, 20, 33], "editor": [5, 20, 33], "_execut": [5, 33], "raw": 5, "openai": [5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 32, 33], "commun": [5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 32, 33], "complexmodul": 5, "def": [5, 14, 15, 19, 25, 29, 30, 33], "__init__": [5, 8, 9, 19, 25, 33], "super": [5, 19, 25, 33], "l0": 5, "gpt2_edit": 5, "msg_prompt": 5, "clone": [5, 17, 25, 27, 33, 34], "original_output": [5, 25], "edited_output": 5, "fn": [5, 8, 9, 33], "intervention_graph": [5, 33], "re": [5, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "compil": 5, "last": [5, 8, 15, 17, 19, 20, 21, 22, 25, 26, 33], "total_batch_s": 5, "garbag": 5, "clear": [5, 20, 33], "memori": [5, 8, 25, 30, 33], "group": 5, "alia": 5, "popul": [5, 8, 15, 16, 19, 33], "fake": [5, 8, 25, 33], "tenor": 5, "dim": [5, 11, 19, 20, 21, 25, 26, 29, 30, 31, 32, 33], "noop": 5, "remotebackend": 5, "url": 5, "invoker_arg": [5, 33], "short": 5, "inspect": [5, 8, 15, 25, 33], "complic": 5, "prepare_input": [5, 8, 25, 33], "valueerror": [5, 8, 15, 33], "noth": [5, 8, 31], "wai": [5, 17, 19, 25, 28, 31, 33], "extrem": 5, "our": [5, 10, 12, 14, 19, 25, 26, 28, 29, 30, 33], "ordereddict": [5, 11, 33], "input_s": [5, 11, 33], "hidden_dim": [5, 11, 33], "output_s": [5, 11, 33], "layer1": [5, 11, 33], "sigma1": 5, "sigmoid": 5, "layer2": [5, 11, 33], "sigma2": 5, "example_input": 5, "rand": [5, 12, 33], "singl": [5, 8, 18, 26, 30, 33], "l2_input": [5, 33], "l2_output": 5, "second": [5, 13, 17, 33], "divid": 5, "scope": [5, 33], "inner": [5, 19, 32, 33], "simpli": [5, 19, 24, 33], "expect": [5, 20, 33], "example_input2": 5, "output1": 5, "output2": 5, "languag": [5, 24, 33], "token": [5, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "custom_model": 5, "generationmixin": 5, "config": [5, 7, 24, 26, 28, 30, 33], "file": [5, 15, 24, 25, 33], "repositori": 5, "pretrainedconfig": 5, "lm": 5, "pretrainedtoken": 5, "automodel": 5, "auto": [5, 12, 13, 14, 15, 17, 18, 19, 20, 25, 26, 27, 29, 31, 32, 33], "pretrainedmodel": 5, "languagemodelproxi": 5, "idx": [5, 30, 33], "t": [5, 8, 14, 19, 25, 26, 28, 29, 31, 32, 33], "pad": [5, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33], "mean": [5, 8, 25, 26, 29, 33], "shift": [5, 32], "care": [5, 9, 33], "_type_": 5, "tokenindex": 5, "dimens": [5, 19, 25, 29, 30, 31, 33], "neg": 5, "left": [5, 22, 30], "equival": 5, "aid": 5, "unifiedtransform": 5, "transformerlen": 5, "hookedtransform": 5, "constructor": 5, "from_pretrained_no_process": 5, "from_pretrain": 5, "obj": [6, 33], "restor": [6, 20, 33], "patcher": [6, 25, 33], "apiconfigmodel": 7, "host": [7, 26, 33], "dev": 7, "ssl": 7, "apikei": 7, "job_id": 7, "model_config": 7, "classvar": 7, "configdict": 7, "configur": [7, 24, 33], "conform": 7, "pydant": 7, "model_field": 7, "fieldinfo": 7, "annot": [7, 32], "nonetyp": 7, "requir": [7, 24, 29, 31, 33, 35], "metadata": 7, "field": [7, 30, 33], "__fields__": 7, "v1": 7, "appconfigmodel": 7, "remote_log": 7, "configmodel": 7, "api": [7, 24, 33, 35], "app": 7, "respons": [7, 8, 29, 30], "responsemodel": 7, "statu": [7, 33], "jobstatu": 7, "descript": 7, "receiv": [7, 24, 26, 33], "datetim": 7, "session_id": 7, "enumer": [7, 28, 30, 32], "resultmodel": 7, "basennsightmodel": 7, "type_nam": 7, "liter": 7, "arbitrary_types_allow": 7, "dictmodel": 7, "tracermodel": 7, "iteratormodel": 7, "sessionmodel": 7, "nodemodel": 7, "slicemodel": 7, "tensormodel": 7, "primitivemodel": 7, "tuplemodel": 7, "listmodel": 7, "ellipsismodel": 7, "discrimin": 7, "aftervalid": 7, "slice": 7, "strict": 7, "ellipsi": 7, "functionmodel": 7, "function_nam": 7, "functionwhitelisterror": 7, "graphmodel": 7, "forwardref": 7, "graphtyp": 7, "node_refer": 7, "nodereferencetyp": 7, "primitivetyp": 7, "valuetyp": 7, "builtin_function_or_method": 7, "method_descriptor": 7, "primit": 7, "step": [7, 19, 23, 30, 31, 32, 33], "invoker_input": [7, 33], "individu": [8, 29], "graph_id": 8, "compos": [8, 33], "preserv": [8, 20, 33], "extra": 8, "aliv": [8, 25, 33], "consid": [8, 29], "still": [8, 32, 33], "name_idx": 8, "target_nam": 8, "previou": [8, 33], "uniqu": 8, "possibl": [8, 13, 24, 26, 33], "essenti": 8, "faketensormod": [8, 25, 33], "catch": [8, 25, 33], "fulfil": [8, 33], "These": 8, "construct": 8, "recurs": 8, "newli": [8, 25, 33], "titl": [8, 28, 29, 32], "graphic": 8, "pygraphviz": 8, "param": [8, 30], "directori": 8, "content": 8, "show": [8, 19, 28, 29, 32, 33], "imag": 8, "action": [8, 33], "AND": 8, "ones": [8, 33], "datatyp": [8, 33], "set_valu": [8, 33], "bi": 8, "similarli": [8, 33], "ceas": 8, "destroi": [8, 15, 33], "remain": 8, "weak": 8, "arg_depend": [8, 33], "cond_depend": 8, "weakref": 8, "dead": 8, "clean": [8, 28, 29], "v": [8, 24, 30, 33], "assum": [8, 17, 33], "destruct": 8, "els": [8, 12, 15, 25, 29, 30, 33], "remaining_depend": [8, 33], "less": 8, "correct": [8, 19, 22, 25, 28, 29, 30, 33], "preprocess": 8, "redund": 8, "remaining_listen": [8, 33], "event": 8, "now": [8, 19, 20, 28, 32, 33], "_valu": [8, 15, 33], "_empti": [8, 15, 25, 33], "never": [8, 15, 19, 24, 25, 31, 33], "viz_graph": 8, "agraph": 8, "backend_nam": 8, "edg": 8, "inher": 8, "differenti": 8, "magic": 8, "__torch_function__": [8, 25, 33], "proxy_wrapp": 8, "problemat": 8, "sometim": 8, "applymoduleprotocol": 8, "__call__": [8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "wont": 8, "trigger": 8, "set_modul": 8, "applymodul": 8, "get_modul": 8, "bridgeprotocol": 8, "connect": 8, "anoth": [8, 21, 26, 33], "bridgeexcept": 8, "get_bridg": 8, "set_bridg": 8, "has_bridg": 8, "peek_graph": 8, "statement": [8, 12, 18, 33], "get_condit": 8, "cond_node_nam": 8, "has_condit": 8, "peek_condit": 8, "pop_condit": 8, "push_condit": 8, "earlystopexcept": [8, 33], "stop_point_nod": 8, "gradprotocol": 8, "backward": [8, 17, 19, 29, 30, 33], "register_hook": [8, 17], "backward_idx": 8, "localbackendexecuteprotocol": 8, "localmixin": [8, 33], "lockprotocol": 8, "who": [8, 11], "won": [8, 33], "might": [8, 33], "power": [8, 32, 33], "swapprotocol": [8, 33], "swap": [8, 17, 26, 30, 33], "get_swap": [8, 33], "new_valu": 8, "valueprotocol": 8, "facilit": 8, "matter": [8, 19, 33], "id_to_graph": 8, "graph_stack": 8, "bridged_nod": 8, "defaultdict": 8, "entiti": 8, "ti": [8, 15, 33], "add_bridge_proxi": 8, "bridge_proxi": 8, "correspond": [8, 32, 33], "get_bridge_proxi": 8, "get_graph": 8, "hierarch": 8, "pop_graph": 8, "throughout": [9, 25], "element": [9, 14, 33], "everi": [9, 26, 29, 31, 32, 33], "overridden": 9, "subclass": [9, 33], "although": 9, "recip": 9, "instanc": [9, 20, 30, 33], "afterward": 9, "former": [9, 33], "latter": [9, 33], "silent": 9, "ignor": [9, 33, 36], "cl": [9, 33], "member": 9, "fetch_attr": 9, "hierarchi": [9, 33], "fetch": 9, "__class__": 9, "debug": [10, 25, 33], "persist": [10, 20, 33], "lora": 10, "train": [10, 15, 19, 30], "interpret": [11, 33, 34], "\u025bn": [11, 34], "sa\u026at": [11, 34], "manipul": [11, 34], "doc": [11, 33], "tutori": [11, 29, 30, 33, 34], "capabl": [11, 33], "net": [11, 33], "39": [11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33], "walkthrough": [11, 29, 34, 36], "invent": 11, "hidden_state_output": 11, "hidden_state_input": 11, "develop": [11, 33], "measur": 11, "argmax": [11, 20, 21, 26, 30, 33], "met": [12, 33], "rand_int": [12, 33], "randint": [12, 33], "low": [12, 33], "high": [12, 30, 31, 33], "random": [12, 30, 33], "even": [12, 15, 17, 21, 33], "odd": [12, 33], "opt": [12, 14, 18, 19, 20, 25, 26, 33], "homebrew": [12, 14, 18, 19, 20, 25, 26, 33], "anaconda3": [12, 14, 18, 19, 20, 25, 26, 33], "env": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 33], "nnsight_loc": [12, 14, 18, 19, 20, 25, 26, 33], "lib": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 32, 33], "python3": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 32, 33], "site": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 33], "tqdm": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 30, 31], "py": [12, 13, 14, 15, 17, 18, 19, 20, 25, 26, 27, 31, 32, 33], "21": [12, 13, 14, 17, 18, 19, 20, 24, 25, 26, 27, 29, 31, 33], "tqdmwarn": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "iprogress": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "found": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 33], "pleas": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34], "jupyt": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "ipywidget": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "http": [12, 13, 14, 17, 18, 19, 20, 24, 25, 26, 27, 31, 32, 33], "readthedoc": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "io": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "en": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "stabl": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "user_instal": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "html": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "autonotebook": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "notebook_tqdm": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "tokenization_utils_bas": [12, 14, 18, 19, 20, 25, 33], "1601": [12, 14, 18, 19, 20, 25, 33], "futurewarn": [12, 13, 14, 18, 19, 20, 25, 33], "clean_up_tokenization_spac": [12, 14, 18, 19, 20, 25, 33], "behavior": [12, 14, 18, 19, 20, 25, 30, 33], "deprec": [12, 13, 14, 18, 19, 20, 25, 33], "v4": [12, 14, 18, 19, 20, 25, 33], "45": [12, 14, 15, 18, 19, 20, 25, 32, 33], "detail": [12, 14, 18, 19, 20, 25, 29, 33], "issu": [12, 14, 18, 19, 20, 25, 33], "github": [12, 14, 18, 19, 20, 25, 33, 34], "com": [12, 14, 18, 19, 20, 25, 33], "31884": [12, 14, 18, 19, 20, 25, 33], "warn": [12, 13, 14, 18, 19, 20, 24, 25, 26, 30, 32, 33], "gpt2tokenizerfast": [12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 32, 33], "note": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33], "fast": [12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "faster": [12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "encod": [12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "follow": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "abov": [12, 20, 25, 26, 29, 33], "mutual": [12, 33], "exclus": [12, 33], "nest": [12, 18, 33], "non_rand_int": [12, 33], "madison": 13, "squar": 13, "garden": 13, "rockinglikebalboa": 13, "huggingface_hub": [13, 32], "file_download": 13, "1132": 13, "resume_download": 13, "download": [13, 24, 26, 33], "alwai": [13, 19, 20, 33], "resum": 13, "forc": 13, "force_download": 13, "max_new_token": [13, 22, 33], "_": [13, 18, 19, 28, 32, 33], "batch_decod": [13, 19, 33], "pad_token_id": [13, 19, 22, 33], "eos_token_id": [13, 19, 22, 33], "50256": [13, 19, 22, 33], "end": [13, 19, 22, 28, 33], "york": 13, "everyth": [14, 33], "part": [14, 31, 33], "box": [14, 33], "support": [14, 18, 33, 34], "einop": [14, 29, 33], "don": [14, 25, 26, 28, 29, 33], "anyth": [14, 25, 33], "special": [14, 33], "sum": [14, 17, 23, 29, 30, 31, 33], "tensor_sum": [14, 33], "flat": [14, 33], "flatten": [14, 30, 33], "coma": [14, 33], "custom_sum": [14, 33], "npytorch": 14, "191": 14, "2442": 14, "mp": [14, 25, 33], "grad_fn": [14, 16, 17, 21, 23, 25, 27], "lt": [14, 16, 17, 21, 23, 24, 25, 26, 27, 30, 33], "sumbackward0": [14, 23], "gt": [14, 15, 16, 17, 21, 23, 25, 27, 30, 33], "wide": [14, 33], "intermedi": [15, 18, 26, 30, 32, 33], "halt": [15, 33], "reduc": [15, 29, 33], "runtim": [15, 17, 33], "conserv": [15, 33], "resourc": [15, 33], "One": [15, 29, 30, 33], "particularli": [15, 33], "sae": [15, 33], "l1_out": [15, 33], "l1": [15, 33], "necessarili": [15, 33], "associ": [15, 32, 33], "As": [15, 25, 33], "termin": [15, 26, 33], "link": [15, 33], "beyond": [15, 33], "point": [15, 21, 33], "skip": [15, 29, 33], "earlier": [15, 26, 33], "cannot": [15, 33], "l2_out": [15, 33], "l2": [15, 33], "traceback": [15, 25, 33], "cell": [15, 25, 32, 33], "34": [15, 21, 25, 33], "src": [15, 25, 33], "56": [15, 33], "__str__": [15, 33], "52": [15, 17, 30, 33], "54": [15, 30, 33], "58": [15, 33], "f": [15, 28, 29, 30, 33], "__name__": [15, 25, 33], "50": [15, 30, 33], "42": [15, 30, 33], "43": [15, 30, 33], "44": [15, 33], "46": [15, 33], "47": [15, 30, 33], "48": [15, 33], "182": [15, 33], "172": [15, 33], "173": [15, 33], "174": [15, 33], "178": [15, 33], "179": [15, 33], "181": [15, 33], "befor": [15, 17, 22, 24, 25, 26, 28, 31, 33], "184": [15, 24, 33], "desir": 16, "0505": [16, 23, 27], "1728": [16, 23, 27], "1690": [16, 23, 27], "0096": [16, 23, 27], "1280": [16, 23, 27], "0687": [16, 23, 27], "7494": [16, 23, 27], "9057": [16, 23, 27], "3024": [16, 23, 27], "0418": [16, 23, 27], "2964": [16, 23, 27], "8677": [16, 23, 27], "2960": [16, 23, 27], "6686": [16, 23, 27], "6642": [16, 23, 27], "2391": [16, 23, 27], "6064": [16, 23, 27], "2263": [16, 23, 27], "1537": [16, 23, 27], "8917": [16, 23, 27], "8651": [16, 23, 27], "0588": [16, 23, 27], "9866": [16, 23, 27], "9188": [16, 23, 27], "4460": [16, 23, 27], "4285": [16, 23, 27], "9": [16, 19, 23, 24, 25, 27, 30, 33], "3065": [16, 23, 27], "0528": [16, 23, 27], "7946": [16, 23, 27], "5556": [16, 23, 27], "6286": [16, 23, 27], "7258": [16, 23, 27], "7969": [16, 23, 24, 27, 33], "6714": [16, 23, 27], "0683": [16, 23, 27], "0481": [16, 23, 27], "addbackward0": [16, 17, 23], "coupl": [17, 33], "requires_grad": [17, 19, 33], "share": [17, 27, 31, 33], "conda": [17, 27, 31], "interp": [17, 27, 31], "hello": [17, 19, 33], "world": [17, 31], "5216": 17, "1755": 17, "4617": 17, "1919": 17, "0204": 17, "0075": 17, "9841": 17, "2175": 17, "5851": 17, "5212": 17, "2286": 17, "7334": 17, "retain_grad": 17, "hidden_states_grad": 17, "28": [17, 33], "7976": 17, "282": 17, "5981": 17, "868": 17, "7354": 17, "120": 17, "1743": 17, "2264": 17, "168": 17, "6449": 17, "79": [17, 26, 33], "4181": 17, "253": 17, "6225": 17, "1322": [17, 19], "1293": 17, "208": 17, "3980": 17, "19": [17, 29, 33], "5545": 17, "509": 17, "9857": 17, "better": [17, 33], "demonstr": [17, 20, 24, 25, 29, 33], "ablat": [17, 33], "zero": [17, 19, 32, 33], "hidden_states_grad_befor": 17, "hidden_states_grad_aft": 17, "scalabl": [18, 29, 33], "sequenc": [18, 33], "close": [18, 33], "mimic": [18, 33], "convent": [18, 33], "syntax": [18, 33], "li": [18, 33], "append": [18, 28, 29, 30, 31, 32, 33], "num": [18, 33], "rang": [18, 28, 29, 30, 32, 33], "li2": [18, 33], "item_2": [18, 33], "nlist": [18, 33], "pari": [19, 20, 21, 26, 33], "r": [19, 33], "init": [19, 33], "randn": [19, 27, 33], "wb": [19, 33], "much": [19, 29, 33], "alter": [19, 20, 33], "a_x": [19, 33], "matmul": [19, 33], "ba_x": [19, 33], "variabl": [19, 24, 26, 30, 33], "answer": [19, 28, 29, 33], "answer_token": [19, 33], "lora_dim": [19, 33], "fulli": [19, 33], "achiev": [19, 33], "dataload": [19, 30, 33], "isn": [19, 33], "transmit": [19, 33], "dataset": [19, 30, 32, 33], "100": [19, 24, 25, 26, 30, 33], "pair": [19, 30, 33], "blank": [19, 33], "adamw": [19, 33], "lr": [19, 30, 33], "correct_token": [19, 33], "entropi": [19, 33], "loss": [19, 30, 33], "cross_entropi": [19, 33], "arent": [19, 33], "zero_grad": [19, 30, 33], "weight": [19, 30, 31, 33], "inde": [19, 33], "5262": 19, "6452": 19, "8448": 19, "7407": 19, "4497": 19, "7200": 19, "0452": 19, "0630": 19, "7231": 19, "0991": 19, "3883": 19, "1719": 19, "0024": 19, "1490": 19, "5580": 19, "9070": 19, "1946": 19, "8469": 19, "8173": 19, "8333": 19, "1722": 19, "8518": 19, "5542": 19, "3361": 19, "6813": 19, "4550": 19, "9903": 19, "5476": 19, "3310": 19, "5932": 19, "9087": 19, "0441": 19, "7201": 19, "0849": 19, "3954": 19, "1480": 19, "1580": 19, "9589": 19, "3856": 19, "0354": 19, "3153": 19, "6950": 19, "8893": 19, "9347": 19, "4812": 19, "4821": 19, "1935": 19, "6101": 19, "2552": [19, 21], "3574": 19, "9555": 19, "4472": 19, "2370": 19, "4913": 19, "7973": 19, "8731": 19, "2148": 19, "8610": 19, "5298": 19, "0569": 19, "7628": 19, "8462": 19, "2901": 19, "9117": 19, "6102": 19, "5902": 19, "0834": 19, "0093": 19, "4495": 19, "3539": 19, "0740": 19, "3545": 19, "7871": 19, "8562": 19, "4963": 19, "9433": 19, "7392": 19, "9859": 19, "2827": 19, "3862": 19, "7453": 19, "4021": 19, "0508": 19, "5621": 19, "2794": 19, "3303": 19, "7909": 19, "4538": 19, "1313": 19, "0819": 19, "6503": 19, "5484": 19, "9757": 19, "8230": 19, "5514": 19, "9135": 19, "0300": 19, "0671": 19, "7480": 19, "1516": 19, "9534": 19, "1927": 19, "4806": 19, "6110": 19, "9870": 19, "6541": 19, "2833": 19, "7793": 19, "5076": 19, "5269": 19, "0037": 19, "7067": 19, "3638": 19, "2859": 19, "9272": 19, "7984": 19, "2132": 19, "0050": [19, 33], "7416": 19, "1828": 19, "0524": 19, "0584": 19, "7789": 19, "1404": 19, "9479": 19, "1800": 19, "4593": 19, "6158": 19, "0084": 19, "6854": 19, "2958": 19, "7769": 19, "5156": [19, 24, 33], "5044": 19, "9969": 19, "7388": 19, "3761": 19, "2705": 19, "9826": 19, "8277": 19, "2302": 19, "9683": 19, "7128": 19, "2308": 19, "8993": 19, "8751": 19, "6339": 19, "9546": 19, "7678": 19, "9929": 19, "2638": 19, "4456": 19, "8543": 19, "5411": 19, "1332": 19, "5998": 19, "3486": 19, "3077": 19, "8154": 19, "5951": 19, "2131": 19, "0807": 19, "8615": 19, "6812": 19, "0719": 19, "7578": 19, "5100": 19, "6025": 19, "5490": 19, "3451": 19, "6261": 19, "4447": 19, "6631": 19, "9259": 19, "5568": 19, "2529": 19, "8272": 19, "2799": 19, "0383": 19, "9686": 19, "4911": 19, "3074": 19, "9068": 19, "7484": 19, "5957": 19, "3908": 19, "7700": 19, "4054": 19, "1650": 19, "8296": 19, "1858": 19, "1039": 19, "9361": 19, "1787": 19, "0026": 19, "2144": 19, "4693": 19, "6995": 19, "1395": [19, 21], "8447": 19, "4018": 19, "8409": 19, "6084": 19, "5108": 19, "0477": 19, "8995": [19, 27], "4809": 19, "2972": 19, "2091": 19, "9804": 19, "3483": 19, "7015": 19, "4362": 19, "6675": 19, "5581": 19, "4253": 19, "6306": 19, "4597": 19, "6652": 19, "9124": 19, "1657": 19, "6208": 19, "3349": 19, "8752": 19, "3011": 19, "0775": 19, "9528": 19, "5035": 19, "3898": 19, "9537": 19, "7455": 19, "4682": 19, "8253": 19, "3640": 19, "1378": [19, 27], "9405": 19, "de": [19, 33], "With": [19, 24, 33], "produc": [19, 30, 33], "temporari": [20, 33], "variant": [20, 33], "across": [20, 22, 33], "compar": [20, 26, 28, 33], "explor": [20, 32, 33], "hs11": [20, 33], "model_edit": 20, "unmodifi": [20, 33], "vatican": [20, 33], "original_token": [20, 33], "modified_token": [20, 33], "norigin": [20, 25, 33], "decod": [20, 21, 22, 26, 28, 30, 31, 32, 33, 36], "rome": [20, 33], "safe": [20, 33], "experiment": [20, 33], "cautious": [20, 33], "consequ": [20, 33], "ve": [20, 33], "revert": [20, 33], "chain": 21, "vocabularli": 21, "space": [21, 28, 30], "softmax": [21, 32], "vocabulari": 21, "36": [21, 33], "2875": 21, "35": [21, 33], "0115": 21, "38": [21, 30, 33], "0794": 21, "40": [21, 33], "5164": 21, "41": [21, 33], "3760": 21, "9194": 21, "68": 21, "8886": 21, "1562": [21, 24, 33], "71": 21, "8408": 21, "80": [21, 30, 33], "4194": 21, "78": 21, "1206": 21, "82": 21, "2950": 21, "81": 21, "6519": 21, "83": [21, 30], "9940": 21, "94": [21, 25, 33], "4878": 21, "5194": 21, "85": 21, "6997": 21, "113": [21, 25, 33], "8675": 21, "111": [21, 25, 33], "8628": 21, "6634": 21, "116": 21, "7652": 21, "114": [21, 26], "8267": 21, "112": 21, "3621": 21, "8531": 21, "3007": 21, "91": [21, 25, 33], "8193": 21, "92": [21, 25, 30, 33], "9943": 21, "89": [21, 25, 33], "8382": 21, "6898": 21, "103": [21, 25, 33], "9307": 21, "102": [21, 33], "5054": 21, "105": 21, "1563": 21, "109": [21, 25, 33], "3099": 21, "110": [21, 25, 33], "4196": 21, "unsafeviewbackward0": 21, "198": [21, 33], "417": [21, 22, 33], "8765": [21, 22, 33], "318": [21, 22, 33], "257": [21, 33], "262": [21, 22, 33], "3504": [21, 33], "7372": [21, 33], "6342": [21, 22, 33], "el": 21, "middl": 21, "centr": 21, "three": 22, "hidden_states1": 22, "hidden_states2": 22, "hidden_states3": 22, "architectur": [22, 36], "right": [22, 33], "detect": 22, "padding_sid": 22, "464": [22, 33], "412": [22, 33], "733": [22, 33], "287": [22, 33], "1748": [22, 33], "286": [22, 33], "290": [22, 33], "themselv": [23, 33], "whatev": 23, "variou": [23, 32, 33], "hidden_states_pr": [23, 27], "hs_sum": 23, "hs_edit": 23, "501": 23, "2959": 23, "3464": 23, "1231": 23, "1269": 23, "500": 23, "2863": 23, "4239": 23, "2272": 23, "510": 23, "0453": 23, "504": 23, "2016": 23, "506": 23, "5983": 23, "493": 23, "2541": 23, "502": 23, "5923": 23, "498": 23, "4282": 23, "5919": 23, "505": 23, "9645": 23, "497": 23, "6317": 23, "5350": 23, "6895": 23, "5222": 23, "503": 23, "4496": 23, "508": 23, "1876": 23, "1610": 23, "3547": 23, "499": 23, "3093": 23, "507": 23, "2147": 23, "8499": 23, "7244": 23, "491": 23, "9894": 23, "3487": 23, "5013": 23, "8515": 23, "9245": 23, "0217": 23, "0928": 23, "9673": 23, "3641": 23, "3440": 23, "login": [24, 33], "sign": [24, 33], "set_default_api_kei": [24, 26, 33], "your_api_kei": [24, 26, 33], "instal": [24, 32, 33], "larger": [24, 33], "o": [24, 26, 33], "llama3": [24, 33], "gate": [24, 33], "environ": [24, 26, 33], "hf_token": [24, 26, 32, 33], "your_hugging_face_token": [24, 26, 33], "ll": [24, 32, 33], "2024": [24, 26, 33], "08": [24, 26, 33], "30": [24, 26, 33], "07": [24, 33], "150": [24, 33], "mainprocess": [24, 26, 33], "nnsight_remot": [24, 26, 33], "info": [24, 26, 33], "36ff46f0": [24, 33], "d81a": [24, 33], "4586": [24, 33], "b7e7": [24, 33], "eaf6f97d6c0b": [24, 33], "job": [24, 26, 33], "wait": [24, 26, 33], "approv": [24, 26, 33], "206": [24, 33], "398": [24, 33], "00": [24, 25, 26, 30, 33], "48m": [24, 33], "b": [24, 30, 33], "got": [24, 26, 33], "fork": [24, 26, 33], "parallel": [24, 26, 30, 33], "disabl": [24, 26, 33], "avoid": [24, 26, 33], "deadlock": [24, 26, 33], "explicitli": [24, 26, 33], "tokenizers_parallel": [24, 26, 33], "02": [24, 25, 33], "21mb": [24, 33], "4688": [24, 33], "9062": [24, 33], "2344": [24, 33], "6875": [24, 33], "9609": [24, 33], "2578": [24, 33], "5469": [24, 33], "6172": [24, 33], "4531": [24, 33], "1406": [24, 33], "1250": [24, 33], "7812": [24, 33], "8906": [24, 33], "1875": [24, 33], "1680": [24, 33], "5625": [24, 33], "9453": [24, 33], "3711": [24, 33], "3516": [24, 33], "3828": [24, 33], "9297": [24, 33], "3672": [24, 33], "2617": [24, 33], "4414": [24, 33], "6758": [24, 33], "6094": [24, 33], "0938": [24, 33], "7031": [24, 33], "8672": [24, 33], "1328": [24, 33], "5000": [24, 30, 33], "bfloat16": [24, 30, 33], "dynamiccach": [24, 33], "3750": [24, 33], "6250": [24, 33], "13": [24, 25, 29, 30, 33], "0000": [24, 29, 33], "8594": [24, 33], "9375": [24, 33], "5938": [24, 33], "5781": [24, 33], "0796": [24, 33], "8750": [24, 33], "4062": [24, 33], "9844": [24, 33], "2500": [24, 33], "7188": [24, 33], "realli": [24, 33], "techniqu": [24, 29, 33, 34], "avail": [24, 33], "encount": 25, "situat": 25, "messag": 25, "suggest": 25, "compat": 25, "tool": [25, 26, 32, 33], "number_of_token": 25, "modified_output": 25, "indexerror": [25, 33], "exc_typ": [25, 33], "exc_val": [25, 33], "exc_tb": [25, 33], "98": [25, 33], "_reset": [25, 33], "216": [25, 33], "214": [25, 33], "215": [25, 33], "218": [25, 33], "14": [25, 29, 30, 33], "16": [25, 29, 30, 31, 33], "18": [25, 29, 33], "__setitem__": [25, 33], "88": [25, 30, 32, 33], "90": [25, 33], "setitem": [25, 33], "270": [25, 33], "267": [25, 33], "269": [25, 33], "271": [25, 33], "272": [25, 28, 33], "273": [25, 33], "274": [25, 33], "275": [25, 33], "276": [25, 33], "106": [25, 33], "107": [25, 33], "108": [25, 33], "96": [25, 33], "93": [25, 30, 33], "theres": [25, 33], "131": [25, 33], "128": [25, 33], "did": [25, 33], "129": [25, 33], "133": [25, 33], "134": [25, 33], "135": [25, 33], "136": [25, 33], "isinst": [25, 30, 33], "137": [25, 33], "138": [25, 33], "20": [25, 29, 31, 33], "15": [25, 26, 29, 30, 33], "allow_non_fake_input": [25, 33], "shape_env": [25, 33], "shapeenv": [25, 33], "assume_static_by_default": [25, 33], "17": [25, 29, 33], "fake_mod": [25, 33], "fakecopymod": [25, 33], "exit_global_tracing_context": [25, 33], "22": [25, 33], "24": [25, 33], "25": [25, 30, 33], "26": [25, 33], "27": [25, 33], "330": [25, 33], "326": [25, 33], "328": [25, 33], "baseexcept": [25, 33], "312": [25, 33], "func": [25, 33], "305": [25, 33], "_variablefunctionsclass": [25, 33], "__qualname__": [25, 33], "306": [25, 33], "307": [25, 33], "308": [25, 33], "309": [25, 33], "310": [25, 33], "bound": [25, 30, 33], "ah": [25, 33], "cours": [25, 33], "abl": [25, 32, 33], "though": [25, 33], "under": [25, 33], "record": [25, 33], "doesn": [25, 33], "incur": [25, 33], "cost": [25, 30, 33], "throught": [25, 33], "least": [25, 33], "word": [25, 28, 32, 33], "caution": [25, 33], "relat": [25, 33], "effici": [25, 26, 29, 33], "off": [25, 31, 33], "best": [25, 33], "unsur": [25, 33], "again": [25, 33], "6286e": 25, "7258e": 25, "7969e": 25, "8255e": 25, "0698e": 25, "4242e": 25, "2749e": 25, "0404e": 25, "2988e": 25, "7030e": 25, "9210e": 25, "01": [25, 30], "5507e": 25, "4831e": 25, "4496e": 25, "2496e": 25, "4764e": 25, "5587e": 25, "8417e": 25, "7383e": 25, "9535e": 25, "1625e": 25, "4659e": 25, "9305e": 25, "2014e": 25, "6166e": 25, "3293e": 25, "1797e": 25, "6870e": 25, "9511e": 25, "3648e": 25, "5362e": 25, "2539e": 25, "4988e": 25, "2232e": 25, "4482e": 25, "8883e": 25, "5206e": 25, "3218e": 25, "5060e": 25, "2041e": 25, "8520e": 25, "3440e": 25, "0114e": 25, "7492e": 25, "4499e": 25, "5314e": 25, "0311e": 25, "3609e": 25, "4801e": 25, "6725e": 25, "0538e": 25, "5054e": 25, "9737e": 25, "5169e": 25, "9845e": 25, "4548e": 25, "7004e": 25, "8162e": 25, "5651e": 25, "8362e": 25, "5023e": 25, "9528e": 25, "4438e": 25, "7818e": 25, "0992e": 25, "8575e": 25, "1478e": 25, "6564e": 25, "2905e": 25, "3264e": 25, "9211e": 25, "6120e": 25, "6601e": 25, "5331e": 25, "2056e": 25, "6827e": 25, "7709e": 25, "1225e": 25, "9829e": 25, "9273e": 25, "6971e": 25, "6272e": 25, "2709e": 25, "0965e": 25, "4081e": 25, "4534e": 25, "4642e": 25, "0931e": 25, "8111e": 25, "1471e": 25, "9692e": 25, "1457e": 25, "1235e": 25, "2517e": 25, "2227e": 25, "2003e": 25, "1090e": 25, "8102e": 25, "4567e": 25, "7879e": 25, "2834e": 25, "7080e": 25, "6301e": 25, "9053e": 25, "9357e": 25, "7841e": 25, "0679e": 25, "0271e": 25, "0579e": 25, "7195e": 25, "1443e": 25, "7420e": 25, "3746e": 25, "5129e": 25, "9945e": 25, "1595e": 25, "5102e": 25, "2280e": 25, "4264e": 25, "5586e": 25, "8480e": 25, "8030e": 25, "3625e": 25, "1234e": 25, "5630e": 25, "4384e": 25, "0834e": 25, "3671e": 25, "9106e": 25, "9593e": 25, "0443e": 25, "2028e": 25, "1285e": 25, "6665e": 25, "1522e": 25, "0780e": 25, "5473e": 25, "9861e": 25, "5902e": 25, "2159e": 25, "0041e": 25, "03": 25, "4291e": 25, "5786e": 25, "3004e": 25, "3246e": 25, "4886e": 25, "1515e": 25, "5345e": 25, "1293e": 25, "2794e": 25, "1508e": 25, "1936e": 25, "7968e": 25, "2526e": 25, "0222e": 25, "4691e": 25, "1648e": 25, "6389e": 25, "7188e": 25, "1339e": 25, "8595e": 25, "7614e": 25, "3966e": 25, "0889e": 25, "5380e": 25, "0410e": 25, "5772e": 25, "4345e": 25, "2805e": 25, "1078e": 25, "2193e": 25, "4413e": 25, "2237e": 25, "5395e": 25, "3000e": 25, "7484e": 25, "1002e": 25, "5656e": 25, "1450e": 25, "1324e": 25, "2751e": 25, "7061e": 25, "3499e": 25, "0883e": 25, "2036e": 25, "4077e": 25, "0958e": 25, "4460e": 25, "6134e": 25, "8703e": 25, "2674e": 25, "2317e": 25, "0362e": 25, "1834e": 25, "3516e": 25, "0807e": 25, "0336e": 25, "0479e": 25, "9521e": 25, "9104e": 25, "0803e": 25, "2048e": 25, "7705e": 25, "8135e": 25, "4048e": 25, "3258e": 25, "1608e": 25, "2787e": 25, "8557e": 25, "1077e": 25, "0518e": 25, "6806e": 25, "2934e": 25, "4432e": 25, "5619e": 25, "1031e": 25, "2877e": 25, "0819e": 25, "9329e": 25, "8585e": 25, "9784e": 25, "1124e": 25, "2287e": 25, "7348e": 25, "0236e": 25, "4054e": 25, "5393e": 25, "5170e": 25, "5092e": 25, "3856e": 25, "0673e": 25, "6784e": 25, "3701e": 25, "4999e": 25, "3039e": 25, "5358e": 25, "9126e": 25, "1336e": 25, "2421e": 25, "4454e": 25, "0309e": 25, "3034e": 25, "0879e": 25, "4193e": 25, "5885e": 25, "5374e": 25, "4802e": 25, "9640e": 25, "6382e": 25, "5199e": 25, "1697e": 25, "1011e": 25, "9947e": 25, "5317e": 25, "3526e": 25, "4459e": 25, "6096e": 25, "6977e": 25, "5488e": 25, "9472e": 25, "5825e": 25, "1431e": 25, "7997e": 25, "4164e": 25, "7173e": 25, "5707e": 25, "2898e": 25, "0544e": 25, "1279e": 25, "0761e": 25, "0572e": 25, "4155e": 25, "1557e": 25, "0821e": 25, "4200e": 25, "1833e": 25, "3272e": 25, "4302e": 25, "4085e": 25, "8076e": 25, "1994e": 25, "6751e": 25, "7346e": 25, "0669e": 25, "9313e": 25, "0663e": 25, "6838e": 25, "5756e": 25, "8478e": 25, "4335e": 25, "1085e": 25, "5366e": 25, "3190e": 25, "4223e": 25, "6886e": 25, "7125e": 25, "6715e": 25, "9403e": 25, "6051e": 25, "9405e": 25, "9342e": 25, "0049e": 25, "0645e": 25, "4900e": 25, "7649e": 25, "0025e": 25, "6692e": 25, "1792e": 25, "7743e": 25, "0210e": 25, "8536e": 25, "3734e": 25, "2150e": 25, "1420e": 25, "3237e": 25, "1060e": 25, "8375e": 25, "4864e": 25, "0235e": 25, "7014e": 25, "0699e": 25, "2431e": 25, "2326e": 25, "2734e": 25, "1882e": 25, "0536e": 25, "6773e": 25, "9881e": 25, "4860e": 25, "0162e": 25, "5636e": 25, "0074e": 25, "6067e": 25, "3144e": 25, "1818e": 25, "4546e": 25, "0912e": 25, "1206e": 25, "3724e": 25, "7155e": 25, "4178e": 25, "2956e": 25, "6902e": 25, "5223e": 25, "4952e": 25, "7531e": 25, "1116e": 25, "8512e": 25, "7123e": 25, "6355e": 25, "8020e": 25, "8983e": 25, "3574e": 25, "3467e": 25, "8905e": 25, "3620e": 25, "8599e": 25, "2110e": 25, "5844e": 25, "4734e": 25, "9198e": 25, "9884e": 25, "7416e": 25, "6009e": 25, "6512e": 25, "0772e": 25, "8859e": 25, "4945e": 25, "9834e": 25, "2670e": 25, "6965e": 25, "0969e": 25, "9006e": 25, "9760e": 25, "3006e": 25, "3767e": 25, "9463e": 25, "3662e": 25, "5842e": 25, "1415e": 25, "5953e": 25, "7413e": 25, "7179e": 25, "1987e": 25, "8265e": 25, "9532e": 25, "1599e": 25, "9978e": 25, "8641e": 25, "0306e": 25, "1554e": 25, "0086e": 25, "8663e": 25, "8928e": 25, "1998e": 25, "5062e": 25, "2103e": 25, "7206e": 25, "5376e": 25, "5671e": 25, "2228e": 25, "6561e": 25, "8118e": 25, "8825e": 25, "8699e": 25, "3017e": 25, "3756e": 25, "2634e": 25, "6821e": 25, "7862e": 25, "6553e": 25, "7938e": 25, "6224e": 25, "7574e": 25, "0822e": 25, "9101e": 25, "3470e": 25, "4396e": 25, "8533e": 25, "3989e": 25, "3025e": 25, "0689e": 25, "5526e": 25, "0326e": 25, "0746e": 25, "0950e": 25, "1649e": 25, "4935e": 25, "1394e": 25, "0906e": 25, "1690e": 25, "2226e": 25, "2760e": 25, "4431e": 25, "0973e": 25, "3528e": 25, "9426e": 25, "5969e": 25, "5405e": 25, "7662e": 25, "4922e": 25, "4357e": 25, "8989e": 25, "2059e": 25, "9071e": 25, "3410e": 25, "0605e": 25, "5846e": 25, "7736e": 25, "0953e": 25, "5078e": 25, "7121e": 25, "4718e": 25, "8174e": 25, "7044e": 25, "0058e": 25, "1485e": 25, "8376e": 25, "5943e": 25, "8444e": 25, "8978e": 25, "0776e": 25, "0642e": 25, "3514e": 25, "2874e": 25, "2097e": 25, "6646e": 25, "6328e": 25, "2562e": 25, "4275e": 25, "6121e": 25, "4209e": 25, "1070e": 25, "9542e": 25, "7836e": 25, "0035e": 25, "0094e": 25, "7393e": 25, "4366e": 25, "8556e": 25, "2903e": 25, "5690e": 25, "6298e": 25, "2884e": 25, "0525e": 25, "3517e": 25, "1991e": 25, "9318e": 25, "2929e": 25, "2494e": 25, "4547e": 25, "6449e": 25, "0015e": 25, "5933e": 25, "1539e": 25, "7483e": 25, "9571e": 25, "6167e": 25, "1041e": 25, "1621e": 25, "2981e": 25, "2509e": 25, "9099e": 25, "9714e": 25, "3853e": 25, "2267e": 25, "2992e": 25, "8448e": 25, "9776e": 25, "0985e": 25, "9363e": 25, "0710e": 25, "9856e": 25, "9332e": 25, "8208e": 25, "6373e": 25, "4278e": 25, "3095e": 25, "1847e": 25, "4024e": 25, "2026e": 25, "0059e": 25, "7174e": 25, "0502e": 25, "2487e": 25, "4279e": 25, "2406e": 25, "9508e": 25, "2061e": 25, "5007e": 25, "5605e": 25, "6327e": 25, "6576e": 25, "1315e": 25, "5557e": 25, "7006e": 25, "6053e": 25, "9167e": 25, "5669e": 25, "4749e": 25, "2183e": 25, "4309e": 25, "5208e": 25, "1254e": 25, "7077e": 25, "9774e": 25, "3449e": 25, "4506e": 25, "2922e": 25, "2381e": 25, "1032e": 25, "7615e": 25, "3168e": 25, "8688e": 25, "5302e": 25, "0305e": 25, "4317e": 25, "4285e": 25, "6842e": 25, "0345e": 25, "0907e": 25, "3043e": 25, "8652e": 25, "4368e": 25, "0064e": 25, "9621e": 25, "6881e": 25, "6544e": 25, "9820e": 25, "2363e": 25, "4828e": 25, "5182e": 25, "0165e": 25, "8026e": 25, "3627e": 25, "1291e": 25, "0510e": 25, "2262e": 25, "6994e": 25, "1767e": 25, "2933e": 25, "8151e": 25, "8563e": 25, "1988e": 25, "6882e": 25, "8934e": 25, "4241e": 25, "5913e": 25, "1459e": 25, "3060e": 25, "9042e": 25, "1736e": 25, "4661e": 25, "1147e": 25, "0368e": 25, "1779e": 25, "8113e": 25, "0269e": 25, "9996e": 25, "8506e": 25, "3495e": 25, "3824e": 25, "6062e": 25, "2471e": 25, "6041e": 25, "8814e": 25, "3164e": 25, "5559e": 25, "3661e": 25, "7891e": 25, "9709e": 25, "2465e": 25, "9410e": 25, "3974e": 25, "8152e": 25, "7801e": 25, "4493e": 25, "0901e": 25, "9918e": 25, "8610e": 25, "2574e": 25, "8129e": 25, "2315e": 25, "0814e": 25, "8385e": 25, "2490e": 25, "4800e": 25, "8052e": 25, "3061e": 25, "8434e": 25, "5931e": 25, "2917e": 25, "9720e": 25, "3967e": 25, "4260e": 25, "1623e": 25, "1470e": 25, "2324e": 25, "5378e": 25, "0738e": 25, "3570e": 25, "2882e": 25, "0768e": 25, "7377e": 25, "5838e": 25, "1146e": 25, "9866e": 25, "3019e": 25, "8275e": 25, "4068e": 25, "7844e": 25, "6919e": 25, "9575e": 25, "8200e": 25, "8251e": 25, "5988e": 25, "7482e": 25, "0484e": 25, "6259e": 25, "5771e": 25, "8153e": 25, "3178e": 25, "6060e": 25, "5188e": 25, "0826e": 25, "3834e": 25, "7229e": 25, "6664e": 25, "6413e": 25, "0723e": 25, "3191e": 25, "4131e": 25, "6075e": 25, "2504e": 25, "3741e": 25, "7716e": 25, "4227e": 25, "3925e": 25, "5700e": 25, "7153e": 25, "3690e": 25, "1079e": 25, "3346e": 25, "9114e": 25, "0677e": 25, "0595e": 25, "8981e": 25, "1321e": 25, "9002e": 25, "9221e": 25, "1126e": 25, "5232e": 25, "5203e": 25, "8918e": 25, "8023e": 25, "7897e": 25, "6398e": 25, "3831e": 25, "3203e": 25, "7896e": 25, "1591e": 25, "2745e": 25, "0674e": 25, "1897e": 25, "5548e": 25, "0816e": 25, "4219e": 25, "2085e": 25, "0132e": 25, "1880e": 25, "2857e": 25, "3511e": 25, "3891e": 25, "3398e": 25, "5823e": 25, "1914e": 25, "7218e": 25, "5562e": 25, "9274e": 25, "1782e": 25, "9518e": 25, "3836e": 25, "5140e": 25, "8808e": 25, "9965e": 25, "6073e": 25, "4745e": 25, "4041e": 25, "8542e": 25, "0609e": 25, "0068e": 25, "6370e": 25, "4448e": 25, "0635e": 25, "6714e": 25, "0683e": 25, "0481e": 25, "selectbackward0": 25, "dispos": [25, 33], "nois": [25, 27, 33], "queue": [26, 33], "concurr": [26, 33], "offer": [26, 33], "benefit": [26, 29, 33], "back": [26, 33], "forth": [26, 33], "machin": [26, 33], "t1": [26, 33], "captur": [26, 33], "hs_79": [26, 33], "t1_tokens_out": [26, 33], "buckingham": [26, 33], "palac": [26, 33], "t2": [26, 33], "t2_tokens_out": [26, 33], "nt1": [26, 33], "49": [26, 30, 33], "072": 26, "1478bff8": 26, "622a": 26, "42cf": 26, "9ba0": 26, "78d3a0803a8b": 26, "097": 26, "423": 26, "69k": [26, 33], "20mb": 26, "strictli": [26, 33], "definit": [26, 33], "t3": [26, 33], "53": 26, "770": 26, "e794cd1a": 26, "3c4d": 26, "4300": 26, "ba68": 26, "6dcb6d8bda02": 26, "795": 26, "801": 26, "811": 26, "823": 26, "928": [26, 33], "66mb": 26, "mention": [26, 33], "vanilla": [26, 33], "instruct": [26, 30, 33], "entir": [26, 33], "often": [27, 33], "happen": [27, 28, 33], "flow": [27, 33], "assig": 27, "001": [27, 33], "hidden_states_post": 27, "clonebackward0": 27, "0244": 27, "1430": 27, "1384": 27, "0185": 27, "1173": 27, "0855": 27, "8112": 27, "3000": 27, "0057": 27, "3378": 27, "8778": 27, "2780": 27, "6427": 27, "6233": 27, "5877": 27, "2030": 27, "1590": 27, "9278": 27, "8584": 27, "0728": 27, "0145": 27, "9685": 27, "4962": 27, "4435": 27, "3371": 27, "1299": 27, "7784": 27, "5379": 27, "6941": 27, "7279": 27, "8105": 27, "6403": 27, "0599": 27, "0637": 27, "copyslic": 27, "indirect": [28, 29], "identif": 28, "task": [28, 29, 33, 36], "plotli": [28, 29], "express": [28, 29], "px": [28, 29], "corrupt": [28, 29], "clean_prompt": 28, "john": [28, 29], "mari": [28, 29], "went": [28, 29, 33], "gave": [28, 29], "bottl": 28, "milk": 28, "corrupted_prompt": 28, "That": [28, 33], "sure": [28, 33], "combin": [28, 29, 33], "correct_index": 28, "input_id": [28, 29, 30, 32], "incorrect_index": 28, "1757": 28, "5335": 28, "thank": 28, "whole": [28, 29, 33], "break": [28, 29], "n_layer": 28, "clean_token": [28, 29], "No": [28, 30], "clean_h": 28, "layer_idx": [28, 32], "clean_logit": [28, 29], "incorrect": 28, "clean_logit_diff": 28, "corrupted_logit": [28, 29], "corrupted_logit_diff": 28, "ioi_patching_result": 28, "_ioi_patching_result": 28, "token_idx": 28, "patched_logit": 28, "patched_logit_diff": 28, "improv": 28, "patched_result": 28, "3f": 28, "lambda": [28, 33], "token_label": 28, "fig": [28, 29], "imshow": [28, 29], "color_continuous_midpoint": [28, 29], "color_continuous_scal": [28, 29], "rdbu": [28, 29], "label": [28, 30, 32], "y": 28, "residu": [28, 29], "stream": [28, 29], "ioi": [28, 29], "124": 28, "adapt": 29, "neel": 29, "nanda": 29, "blog": [29, 32], "outperform": 29, "autom": 29, "colab": [29, 32, 33], "section": [29, 33], "scenario": [29, 33], "arena": 29, "sentenc": [29, 30], "shop": 29, "bag": 29, "tom": 29, "jame": 29, "park": 29, "ball": 29, "dan": 29, "sid": 29, "appl": 29, "martin": 29, "ami": 29, "drink": 29, "return_tensor": 29, "pt": [29, 31], "corrupted_token": 29, "answer_token_indic": 29, "j": 29, "get_logit_diff": 29, "correct_logit": 29, "gather": 29, "unsqueez": 29, "incorrect_logit": 29, "clean_baselin": 29, "diff": 29, "4f": 29, "corrupted_baselin": 29, "8138": 29, "metric": 29, "subject": 29, "eg": 29, "ioi_metr": 29, "baselin": 29, "approxim": [29, 36], "assumpt": 29, "corrupted_x": 29, "clean_x": 29, "corrupted_grad_x": 29, "cach": 29, "down": 29, "nice": [29, 33], "attent": 29, "head": [29, 32], "represent": [29, 30], "implicitli": 29, "per": 29, "snippet": [29, 33], "clean_out": 29, "corrupted_out": 29, "corrupted_grad": 29, "invoker_clean": 29, "attn_out": 29, "invoker_corrupt": 29, "corrupted_grad_act": 29, "clean_act": 29, "corrupted_act": 29, "rearrang": 29, "estim": 29, "rather": 29, "patching_result": 29, "zip": [29, 30], "residual_attr": 29, "64": 29, "numpi": [29, 32], "update_layout": 29, "xaxis_titl": 29, "yaxis_titl": 29, "simulatan": 29, "serv": [29, 33], "heurist": 29, "practic": [29, 33], "howev": [29, 33, 35], "decent": 29, "bad": 29, "big": [29, 33], "exclud": 29, "accur": 29, "pictur": 29, "po": 29, "adap": 30, "pyven": 30, "paper": 30, "zhengxuan": 30, "wu": 30, "et": 30, "al": 30, "trang": 30, "boundlessrotatedspaceintervent": 30, "sklearn": 30, "model_select": 30, "train_test_split": 30, "hf_dataset": 30, "get_linear_schedule_with_warmup": 30, "gc": 30, "tutorial_price_tagging_util": 30, "factual_sampl": 30, "bound_alignment_sampl": 30, "lower_bound_alignment_example_sampl": 30, "is_avail": 30, "sharpbai": 30, "alpaca": [30, 36], "7b": 30, "merg": 30, "torch_dtyp": 30, "free_unused_cuda_memori": 30, "empty_cach": 30, "runtimeerror": 30, "calculate_loss": 30, "subspace_proj": 30, "mask_weight": 30, "vocab_s": 30, "32001": 30, "shift_logit": 30, "contigu": 30, "shift_label": 30, "loss_fct": 30, "crossentropyloss": 30, "boundary_loss": 30, "intervention_boundari": 30, "compute_metr": 30, "eval_pr": 30, "eval_label": 30, "generate_output": 30, "total_count": 30, "correct_count": 30, "label_idx": 30, "ne": 30, "nonzero": 30, "squeez": 30, "actual_test_label": 30, "tolist": 30, "pred_test_label": 30, "uncom": 30, "return_dict": 30, "accuraci": 30, "round": 30, "publicli": 30, "templat": 30, "core": [30, 33], "english": 30, "sai": [30, 33], "ye": 30, "xx": 30, "dollar": 30, "amount": 30, "drawn": 30, "uniform": 30, "distribut": [30, 33], "99": 30, "hypothesi": 30, "solv": [30, 33], "boundari": 30, "higher": 30, "lower": 30, "incorpor": 30, "focu": 30, "align": 30, "raw_prealign": 30, "pricing_tag": 30, "prealign_dataset": 30, "from_dict": 30, "set_format": 30, "column": 30, "prealign_dataload": 30, "appear": 30, "describ": [30, 33], "further": 30, "n": [30, 32], "npleas": 30, "n9": 30, "76": 30, "no_grad": 30, "k": 30, "eval_metr": 30, "eval_dict": 30, "TO": 30, "BE": 30, "good": [30, 33], "625": 30, "08it": 30, "goal": 30, "sampl": 30, "counterfactu": 30, "rotat": [30, 32], "lastli": 30, "matrix": 30, "trainabl": 30, "raw_data": 30, "10000": 30, "raw_train": 30, "raw_temp": 30, "test_siz": 30, "random_st": 30, "raw_ev": 30, "raw_test": 30, "unpack": 30, "create_dataset": 30, "source_input_id": 30, "intervention_id": 30, "with_format": 30, "train_dataload": 30, "eval_dataload": 30, "test_dataload": 30, "embed_dim": 30, "hidden_s": 30, "gradient_accumulation_step": 30, "epoch": 30, "temperature_start": 30, "temperature_end": 30, "intervention_lay": 30, "t_total": 30, "warm_up_step": 30, "optimizer_param": 30, "rotate_lay": 30, "adam": 30, "schedul": 30, "num_warmup_step": 30, "num_training_step": 30, "target_total_step": 30, "temperature_schedul": 30, "linspac": 30, "total_step": 30, "set_temperatur": 30, "parametrizedrotatelay": 30, "parametr": 30, "moduledict": 30, "parametrizationlist": 30, "_orthogon": 30, "batch_subspace_swap": 30, "subspace_swap": 30, "all_ind": 30, "arang": [30, 32], "base_prompt": 30, "source_prompt": 30, "mixed_out": 30, "save_out": 30, "del": 30, "output_logit": 30, "train_iter": 30, "desc": 30, "log_dict": 30, "epoch_iter": 30, "counterfactual_output": 30, "loss_str": 30, "acc": 30, "set_postfix": 30, "1000": 30, "llamatokenizerfast": 30, "63": 30, "51": 30, "2905": 30, "125": 30, "09it": 30, "dictionary_learn": 31, "autoencod": [31, 36], "weights_path": 31, "pythia": 31, "70m": 31, "dedup": 31, "mlp_out_layer0": 31, "0_8192": 31, "ae_99000": 31, "activation_dim": 31, "512": 31, "dictionary_s": 31, "ae": 31, "load_state_dict": 31, "8192": [31, 33], "eleutherai": 31, "me": [31, 33], "ishmael": 31, "year": 31, "ago": 31, "mind": 31, "long": 31, "precis": [31, 33], "littl": [31, 33], "monei": 31, "my": 31, "purs": 31, "particular": [31, 33], "shore": 31, "thought": [31, 36], "sail": 31, "wateri": 31, "drive": 31, "spleen": 31, "regul": 31, "circul": 31, "whenev": 31, "myself": 31, "grow": 31, "grim": 31, "mouth": 31, "damp": 31, "drizzli": 31, "novemb": 31, "soul": 31, "involuntarili": 31, "paus": 31, "coffin": 31, "warehous": 31, "bring": [31, 33], "rear": 31, "funer": 31, "meet": 31, "especi": [31, 33], "hypo": 31, "upper": 31, "hand": 31, "strong": 31, "moral": 31, "principl": [31, 33], "deliber": 31, "street": 31, "knock": 31, "peopl": 31, "hat": 31, "account": [31, 35], "sea": 31, "soon": 31, "mlp_0": 31, "gpt_neox": 31, "gptneoxtokenizerfast": 31, "summed_activ": 31, "ab": 31, "sort": 31, "max": [31, 32], "top_activations_indic": 31, "topk": 31, "top": [31, 32], "compound": 31, "circuitsvi": 31, "colored_tokens_multi": 31, "str_token": 31, "grant": 32, "simplifi": 32, "glimps": 32, "evolv": 32, "stage": 32, "tradit": 32, "approach": 32, "focus": 32, "belief": 32, "spotlight": 32, "believ": [32, 33], "junctur": 32, "nostalgebraist": 32, "lesswrong": 32, "pip": [32, 33, 34], "matplotlib": 32, "pyplot": 32, "plt": 32, "seaborn": 32, "sn": 32, "np": 32, "ipython": [32, 33], "clear_output": [32, 33], "usr": 32, "dist": 32, "_token": 32, "userwarn": 32, "secret": 32, "authent": 32, "hub": 32, "tab": 32, "co": [32, 33], "googl": 32, "restart": 32, "reus": 32, "notebook": 32, "recommend": 32, "public": 32, "gpt2attent": 32, "analyz": [32, 33], "probabl": 32, "aggreg": 32, "confid": 32, "probs_lay": 32, "layer_output": 32, "obtain": [32, 35], "prob": 32, "cat": 32, "maximum": 32, "max_prob": 32, "unicode_escap": 32, "layer_token": 32, "input_word": 32, "output_word": 32, "cmap": 32, "diverging_palett": 32, "255": 32, "as_cmap": 32, "figur": 32, "figsiz": 32, "ax": 32, "heatmap": 32, "arrai": 32, "fmt": 32, "linewidth": 32, "cbar_kw": 32, "xlabel": 32, "ylabel": 32, "ytick": 32, "gca": 32, "xaxi": 32, "tick_top": 32, "set_label_posit": 32, "xtick": 32, "vertic": 32, "axi": 32, "guess": 32, "accord": 32, "color": 32, "ai": 33, "black": 33, "transpar": 33, "team": [33, 34], "lab": 33, "independ": 33, "alik": 33, "passion": 33, "collabor": 33, "profoundli": 33, "tini": 33, "upgrad": 33, "submodul": 33, "complementari": 33, "requires_grad_": 33, "tiny_model": 33, "reflect": 33, "talk": 33, "conclud": 33, "common": [33, 34], "myfil": 33, "txt": 33, "Being": 33, "enough": 33, "discuss": 33, "intuit": 33, "But": 33, "explanatori": 33, "until": 33, "defer": 33, "eventu": 33, "put": 33, "oh": 33, "why": 33, "fix": 33, "2687": 33, "3314": 33, "discov": 33, "coincident": 33, "l1_output": 33, "2341": 33, "3416": 33, "8637": 33, "5382": 33, "3792": 33, "1253": 33, "4137": 33, "5758": 33, "3158": 33, "1226": 33, "rest": 33, "analysi": 33, "highest": 33, "l1_amax": 33, "seamlessli": 33, "hold": 33, "didn": 33, "3797": 33, "those": 33, "7796": 33, "ml": 33, "exactli": 33, "influenc": 33, "l1_output_befor": 33, "0th": 33, "l1_output_aft": 33, "seem": 33, "380": 33, "379": 33, "382": 33, "caus": 33, "localbackend": 33, "147": 33, "143": 33, "145": 33, "148": 33, "149": 33, "151": 33, "152": 33, "154": 33, "155": 33, "462": 33, "454": 33, "455": 33, "456": 33, "458": 33, "459": 33, "460": 33, "463": 33, "465": 33, "466": 33, "467": 33, "468": 33, "469": 33, "470": 33, "471": 33, "472": 33, "473": 33, "574": 33, "571": 33, "573": 33, "474": 33, "475": 33, "todo": 33, "476": 33, "584": 33, "prepared_input": 33, "581": 33, "582": 33, "585": 33, "586": 33, "587": 33, "1553": 33, "_wrapped_call_impl": 33, "1551": 33, "_compiled_call_impl": 33, "misc": 33, "1552": 33, "_call_impl": 33, "1603": 33, "1600": 33, "bw_hook": 33, "backwardhook": 33, "full_backward_hook": 33, "backward_pre_hook": 33, "setup_input_hook": 33, "forward_cal": 33, "1604": 33, "_global_forward_hook": 33, "_forward_hook": 33, "1605": 33, "hook_id": 33, "1606": 33, "1607": 33, "1608": 33, "1609": 33, "mark": 33, "219": 33, "217": 33, "220": 33, "1616": 33, "1614": 33, "hook_result": 33, "1615": 33, "1618": 33, "1619": 33, "559": 33, "558": 33, "449": 33, "442": 33, "443": 33, "444": 33, "445": 33, "446": 33, "448": 33, "451": 33, "452": 33, "453": 33, "410": 33, "407": 33, "409": 33, "413": 33, "387": 33, "383": 33, "385": 33, "388": 33, "389": 33, "391": 33, "392": 33, "setitem_0": 33, "6063279136": 33, "wrong": 33, "henc": 33, "feasibl": 33, "varianc": 33, "2283": 33, "3262": 33, "8443": 33, "5498": 33, "3424": 33, "1178": 33, "4780": 33, "5522": 33, "2394": 33, "1264": 33, "backpropag": 33, "layer1_output_grad": 33, "layer2_output_grad": 33, "propag": 33, "2777": 33, "1917": 33, "1359": 33, "2426": 33, "1477": 33, "0748": 33, "1204": 33, "1260": 33, "2847": 33, "previous": 33, "doubl": 33, "23": 33, "belt": 33, "bare": 33, "bone": 33, "excit": 33, "automat": 33, "gpt": 33, "llm": 33, "gpt2sdpaattent": 33, "evenli": 33, "model_doc": 33, "aren": 33, "simpler": 33, "token_id": 33, "ntoken": 33, "338": 33, "3576": 33, "london": 33, "piec": 33, "miss": 33, "Of": 33, "behind": 33, "scene": 33, "guarante": 33, "arbitrari": 33, "broadcast": 33, "laguagemodel": 33, "max_length": 33, "truncat": 33, "29": 33, "token_ids_intervent": 33, "token_ids_origin": 33, "affect": 33, "neat": 33, "cool": 33, "transfer": 33, "placehold": 33, "onto": 33, "At": 33, "match": 33, "31": 33, "token_ids_1": 33, "token_ids_2": 33, "token_ids_3": 33, "npredict": 33, "32": 33, "llm_edit": 33, "33": 33, "democrat": 33, "half": 33, "fairli": 33, "straightforward": 33, "json": 33, "amp": 33, "37": 33, "4a6576dd": 33, "b5fd": 33, "4f1f": 33, "9836": 33, "a619f8277057": 33, "207": 33, "416": 33, "30mb": 33, "900": 33, "28ac8e47": 33, "fa48": 33, "45a1": 33, "acb0": 33, "3e17960e36b8": 33, "934": 33, "935": 33, "951": 33, "953": 33, "11mb": 33, "problem": 33, "689": 33, "667c4310": 33, "9041": 33, "451d": 33, "99a5": 33, "f713f639abb8": 33, "708": 33, "726": 33, "332": 33, "49mb": 33, "315": 33, "8734ee75": 33, "b616": 33, "4270": 33, "9d4d": 33, "7cfabd6d63a": 33, "334": 33, "342": 33, "354": 33, "06k": 33, "7mb": 33, "friendli": 33, "interfac": 33, "Ins": 33, "compl": 33, "551": 33, "5f0b434d": 33, "178d": 33, "4807": 33, "913f": 33, "331f403eb0ea": 33, "593": 33, "594": 33, "610": 33, "611": 33, "630": 33, "992": 33, "68mb": 33, "niec": 33, "bunch": 33, "someon": 33, "delv": 33, "cover": 33, "091": 33, "3e78f88a": 33, "e620": 33, "4679": 33, "ac73": 33, "abeb4f14ce8": 33, "146": 33, "166": 33, "704": 33, "6289": 33, "1172": 33, "6719": 33, "1816": 33, "2715": 33, "5547": 33, "2812": 33, "8086": 33, "5820": 33, "7070": 33, "1094": 33, "2910": 33, "6016": 33, "6602": 33, "4590": 33, "3477": 33, "3438": 33, "1797": 33, "0312": 33, "0469": 33, "7930": 33, "4141": 33, "853": 33, "0859": 33, "6523": 33, "1758": 33, "2637": 33, "5391": 33, "2422": 33, "7852": 33, "0625": 33, "5664": 33, "0781": 33, "2832": 33, "6406": 33, "4453": 33, "3379": 33, "3047": 33, "0156": 33, "7695": 33, "4023": 33, "983": 33, "5898": 33, "0547": 33, "6328": 33, "1709": 33, "2559": 33, "5234": 33, "2031": 33, "7617": 33, "5508": 33, "6680": 33, "2754": 33, "6211": 33, "4316": 33, "3281": 33, "2656": 33, "9688": 33, "7461": 33, "3906": 33, "5703": 33, "0234": 33, "6133": 33, "1660": 33, "2480": 33, "5078": 33, "1641": 33, "7383": 33, "5352": 33, "6484": 33, "2676": 33, "4180": 33, "3184": 33, "2266": 33, "9414": 33, "9531": 33, "7227": 33, "3789": 33, "9922": 33, "1611": 33, "2402": 33, "4922": 33, "7148": 33, "5195": 33, "2598": 33, "4844": 33, "3086": 33, "9141": 33, "9258": 33, "6992": 33, "374": 33, "5742": 33, "2334": 33, "4766": 33, "1016": 33, "6953": 33, "5039": 33, "2520": 33, "3945": 33, "2988": 33, "1484": 33, "8867": 33, "8984": 33, "6797": 33, "3555": 33, "755": 33, "9336": 33, "5586": 33, "1514": 33, "4629": 33, "0703": 33, "4883": 33, "2441": 33, "2891": 33, "8711": 33, "3457": 33, "757": 33, "5430": 33, "1465": 33, "2197": 33, "4492": 33, "0391": 33, "6562": 33, "4727": 33, "2363": 33, "8320": 33, "8438": 33, "3359": 33, "8789": 33, "5273": 33, "1426": 33, "2129": 33, "4355": 33, "0078": 33, "6367": 33, "2295": 33, "3594": 33, "2734": 33, "8203": 33, "8516": 33, "5117": 33, "1387": 33, "2061": 33, "4219": 33, "9766": 33, "2227": 33, "3164": 33, "901": 33, "133k": 33, "571kb": 33, "c1c6e24c": 33, "9f3f": 33, "415b": 33, "8f90": 33, "de8404fc2e74": 33, "539": 33, "572": 33, "695": 33, "31k": 33, "88mb": 33, "begin_of_text": 33, "203": 33, "88838ccd": 33, "230d": 33, "485b": 33, "8f57": 33, "8399453c2250": 33, "224": 33, "231": 33, "350": 33, "93mb": 33, "caveat": 33, "websit": 33, "twitter": 33, "ndif_team": 33, "star": 34, "walk": 34, "system": 35, "boundless": 36, "da": 36, "identifi": 36, "mechan": 36, "spars": 36, "price": 36, "tag": 36, "game": 36, "prealign": 36, "bigger": 36}, "objects": {"nnsight": [[2, 0, 0, "-", "contexts"], [3, 0, 0, "-", "envoy"], [4, 0, 0, "-", "intervention"], [5, 0, 0, "-", "models"], [6, 0, 0, "-", "patching"], [7, 0, 0, "-", "schema"], [8, 0, 0, "-", "tracing"], [9, 0, 0, "-", "util"]], "nnsight.contexts": [[2, 0, 0, "-", "Conditional"], [2, 0, 0, "-", "GraphBasedContext"], [2, 0, 0, "-", "Invoker"], [2, 0, 0, "-", "Tracer"], [2, 4, 1, "", "check_for_dependencies"], [2, 4, 1, "", "resolve_dependencies"]], "nnsight.contexts.Conditional": [[2, 1, 1, "", "Conditional"], [2, 1, 1, "", "ConditionalManager"]], "nnsight.contexts.Conditional.Conditional": [[2, 2, 1, "", "_condition"], [2, 2, 1, "", "_graph"]], "nnsight.contexts.Conditional.ConditionalManager": [[2, 2, 1, "", "_conditional_dict"], [2, 2, 1, "", "_conditional_stack"], [2, 2, 1, "", "_conditioned_nodes_dict"], [2, 3, 1, "", "add_conditioned_node"], [2, 3, 1, "", "get"], [2, 3, 1, "", "is_node_conditioned"], [2, 3, 1, "", "peek"], [2, 3, 1, "", "pop"], [2, 3, 1, "", "push"]], "nnsight.contexts.GraphBasedContext": [[2, 1, 1, "", "GlobalTracingContext"], [2, 1, 1, "", "GraphBasedContext"]], "nnsight.contexts.GraphBasedContext.GlobalTracingContext": [[2, 1, 1, "", "GlobalTracingExit"], [2, 1, 1, "", "GlobalTracingTorchHandler"], [2, 3, 1, "", "deregister"], [2, 3, 1, "", "register"], [2, 3, 1, "", "try_deregister"], [2, 3, 1, "", "try_register"]], "nnsight.contexts.GraphBasedContext.GraphBasedContext": [[2, 3, 1, "", "apply"], [2, 3, 1, "", "bool"], [2, 3, 1, "", "bridge_backend_handle"], [2, 3, 1, "", "bytearray"], [2, 3, 1, "", "bytes"], [2, 3, 1, "", "complex"], [2, 3, 1, "", "cond"], [2, 3, 1, "", "dict"], [2, 3, 1, "", "exit"], [2, 3, 1, "", "float"], [2, 3, 1, "", "int"], [2, 3, 1, "", "list"], [2, 3, 1, "", "log"], [2, 3, 1, "", "set"], [2, 3, 1, "", "str"], [2, 3, 1, "", "tuple"], [2, 3, 1, "", "vis"]], "nnsight.contexts.Invoker": [[2, 1, 1, "", "Invoker"]], "nnsight.contexts.Invoker.Invoker": [[2, 2, 1, "", "inputs"], [2, 2, 1, "", "kwargs"], [2, 2, 1, "", "scan"], [2, 2, 1, "", "scanning"], [2, 2, 1, "", "tracer"]], "nnsight.contexts.Tracer": [[2, 1, 1, "", "Tracer"]], "nnsight.contexts.Tracer.Tracer": [[2, 2, 1, "", "_args"], [2, 2, 1, "", "_graph"], [2, 2, 1, "", "_invoker"], [2, 2, 1, "", "_invoker_inputs"], [2, 2, 1, "", "_kwargs"], [2, 2, 1, "", "_model"], [2, 3, 1, "", "edit_backend_execute"], [2, 3, 1, "", "invoke"], [2, 3, 1, "", "local_backend_execute"], [2, 3, 1, "", "next"], [2, 3, 1, "", "remote_backend_get_model_key"], [2, 3, 1, "", "remote_backend_handle_result_value"], [2, 3, 1, "", "remote_backend_postprocess_result"]], "nnsight.contexts.session": [[2, 0, 0, "-", "Iterator"], [2, 0, 0, "-", "Session"]], "nnsight.contexts.session.Iterator": [[2, 1, 1, "", "Iterator"]], "nnsight.contexts.session.Session": [[2, 1, 1, "", "Session"]], "nnsight.contexts.session.Session.Session": [[2, 2, 1, "", "backend"], [2, 2, 1, "", "bridge"], [2, 2, 1, "", "graph"], [2, 3, 1, "", "iter"], [2, 3, 1, "", "local_backend_execute"], [2, 2, 1, "", "model"], [2, 3, 1, "", "remote_backend_get_model_key"], [2, 3, 1, "", "remote_backend_handle_result_value"], [2, 3, 1, "", "remote_backend_postprocess_result"]], "nnsight.envoy": [[3, 1, 1, "", "Envoy"]], "nnsight.envoy.Envoy": [[3, 2, 1, "", "_call_iter"], [3, 2, 1, "", "_fake_inputs"], [3, 2, 1, "", "_fake_outputs"], [3, 2, 1, "", "_tracer"], [3, 5, 1, "id0", "input"], [3, 5, 1, "", "inputs"], [3, 3, 1, "", "modules"], [3, 3, 1, "", "named_modules"], [3, 5, 1, "id1", "output"], [3, 2, 1, "", "path"], [3, 3, 1, "", "to"]], "nnsight.intervention": [[4, 1, 1, "", "HookHandler"], [4, 1, 1, "", "InterventionHandler"], [4, 1, 1, "", "InterventionProtocol"], [4, 1, 1, "", "InterventionProxy"]], "nnsight.intervention.HookHandler": [[4, 2, 1, "", "handles"], [4, 2, 1, "", "input_hook"], [4, 2, 1, "", "model"], [4, 2, 1, "", "modules"], [4, 2, 1, "", "output_hook"]], "nnsight.intervention.InterventionHandler": [[4, 3, 1, "", "count"]], "nnsight.intervention.InterventionProtocol": [[4, 3, 1, "", "add"], [4, 3, 1, "", "get_interventions"], [4, 3, 1, "", "intervene"], [4, 3, 1, "", "style"]], "nnsight.intervention.InterventionProxy": [[4, 5, 1, "", "device"], [4, 5, 1, "", "dtype"], [4, 5, 1, "", "grad"], [4, 3, 1, "", "save"], [4, 5, 1, "", "shape"], [4, 3, 1, "", "stop"], [4, 3, 1, "", "update"]], "nnsight.models": [[5, 0, 0, "-", "LanguageModel"], [5, 0, 0, "-", "NNsightModel"], [5, 0, 0, "-", "UnifiedTransformer"]], "nnsight.models.LanguageModel": [[5, 1, 1, "", "LanguageModel"], [5, 1, 1, "", "LanguageModelProxy"], [5, 1, 1, "", "TokenIndexer"]], "nnsight.models.LanguageModel.LanguageModel": [[5, 2, 1, "", "automodel"], [5, 2, 1, "", "config"], [5, 2, 1, "", "model"], [5, 2, 1, "", "proxy_class"], [5, 2, 1, "", "tokenizer"]], "nnsight.models.LanguageModel.LanguageModelProxy": [[5, 5, 1, "", "t"], [5, 5, 1, "", "token"]], "nnsight.models.NNsightModel": [[5, 1, 1, "", "MetaDispatcher"], [5, 1, 1, "", "NNsight"]], "nnsight.models.NNsightModel.NNsight": [[5, 2, 1, "", "_args"], [5, 2, 1, "", "_custom_model"], [5, 2, 1, "", "_dispatched"], [5, 2, 1, "", "_envoy"], [5, 2, 1, "", "_kwargs"], [5, 2, 1, "", "_model"], [5, 2, 1, "", "_model_key"], [5, 2, 1, "", "_session"], [5, 3, 1, "", "clear_edits"], [5, 3, 1, "", "dispatch_model"], [5, 3, 1, "", "edit"], [5, 3, 1, "", "interleave"], [5, 2, 1, "", "proxy_class"], [5, 3, 1, "", "scan"], [5, 3, 1, "", "session"], [5, 3, 1, "", "to"], [5, 3, 1, "", "trace"]], "nnsight.models.UnifiedTransformer": [[5, 1, 1, "", "UnifiedTransformer"]], "nnsight.patching": [[6, 1, 1, "", "Patch"], [6, 1, 1, "", "Patcher"]], "nnsight.patching.Patch": [[6, 2, 1, "", "obj"], [6, 2, 1, "", "parent"], [6, 3, 1, "", "patch"], [6, 2, 1, "", "replacement"], [6, 3, 1, "", "restore"]], "nnsight.patching.Patcher": [[6, 3, 1, "", "add"], [6, 2, 1, "", "patches"]], "nnsight.schema": [[7, 0, 0, "-", "Config"], [7, 0, 0, "-", "Response"]], "nnsight.schema.Config": [[7, 1, 1, "", "ApiConfigModel"], [7, 1, 1, "", "AppConfigModel"], [7, 1, 1, "", "ConfigModel"]], "nnsight.schema.Config.ApiConfigModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.Config.AppConfigModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.Config.ConfigModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.Response": [[7, 1, 1, "", "ResponseModel"], [7, 1, 1, "", "ResultModel"]], "nnsight.schema.Response.ResponseModel": [[7, 1, 1, "", "JobStatus"], [7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.Response.ResultModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format": [[7, 0, 0, "-", "functions"], [7, 0, 0, "-", "types"]], "nnsight.schema.format.types": [[7, 1, 1, "", "BaseNNsightModel"], [7, 1, 1, "", "DictModel"], [7, 1, 1, "", "EllipsisModel"], [7, 1, 1, "", "FunctionModel"], [7, 6, 1, "", "FunctionWhitelistError"], [7, 1, 1, "", "GraphModel"], [7, 1, 1, "", "IteratorModel"], [7, 1, 1, "", "ListModel"], [7, 1, 1, "", "NodeModel"], [7, 1, 1, "", "PrimitiveModel"], [7, 1, 1, "", "SessionModel"], [7, 1, 1, "", "SliceModel"], [7, 1, 1, "", "TensorModel"], [7, 1, 1, "", "TracerModel"], [7, 1, 1, "", "TupleModel"]], "nnsight.schema.format.types.BaseNNsightModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.DictModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.EllipsisModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.FunctionModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.GraphModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.IteratorModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.ListModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.NodeModel": [[7, 1, 1, "", "Reference"], [7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.NodeModel.Reference": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.PrimitiveModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.SessionModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.SliceModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.TensorModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.TracerModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.TupleModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.tracing": [[8, 0, 0, "-", "Bridge"], [8, 0, 0, "-", "Graph"], [8, 0, 0, "-", "Node"], [8, 0, 0, "-", "Proxy"], [8, 0, 0, "-", "protocols"]], "nnsight.tracing.Bridge": [[8, 1, 1, "", "Bridge"]], "nnsight.tracing.Bridge.Bridge": [[8, 3, 1, "", "add"], [8, 3, 1, "", "add_bridge_proxy"], [8, 2, 1, "", "bridged_nodes"], [8, 3, 1, "", "get_bridge_proxy"], [8, 3, 1, "", "get_graph"], [8, 2, 1, "", "graph_stack"], [8, 2, 1, "", "id_to_graph"], [8, 2, 1, "", "locks"], [8, 3, 1, "", "peek_graph"], [8, 3, 1, "", "pop_graph"]], "nnsight.tracing.Graph": [[8, 1, 1, "", "Graph"]], "nnsight.tracing.Graph.Graph": [[8, 3, 1, "", "add"], [8, 2, 1, "", "alive"], [8, 2, 1, "", "attachments"], [8, 3, 1, "", "copy"], [8, 3, 1, "", "create"], [8, 3, 1, "", "execute"], [8, 2, 1, "", "name_idx"], [8, 2, 1, "", "nodes"], [8, 3, 1, "", "reset"], [8, 2, 1, "", "sequential"], [8, 2, 1, "", "validate"], [8, 3, 1, "", "vis"]], "nnsight.tracing.Node": [[8, 1, 1, "", "Node"]], "nnsight.tracing.Node.Node": [[8, 2, 1, "", "arg_dependencies"], [8, 2, 1, "", "args"], [8, 3, 1, "", "attached"], [8, 3, 1, "", "clean"], [8, 2, 1, "", "cond_dependency"], [8, 3, 1, "", "create"], [8, 3, 1, "", "destroy"], [8, 3, 1, "", "done"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "executed"], [8, 3, 1, "", "fulfilled"], [8, 2, 1, "", "graph"], [8, 2, 1, "", "kwargs"], [8, 2, 1, "", "listeners"], [8, 2, 1, "", "name"], [8, 3, 1, "", "prepare_inputs"], [8, 3, 1, "", "preprocess"], [8, 2, 1, "", "proxy"], [8, 2, 1, "", "proxy_value"], [8, 3, 1, "", "redundant"], [8, 3, 1, "", "reset"], [8, 3, 1, "", "set_value"], [8, 2, 1, "", "target"], [8, 5, 1, "id0", "value"], [8, 3, 1, "", "visualize"]], "nnsight.tracing.Proxy": [[8, 1, 1, "", "Proxy"], [8, 4, 1, "", "proxy_wrapper"]], "nnsight.tracing.Proxy.Proxy": [[8, 2, 1, "", "node"], [8, 5, 1, "", "value"]], "nnsight.tracing.protocols": [[8, 1, 1, "", "ApplyModuleProtocol"], [8, 1, 1, "", "BridgeProtocol"], [8, 1, 1, "", "ConditionalProtocol"], [8, 1, 1, "", "EarlyStopProtocol"], [8, 1, 1, "", "GradProtocol"], [8, 1, 1, "", "LocalBackendExecuteProtocol"], [8, 1, 1, "", "LockProtocol"], [8, 1, 1, "", "Protocol"], [8, 1, 1, "", "SwapProtocol"], [8, 1, 1, "", "UpdateProtocol"], [8, 1, 1, "", "ValueProtocol"]], "nnsight.tracing.protocols.ApplyModuleProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "get_module"], [8, 3, 1, "", "set_module"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.BridgeProtocol": [[8, 6, 1, "", "BridgeException"], [8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "get_bridge"], [8, 3, 1, "", "has_bridge"], [8, 3, 1, "", "peek_graph"], [8, 3, 1, "", "set_bridge"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.ConditionalProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "add_conditioned_node"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "get_conditional"], [8, 3, 1, "", "has_conditional"], [8, 3, 1, "", "is_node_conditioned"], [8, 3, 1, "", "peek_conditional"], [8, 3, 1, "", "pop_conditional"], [8, 3, 1, "", "push_conditional"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.EarlyStopProtocol": [[8, 6, 1, "", "EarlyStopException"], [8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.GradProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "increment"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.LocalBackendExecuteProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.LockProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.Protocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.SwapProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "get_swap"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.UpdateProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.ValueProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.util": [[9, 1, 1, "", "WrapperModule"], [9, 4, 1, "", "apply"], [9, 4, 1, "", "fetch_attr"], [9, 4, 1, "", "wrap"]], "nnsight.util.WrapperModule": [[9, 3, 1, "", "forward"]]}, "objtypes": {"0": "py:module", "1": "py:class", "2": "py:attribute", "3": "py:method", "4": "py:function", "5": "py:property", "6": "py:exception"}, "objnames": {"0": ["py", "module", "Python module"], "1": ["py", "class", "Python class"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "method", "Python method"], "4": ["py", "function", "Python function"], "5": ["py", "property", "Python property"], "6": ["py", "exception", "Python exception"]}, "titleterms": {"about": 0, "nnsight": [0, 2, 3, 4, 5, 6, 7, 8, 9, 11], "an": 0, "api": 0, "transpar": 0, "scienc": 0, "black": 0, "box": 0, "ai": 0, "how": 0, "do": 0, "i": [0, 33], "us": 0, "what": 0, "happen": 0, "behind": 0, "scene": 0, "document": 1, "context": [2, 33], "envoi": 3, "intervent": [4, 12, 13, 18, 33], "model": [5, 20, 32, 33], "patch": [6, 28, 29], "schema": 7, "trace": [8, 33], "util": 9, "featur": 10, "condit": [12, 33], "cross": 13, "prompt": 13, "custom": [14, 33], "function": [14, 33], "earli": [15, 33], "stop": [15, 33], "get": [16, 33, 34], "valu": [16, 27], "gradient": [17, 33], "iter": 18, "lora": [19, 33], "edit": [20, 33], "modul": 21, "multipl": 22, "token": 22, "gener": 22, "oper": [23, 33], "remot": [24, 33], "execut": [24, 33], "scan": 25, "valid": 25, "session": [26, 33], "set": [27, 33], "activ": 28, "attribut": 29, "setup": [29, 30, 32], "ignor": [29, 30, 32], "boundless": 30, "da": 30, "price": 30, "tag": 30, "game": 30, "prealign": 30, "task": 30, "dictionari": 31, "learn": 31, "logit": 32, "len": 32, "introduct": 32, "gpt2": 32, "architectur": 32, "visual": 32, "gpt": 32, "2": [32, 33], "layer": 32, "interpret": 32, "walkthrough": 33, "1": 33, "first": [33, 34], "let": 33, "": 33, "start": [33, 34], "small": 33, "method": 33, "bigger": 33, "languagemodel": 33, "batch": 33, "next": 33, "3": 33, "thought": 33, "you": 33, "said": 33, "huge": 33, "loop": 33, "train": 33, "involv": 33, "instal": 34, "step": 34, "statu": 35, "tutori": 36}, "envversion": {"sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "nbsphinx": 4, "sphinx.ext.viewcode": 1, "sphinx": 60}, "alltitles": {"About NNsight": [[0, "about-nnsight"]], "An API for transparent science on black-box AI.": [[0, "an-api-for-transparent-science-on-black-box-ai"]], "How do I use NNsight?": [[0, "how-do-i-use-nnsight"]], "What happens behind the scenes?": [[0, "what-happens-behind-the-scenes"]], "Documentation": [[1, "documentation"]], "nnsight.contexts": [[2, "module-nnsight.contexts"]], "nnsight.envoy": [[3, "module-nnsight.envoy"]], "nnsight.intervention": [[4, "module-nnsight.intervention"]], "nnsight.models": [[5, "module-nnsight.models"]], "nnsight.patching": [[6, "module-nnsight.patching"]], "nnsight.schema": [[7, "module-nnsight.schema"]], "nnsight.tracing": [[8, "module-nnsight.tracing"]], "nnsight.util": [[9, "module-nnsight.util"]], "Features": [[10, "features"]], "nnsight": [[11, "nnsight"]], "Conditional Interventions": [[12, "Conditional-Interventions"], [33, "Conditional-Interventions"]], "Cross-Prompt Intervention": [[13, "Cross-Prompt-Intervention"]], "Custom Functions": [[14, "Custom-Functions"], [33, "Custom-Functions"]], "Early Stopping": [[15, "Early-Stopping"], [33, "Early-Stopping"]], "Getting Values": [[16, "Getting-Values"]], "Gradients": [[17, "Gradients"], [33, "Gradients"]], "Iterative Interventions": [[18, "Iterative-Interventions"]], "LoRA": [[19, "LoRA"]], "Model Editing": [[20, "Model-Editing"], [33, "Model-Editing"]], "Modules": [[21, "Modules"]], "Multiple Token Generation": [[22, "Multiple-Token-Generation"]], "Operations": [[23, "Operations"]], "Remote Execution": [[24, "Remote-Execution"]], "Scan and Validate": [[25, "Scan-and-Validate"]], "Sessions": [[26, "Sessions"], [33, "Sessions"]], "Setting Values": [[27, "Setting-Values"]], "Activation Patching": [[28, "Activation-Patching"]], "Attribution Patching": [[29, "Attribution-Patching"]], "Setup (Ignore)": [[29, "Setup-(Ignore)"], [30, "Setup-(Ignore)"], [32, "Setup-(Ignore)"]], "Boundless DAS": [[30, "Boundless-DAS"], [30, "id1"]], "Price Tagging game": [[30, "Price-Tagging-game"]], "Prealign Task": [[30, "Prealign-Task"]], "Dictionary Learning": [[31, "Dictionary-Learning"]], "Logit Lens": [[32, "Logit-Lens"]], "Introduction to Logit Lens": [[32, "Introduction-to-Logit-Lens"]], "GPT2 Model Architecture": [[32, "GPT2-Model-Architecture"]], "Visualizing GPT-2 Layer Interpretations": [[32, "Visualizing-GPT-2-Layer-Interpretations"]], "Walkthrough": [[33, "Walkthrough"]], "1\ufe0f\u20e3 First, let\u2019s start small": [[33, "1\ufe0f\u20e3-First,-let's-start-small"]], "Tracing Context": [[33, "Tracing-Context"]], "Getting": [[33, "Getting"]], "Functions, Methods, and Operations": [[33, "Functions,-Methods,-and-Operations"]], "Setting": [[33, "Setting"]], "2\ufe0f\u20e3 Bigger": [[33, "2\ufe0f\u20e3-Bigger"]], "LanguageModel": [[33, "LanguageModel"]], "Batching": [[33, "Batching"]], ".next()": [[33, ".next()"]], "3\ufe0f\u20e3 I thought you said huge models?": [[33, "3\ufe0f\u20e3-I-thought-you-said-huge-models?"]], "Remote execution": [[33, "Remote-execution"]], "Looping": [[33, "Looping"]], "Training a LoRA": [[33, "Training-a-LoRA"]], "Getting Involved!": [[33, "Getting-Involved!"]], "Getting Started": [[34, "getting-started"]], "Installation": [[34, "installation"]], "First Steps": [[34, "first-steps"]], "Status": [[35, "status"]], "Tutorials": [[36, "tutorials"]]}, "indexentries": {"conditional (class in nnsight.contexts.conditional)": [[2, "nnsight.contexts.Conditional.Conditional"]], "conditionalmanager (class in nnsight.contexts.conditional)": [[2, "nnsight.contexts.Conditional.ConditionalManager"]], "globaltracingcontext (class in nnsight.contexts.graphbasedcontext)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext"]], "globaltracingcontext.globaltracingexit (class in nnsight.contexts.graphbasedcontext)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.GlobalTracingExit"]], "globaltracingcontext.globaltracingtorchhandler (class in nnsight.contexts.graphbasedcontext)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.GlobalTracingTorchHandler"]], "graphbasedcontext (class in nnsight.contexts.graphbasedcontext)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext"]], "invoker (class in nnsight.contexts.invoker)": [[2, "nnsight.contexts.Invoker.Invoker"]], "iterator (class in nnsight.contexts.session.iterator)": [[2, "nnsight.contexts.session.Iterator.Iterator"]], "session (class in nnsight.contexts.session.session)": [[2, "nnsight.contexts.session.Session.Session"]], "tracer (class in nnsight.contexts.tracer)": [[2, "nnsight.contexts.Tracer.Tracer"]], "_args (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._args"]], "_condition (nnsight.contexts.conditional.conditional attribute)": [[2, "nnsight.contexts.Conditional.Conditional._condition"]], "_conditional_dict (nnsight.contexts.conditional.conditionalmanager attribute)": [[2, "nnsight.contexts.Conditional.ConditionalManager._conditional_dict"]], "_conditional_stack (nnsight.contexts.conditional.conditionalmanager attribute)": [[2, "nnsight.contexts.Conditional.ConditionalManager._conditional_stack"]], "_conditioned_nodes_dict (nnsight.contexts.conditional.conditionalmanager attribute)": [[2, "nnsight.contexts.Conditional.ConditionalManager._conditioned_nodes_dict"]], "_graph (nnsight.contexts.conditional.conditional attribute)": [[2, "nnsight.contexts.Conditional.Conditional._graph"]], "_graph (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._graph"]], "_invoker (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._invoker"]], "_invoker_inputs (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._invoker_inputs"]], "_kwargs (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._kwargs"]], "_model (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._model"]], "add_conditioned_node() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.add_conditioned_node"]], "apply() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.apply"]], "backend (nnsight.contexts.session.session.session attribute)": [[2, "nnsight.contexts.session.Session.Session.backend"]], "bool() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.bool"]], "bridge (nnsight.contexts.session.session.session attribute)": [[2, "nnsight.contexts.session.Session.Session.bridge"]], "bridge_backend_handle() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.bridge_backend_handle"]], "bytearray() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.bytearray"]], "bytes() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.bytes"]], "check_for_dependencies() (in module nnsight.contexts)": [[2, "nnsight.contexts.check_for_dependencies"]], "complex() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.complex"]], "cond() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.cond"]], "deregister() (nnsight.contexts.graphbasedcontext.globaltracingcontext static method)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.deregister"]], "dict() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.dict"]], "edit_backend_execute() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.edit_backend_execute"]], "exit() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.exit"]], "float() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.float"]], "get() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.get"]], "graph (nnsight.contexts.session.session.session attribute)": [[2, "nnsight.contexts.session.Session.Session.graph"]], "inputs (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.inputs"]], "int() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.int"]], "invoke() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.invoke"]], "is_node_conditioned() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.is_node_conditioned"]], "iter() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.iter"]], "kwargs (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.kwargs"]], "list() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.list"]], "local_backend_execute() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.local_backend_execute"]], "local_backend_execute() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.local_backend_execute"]], "log() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.log"]], "model (nnsight.contexts.session.session.session attribute)": [[2, "nnsight.contexts.session.Session.Session.model"]], "module": [[2, "module-nnsight.contexts"], [2, "module-nnsight.contexts.Conditional"], [2, "module-nnsight.contexts.GraphBasedContext"], [2, "module-nnsight.contexts.Invoker"], [2, "module-nnsight.contexts.Tracer"], [2, "module-nnsight.contexts.session.Iterator"], [2, "module-nnsight.contexts.session.Session"], [3, "module-nnsight.envoy"], [4, "module-nnsight.intervention"], [5, "module-nnsight.models"], [5, "module-nnsight.models.LanguageModel"], [5, "module-nnsight.models.NNsightModel"], [5, "module-nnsight.models.UnifiedTransformer"], [6, "module-nnsight.patching"], [7, "module-nnsight.schema"], [7, "module-nnsight.schema.Config"], [7, "module-nnsight.schema.Response"], [7, "module-nnsight.schema.format.functions"], [7, "module-nnsight.schema.format.types"], [8, "module-nnsight.tracing"], [8, "module-nnsight.tracing.Bridge"], [8, "module-nnsight.tracing.Graph"], [8, "module-nnsight.tracing.Node"], [8, "module-nnsight.tracing.Proxy"], [8, "module-nnsight.tracing.protocols"], [9, "module-nnsight.util"]], "next() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.next"]], "nnsight.contexts": [[2, "module-nnsight.contexts"]], "nnsight.contexts.conditional": [[2, "module-nnsight.contexts.Conditional"]], "nnsight.contexts.graphbasedcontext": [[2, "module-nnsight.contexts.GraphBasedContext"]], "nnsight.contexts.invoker": [[2, "module-nnsight.contexts.Invoker"]], "nnsight.contexts.tracer": [[2, "module-nnsight.contexts.Tracer"]], "nnsight.contexts.session.iterator": [[2, "module-nnsight.contexts.session.Iterator"]], "nnsight.contexts.session.session": [[2, "module-nnsight.contexts.session.Session"]], "peek() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.peek"]], "pop() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.pop"]], "push() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.push"]], "register() (nnsight.contexts.graphbasedcontext.globaltracingcontext static method)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.register"]], "remote_backend_get_model_key() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.remote_backend_get_model_key"]], "remote_backend_get_model_key() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.remote_backend_get_model_key"]], "remote_backend_handle_result_value() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.remote_backend_handle_result_value"]], "remote_backend_handle_result_value() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.remote_backend_handle_result_value"]], "remote_backend_postprocess_result() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.remote_backend_postprocess_result"]], "remote_backend_postprocess_result() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.remote_backend_postprocess_result"]], "resolve_dependencies() (in module nnsight.contexts)": [[2, "nnsight.contexts.resolve_dependencies"]], "scan (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.scan"]], "scanning (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.scanning"]], "set() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.set"]], "str() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.str"]], "tracer (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.tracer"]], "try_deregister() (nnsight.contexts.graphbasedcontext.globaltracingcontext static method)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.try_deregister"]], "try_register() (nnsight.contexts.graphbasedcontext.globaltracingcontext static method)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.try_register"]], "tuple() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.tuple"]], "vis() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.vis"]], "envoy (class in nnsight.envoy)": [[3, "nnsight.envoy.Envoy"]], "_call_iter (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy._call_iter"]], "_fake_inputs (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy._fake_inputs"]], "_fake_outputs (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy._fake_outputs"]], "_tracer (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy._tracer"]], "input (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy.input"]], "input (nnsight.envoy.envoy property)": [[3, "id0"]], "inputs (nnsight.envoy.envoy property)": [[3, "nnsight.envoy.Envoy.inputs"]], "modules() (nnsight.envoy.envoy method)": [[3, "nnsight.envoy.Envoy.modules"]], "named_modules() (nnsight.envoy.envoy method)": [[3, "nnsight.envoy.Envoy.named_modules"]], "nnsight.envoy": [[3, "module-nnsight.envoy"]], "output (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy.output"]], "output (nnsight.envoy.envoy property)": [[3, "id1"]], "path (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy.path"]], "to() (nnsight.envoy.envoy method)": [[3, "nnsight.envoy.Envoy.to"]], "hookhandler (class in nnsight.intervention)": [[4, "nnsight.intervention.HookHandler"]], "interventionhandler (class in nnsight.intervention)": [[4, "nnsight.intervention.InterventionHandler"]], "interventionprotocol (class in nnsight.intervention)": [[4, "nnsight.intervention.InterventionProtocol"]], "interventionproxy (class in nnsight.intervention)": [[4, "nnsight.intervention.InterventionProxy"]], "add() (nnsight.intervention.interventionprotocol class method)": [[4, "nnsight.intervention.InterventionProtocol.add"]], "count() (nnsight.intervention.interventionhandler method)": [[4, "nnsight.intervention.InterventionHandler.count"]], "device (nnsight.intervention.interventionproxy property)": [[4, "nnsight.intervention.InterventionProxy.device"]], "dtype (nnsight.intervention.interventionproxy property)": [[4, "nnsight.intervention.InterventionProxy.dtype"]], "get_interventions() (nnsight.intervention.interventionprotocol class method)": [[4, "nnsight.intervention.InterventionProtocol.get_interventions"]], "grad (nnsight.intervention.interventionproxy property)": [[4, "nnsight.intervention.InterventionProxy.grad"]], "handles (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.handles"]], "input_hook (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.input_hook"]], "intervene() (nnsight.intervention.interventionprotocol class method)": [[4, "nnsight.intervention.InterventionProtocol.intervene"]], "model (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.model"]], "modules (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.modules"]], "nnsight.intervention": [[4, "module-nnsight.intervention"]], "output_hook (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.output_hook"]], "save() (nnsight.intervention.interventionproxy method)": [[4, "nnsight.intervention.InterventionProxy.save"]], "shape (nnsight.intervention.interventionproxy property)": [[4, "nnsight.intervention.InterventionProxy.shape"]], "stop() (nnsight.intervention.interventionproxy method)": [[4, "nnsight.intervention.InterventionProxy.stop"]], "style() (nnsight.intervention.interventionprotocol class method)": [[4, "nnsight.intervention.InterventionProtocol.style"]], "update() (nnsight.intervention.interventionproxy method)": [[4, "nnsight.intervention.InterventionProxy.update"]], "languagemodel (class in nnsight.models.languagemodel)": [[5, "nnsight.models.LanguageModel.LanguageModel"]], "languagemodelproxy (class in nnsight.models.languagemodel)": [[5, "nnsight.models.LanguageModel.LanguageModelProxy"]], "metadispatcher (class in nnsight.models.nnsightmodel)": [[5, "nnsight.models.NNsightModel.MetaDispatcher"]], "nnsight (class in nnsight.models.nnsightmodel)": [[5, "nnsight.models.NNsightModel.NNsight"]], "tokenindexer (class in nnsight.models.languagemodel)": [[5, "nnsight.models.LanguageModel.TokenIndexer"]], "unifiedtransformer (class in nnsight.models.unifiedtransformer)": [[5, "nnsight.models.UnifiedTransformer.UnifiedTransformer"]], "_args (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._args"]], "_custom_model (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._custom_model"]], "_dispatched (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._dispatched"]], "_envoy (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._envoy"]], "_kwargs (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._kwargs"]], "_model (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._model"]], "_model_key (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._model_key"]], "_session (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._session"]], "automodel (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.automodel"]], "clear_edits() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.clear_edits"]], "config (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.config"]], "dispatch_model() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.dispatch_model"]], "edit() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.edit"]], "interleave() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.interleave"]], "model (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.model"]], "nnsight.models": [[5, "module-nnsight.models"]], "nnsight.models.languagemodel": [[5, "module-nnsight.models.LanguageModel"]], "nnsight.models.nnsightmodel": [[5, "module-nnsight.models.NNsightModel"]], "nnsight.models.unifiedtransformer": [[5, "module-nnsight.models.UnifiedTransformer"]], "proxy_class (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.proxy_class"]], "proxy_class (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight.proxy_class"]], "scan() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.scan"]], "session() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.session"]], "t (nnsight.models.languagemodel.languagemodelproxy property)": [[5, "nnsight.models.LanguageModel.LanguageModelProxy.t"]], "to() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.to"]], "token (nnsight.models.languagemodel.languagemodelproxy property)": [[5, "nnsight.models.LanguageModel.LanguageModelProxy.token"]], "tokenizer (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.tokenizer"]], "trace() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.trace"]], "patch (class in nnsight.patching)": [[6, "nnsight.patching.Patch"]], "patcher (class in nnsight.patching)": [[6, "nnsight.patching.Patcher"]], "add() (nnsight.patching.patcher method)": [[6, "nnsight.patching.Patcher.add"]], "nnsight.patching": [[6, "module-nnsight.patching"]], "obj (nnsight.patching.patch attribute)": [[6, "nnsight.patching.Patch.obj"]], "parent (nnsight.patching.patch attribute)": [[6, "nnsight.patching.Patch.parent"]], "patch() (nnsight.patching.patch method)": [[6, "nnsight.patching.Patch.patch"]], "patches (nnsight.patching.patcher attribute)": [[6, "nnsight.patching.Patcher.patches"]], "replacement (nnsight.patching.patch attribute)": [[6, "nnsight.patching.Patch.replacement"]], "restore() (nnsight.patching.patch method)": [[6, "nnsight.patching.Patch.restore"]], "apiconfigmodel (class in nnsight.schema.config)": [[7, "nnsight.schema.Config.ApiConfigModel"]], "appconfigmodel (class in nnsight.schema.config)": [[7, "nnsight.schema.Config.AppConfigModel"]], "basennsightmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.BaseNNsightModel"]], "configmodel (class in nnsight.schema.config)": [[7, "nnsight.schema.Config.ConfigModel"]], "dictmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.DictModel"]], "ellipsismodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.EllipsisModel"]], "functionmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.FunctionModel"]], "functionwhitelisterror": [[7, "nnsight.schema.format.types.FunctionWhitelistError"]], "graphmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.GraphModel"]], "iteratormodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.IteratorModel"]], "listmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.ListModel"]], "nodemodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.NodeModel"]], "nodemodel.reference (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.NodeModel.Reference"]], "primitivemodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.PrimitiveModel"]], "responsemodel (class in nnsight.schema.response)": [[7, "nnsight.schema.Response.ResponseModel"]], "responsemodel.jobstatus (class in nnsight.schema.response)": [[7, "nnsight.schema.Response.ResponseModel.JobStatus"]], "resultmodel (class in nnsight.schema.response)": [[7, "nnsight.schema.Response.ResultModel"]], "sessionmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.SessionModel"]], "slicemodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.SliceModel"]], "tensormodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.TensorModel"]], "tracermodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.TracerModel"]], "tuplemodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.TupleModel"]], "model_config (nnsight.schema.config.apiconfigmodel attribute)": [[7, "nnsight.schema.Config.ApiConfigModel.model_config"]], "model_config (nnsight.schema.config.appconfigmodel attribute)": [[7, "nnsight.schema.Config.AppConfigModel.model_config"]], "model_config (nnsight.schema.config.configmodel attribute)": [[7, "nnsight.schema.Config.ConfigModel.model_config"]], "model_config (nnsight.schema.response.responsemodel attribute)": [[7, "nnsight.schema.Response.ResponseModel.model_config"]], "model_config (nnsight.schema.response.resultmodel attribute)": [[7, "nnsight.schema.Response.ResultModel.model_config"]], "model_config (nnsight.schema.format.types.basennsightmodel attribute)": [[7, "nnsight.schema.format.types.BaseNNsightModel.model_config"]], "model_config (nnsight.schema.format.types.dictmodel attribute)": [[7, "nnsight.schema.format.types.DictModel.model_config"]], "model_config (nnsight.schema.format.types.ellipsismodel attribute)": [[7, "nnsight.schema.format.types.EllipsisModel.model_config"]], "model_config (nnsight.schema.format.types.functionmodel attribute)": [[7, "nnsight.schema.format.types.FunctionModel.model_config"]], "model_config (nnsight.schema.format.types.graphmodel attribute)": [[7, "nnsight.schema.format.types.GraphModel.model_config"]], "model_config (nnsight.schema.format.types.iteratormodel attribute)": [[7, "nnsight.schema.format.types.IteratorModel.model_config"]], "model_config (nnsight.schema.format.types.listmodel attribute)": [[7, "nnsight.schema.format.types.ListModel.model_config"]], "model_config (nnsight.schema.format.types.nodemodel attribute)": [[7, "nnsight.schema.format.types.NodeModel.model_config"]], "model_config (nnsight.schema.format.types.nodemodel.reference attribute)": [[7, "nnsight.schema.format.types.NodeModel.Reference.model_config"]], "model_config (nnsight.schema.format.types.primitivemodel attribute)": [[7, "nnsight.schema.format.types.PrimitiveModel.model_config"]], "model_config (nnsight.schema.format.types.sessionmodel attribute)": [[7, "nnsight.schema.format.types.SessionModel.model_config"]], "model_config (nnsight.schema.format.types.slicemodel attribute)": [[7, "nnsight.schema.format.types.SliceModel.model_config"]], "model_config (nnsight.schema.format.types.tensormodel attribute)": [[7, "nnsight.schema.format.types.TensorModel.model_config"]], "model_config (nnsight.schema.format.types.tracermodel attribute)": [[7, "nnsight.schema.format.types.TracerModel.model_config"]], "model_config (nnsight.schema.format.types.tuplemodel attribute)": [[7, "nnsight.schema.format.types.TupleModel.model_config"]], "model_fields (nnsight.schema.config.apiconfigmodel attribute)": [[7, "nnsight.schema.Config.ApiConfigModel.model_fields"]], "model_fields (nnsight.schema.config.appconfigmodel attribute)": [[7, "nnsight.schema.Config.AppConfigModel.model_fields"]], "model_fields (nnsight.schema.config.configmodel attribute)": [[7, "nnsight.schema.Config.ConfigModel.model_fields"]], "model_fields (nnsight.schema.response.responsemodel attribute)": [[7, "nnsight.schema.Response.ResponseModel.model_fields"]], "model_fields (nnsight.schema.response.resultmodel attribute)": [[7, "nnsight.schema.Response.ResultModel.model_fields"]], "model_fields (nnsight.schema.format.types.basennsightmodel attribute)": [[7, "nnsight.schema.format.types.BaseNNsightModel.model_fields"]], "model_fields (nnsight.schema.format.types.dictmodel attribute)": [[7, "nnsight.schema.format.types.DictModel.model_fields"]], "model_fields (nnsight.schema.format.types.ellipsismodel attribute)": [[7, "nnsight.schema.format.types.EllipsisModel.model_fields"]], "model_fields (nnsight.schema.format.types.functionmodel attribute)": [[7, "nnsight.schema.format.types.FunctionModel.model_fields"]], "model_fields (nnsight.schema.format.types.graphmodel attribute)": [[7, "nnsight.schema.format.types.GraphModel.model_fields"]], "model_fields (nnsight.schema.format.types.iteratormodel attribute)": [[7, "nnsight.schema.format.types.IteratorModel.model_fields"]], "model_fields (nnsight.schema.format.types.listmodel attribute)": [[7, "nnsight.schema.format.types.ListModel.model_fields"]], "model_fields (nnsight.schema.format.types.nodemodel attribute)": [[7, "nnsight.schema.format.types.NodeModel.model_fields"]], "model_fields (nnsight.schema.format.types.nodemodel.reference attribute)": [[7, "nnsight.schema.format.types.NodeModel.Reference.model_fields"]], "model_fields (nnsight.schema.format.types.primitivemodel attribute)": [[7, "nnsight.schema.format.types.PrimitiveModel.model_fields"]], "model_fields (nnsight.schema.format.types.sessionmodel attribute)": [[7, "nnsight.schema.format.types.SessionModel.model_fields"]], "model_fields (nnsight.schema.format.types.slicemodel attribute)": [[7, "nnsight.schema.format.types.SliceModel.model_fields"]], "model_fields (nnsight.schema.format.types.tensormodel attribute)": [[7, "nnsight.schema.format.types.TensorModel.model_fields"]], "model_fields (nnsight.schema.format.types.tracermodel attribute)": [[7, "nnsight.schema.format.types.TracerModel.model_fields"]], "model_fields (nnsight.schema.format.types.tuplemodel attribute)": [[7, "nnsight.schema.format.types.TupleModel.model_fields"]], "nnsight.schema": [[7, "module-nnsight.schema"]], "nnsight.schema.config": [[7, "module-nnsight.schema.Config"]], "nnsight.schema.response": [[7, "module-nnsight.schema.Response"]], "nnsight.schema.format.functions": [[7, "module-nnsight.schema.format.functions"]], "nnsight.schema.format.types": [[7, "module-nnsight.schema.format.types"]], "applymoduleprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol"]], "bridge (class in nnsight.tracing.bridge)": [[8, "nnsight.tracing.Bridge.Bridge"]], "bridgeprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.BridgeProtocol"]], "bridgeprotocol.bridgeexception": [[8, "nnsight.tracing.protocols.BridgeProtocol.BridgeException"]], "conditionalprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.ConditionalProtocol"]], "earlystopprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.EarlyStopProtocol"]], "earlystopprotocol.earlystopexception": [[8, "nnsight.tracing.protocols.EarlyStopProtocol.EarlyStopException"]], "gradprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.GradProtocol"]], "graph (class in nnsight.tracing.graph)": [[8, "nnsight.tracing.Graph.Graph"]], "localbackendexecuteprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.LocalBackendExecuteProtocol"]], "lockprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.LockProtocol"]], "node (class in nnsight.tracing.node)": [[8, "nnsight.tracing.Node.Node"]], "protocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.Protocol"]], "proxy (class in nnsight.tracing.proxy)": [[8, "nnsight.tracing.Proxy.Proxy"]], "swapprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.SwapProtocol"]], "updateprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.UpdateProtocol"]], "valueprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.ValueProtocol"]], "add() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.add"]], "add() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.add"]], "add() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.add"]], "add() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.add"]], "add() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.add"]], "add() (nnsight.tracing.protocols.earlystopprotocol class method)": [[8, "nnsight.tracing.protocols.EarlyStopProtocol.add"]], "add() (nnsight.tracing.protocols.gradprotocol class method)": [[8, "nnsight.tracing.protocols.GradProtocol.add"]], "add() (nnsight.tracing.protocols.localbackendexecuteprotocol class method)": [[8, "nnsight.tracing.protocols.LocalBackendExecuteProtocol.add"]], "add() (nnsight.tracing.protocols.lockprotocol class method)": [[8, "nnsight.tracing.protocols.LockProtocol.add"]], "add() (nnsight.tracing.protocols.protocol class method)": [[8, "nnsight.tracing.protocols.Protocol.add"]], "add() (nnsight.tracing.protocols.swapprotocol class method)": [[8, "nnsight.tracing.protocols.SwapProtocol.add"]], "add() (nnsight.tracing.protocols.updateprotocol class method)": [[8, "nnsight.tracing.protocols.UpdateProtocol.add"]], "add() (nnsight.tracing.protocols.valueprotocol class method)": [[8, "nnsight.tracing.protocols.ValueProtocol.add"]], "add_bridge_proxy() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.add_bridge_proxy"]], "add_conditioned_node() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.add_conditioned_node"]], "alive (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.alive"]], "arg_dependencies (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.arg_dependencies"]], "args (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.args"]], "attached() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.attached"]], "attachments (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.attachments"]], "bridged_nodes (nnsight.tracing.bridge.bridge attribute)": [[8, "nnsight.tracing.Bridge.Bridge.bridged_nodes"]], "clean() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.clean"]], "cond_dependency (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.cond_dependency"]], "copy() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.copy"]], "create() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.create"]], "create() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.create"]], "destroy() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.destroy"]], "done() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.done"]], "execute() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.execute"]], "execute() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.execute"]], "execute() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.execute"]], "execute() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.execute"]], "execute() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.execute"]], "execute() (nnsight.tracing.protocols.earlystopprotocol class method)": [[8, "nnsight.tracing.protocols.EarlyStopProtocol.execute"]], "execute() (nnsight.tracing.protocols.gradprotocol class method)": [[8, "nnsight.tracing.protocols.GradProtocol.execute"]], "execute() (nnsight.tracing.protocols.localbackendexecuteprotocol class method)": [[8, "nnsight.tracing.protocols.LocalBackendExecuteProtocol.execute"]], "execute() (nnsight.tracing.protocols.protocol class method)": [[8, "nnsight.tracing.protocols.Protocol.execute"]], "execute() (nnsight.tracing.protocols.swapprotocol class method)": [[8, "nnsight.tracing.protocols.SwapProtocol.execute"]], "execute() (nnsight.tracing.protocols.updateprotocol class method)": [[8, "nnsight.tracing.protocols.UpdateProtocol.execute"]], "execute() (nnsight.tracing.protocols.valueprotocol class method)": [[8, "nnsight.tracing.protocols.ValueProtocol.execute"]], "executed() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.executed"]], "fulfilled() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.fulfilled"]], "get_bridge() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.get_bridge"]], "get_bridge_proxy() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.get_bridge_proxy"]], "get_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.get_conditional"]], "get_graph() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.get_graph"]], "get_module() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.get_module"]], "get_swap() (nnsight.tracing.protocols.swapprotocol class method)": [[8, "nnsight.tracing.protocols.SwapProtocol.get_swap"]], "graph (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.graph"]], "graph_stack (nnsight.tracing.bridge.bridge attribute)": [[8, "nnsight.tracing.Bridge.Bridge.graph_stack"]], "has_bridge() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.has_bridge"]], "has_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.has_conditional"]], "id_to_graph (nnsight.tracing.bridge.bridge attribute)": [[8, "nnsight.tracing.Bridge.Bridge.id_to_graph"]], "increment() (nnsight.tracing.protocols.gradprotocol class method)": [[8, "nnsight.tracing.protocols.GradProtocol.increment"]], "is_node_conditioned() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.is_node_conditioned"]], "kwargs (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.kwargs"]], "listeners (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.listeners"]], "locks (nnsight.tracing.bridge.bridge attribute)": [[8, "nnsight.tracing.Bridge.Bridge.locks"]], "name (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.name"]], "name_idx (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.name_idx"]], "nnsight.tracing": [[8, "module-nnsight.tracing"]], "nnsight.tracing.bridge": [[8, "module-nnsight.tracing.Bridge"]], "nnsight.tracing.graph": [[8, "module-nnsight.tracing.Graph"]], "nnsight.tracing.node": [[8, "module-nnsight.tracing.Node"]], "nnsight.tracing.proxy": [[8, "module-nnsight.tracing.Proxy"]], "nnsight.tracing.protocols": [[8, "module-nnsight.tracing.protocols"]], "node (nnsight.tracing.proxy.proxy attribute)": [[8, "nnsight.tracing.Proxy.Proxy.node"]], "nodes (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.nodes"]], "peek_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.peek_conditional"]], "peek_graph() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.peek_graph"]], "peek_graph() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.peek_graph"]], "pop_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.pop_conditional"]], "pop_graph() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.pop_graph"]], "prepare_inputs() (nnsight.tracing.node.node class method)": [[8, "nnsight.tracing.Node.Node.prepare_inputs"]], "preprocess() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.preprocess"]], "proxy (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.proxy"]], "proxy_value (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.proxy_value"]], "proxy_wrapper() (in module nnsight.tracing.proxy)": [[8, "nnsight.tracing.Proxy.proxy_wrapper"]], "push_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.push_conditional"]], "redundant() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.redundant"]], "reset() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.reset"]], "reset() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.reset"]], "sequential (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.sequential"]], "set_bridge() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.set_bridge"]], "set_module() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.set_module"]], "set_value() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.set_value"]], "style() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.style"]], "style() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.style"]], "style() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.style"]], "style() (nnsight.tracing.protocols.earlystopprotocol class method)": [[8, "nnsight.tracing.protocols.EarlyStopProtocol.style"]], "style() (nnsight.tracing.protocols.gradprotocol class method)": [[8, "nnsight.tracing.protocols.GradProtocol.style"]], "style() (nnsight.tracing.protocols.localbackendexecuteprotocol class method)": [[8, "nnsight.tracing.protocols.LocalBackendExecuteProtocol.style"]], "style() (nnsight.tracing.protocols.lockprotocol class method)": [[8, "nnsight.tracing.protocols.LockProtocol.style"]], "style() (nnsight.tracing.protocols.protocol class method)": [[8, "nnsight.tracing.protocols.Protocol.style"]], "style() (nnsight.tracing.protocols.swapprotocol class method)": [[8, "nnsight.tracing.protocols.SwapProtocol.style"]], "style() (nnsight.tracing.protocols.updateprotocol class method)": [[8, "nnsight.tracing.protocols.UpdateProtocol.style"]], "style() (nnsight.tracing.protocols.valueprotocol class method)": [[8, "nnsight.tracing.protocols.ValueProtocol.style"]], "target (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.target"]], "validate (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.validate"]], "value (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.value"]], "value (nnsight.tracing.node.node property)": [[8, "id0"]], "value (nnsight.tracing.proxy.proxy property)": [[8, "nnsight.tracing.Proxy.Proxy.value"]], "vis() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.vis"]], "visualize() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.visualize"]], "wrappermodule (class in nnsight.util)": [[9, "nnsight.util.WrapperModule"]], "apply() (in module nnsight.util)": [[9, "nnsight.util.apply"]], "fetch_attr() (in module nnsight.util)": [[9, "nnsight.util.fetch_attr"]], "forward() (nnsight.util.wrappermodule method)": [[9, "nnsight.util.WrapperModule.forward"]], "nnsight.util": [[9, "module-nnsight.util"]], "wrap() (in module nnsight.util)": [[9, "nnsight.util.wrap"]]}}) \ No newline at end of file +Search.setIndex({"docnames": ["about", "documentation", "documentation/contexts", "documentation/envoy", "documentation/intervention", "documentation/models", "documentation/patching", "documentation/schema", "documentation/tracing", "documentation/util", "features", "index", "notebooks/features/conditionals", "notebooks/features/cross_prompt", "notebooks/features/custom_functions", "notebooks/features/early_stopping", "notebooks/features/getting", "notebooks/features/gradients", "notebooks/features/iterator", "notebooks/features/lora_training", "notebooks/features/model_editing", "notebooks/features/modules", "notebooks/features/multiple_token", "notebooks/features/operations", "notebooks/features/remote_execution", "notebooks/features/scan_validate", "notebooks/features/sessions", "notebooks/features/setting", "notebooks/tutorials/activation_patching", "notebooks/tutorials/attribution_patching", "notebooks/tutorials/boundless_DAS", "notebooks/tutorials/dict_learning", "notebooks/tutorials/logit_lens", "notebooks/tutorials/walkthrough", "start", "status", "tutorials"], "filenames": ["about.rst", "documentation.rst", "documentation/contexts.rst", "documentation/envoy.rst", "documentation/intervention.rst", "documentation/models.rst", "documentation/patching.rst", "documentation/schema.rst", "documentation/tracing.rst", "documentation/util.rst", "features.rst", "index.rst", "notebooks/features/conditionals.ipynb", "notebooks/features/cross_prompt.ipynb", "notebooks/features/custom_functions.ipynb", "notebooks/features/early_stopping.ipynb", "notebooks/features/getting.ipynb", "notebooks/features/gradients.ipynb", "notebooks/features/iterator.ipynb", "notebooks/features/lora_training.ipynb", "notebooks/features/model_editing.ipynb", "notebooks/features/modules.ipynb", "notebooks/features/multiple_token.ipynb", "notebooks/features/operations.ipynb", "notebooks/features/remote_execution.ipynb", "notebooks/features/scan_validate.ipynb", "notebooks/features/sessions.ipynb", "notebooks/features/setting.ipynb", "notebooks/tutorials/activation_patching.ipynb", "notebooks/tutorials/attribution_patching.ipynb", "notebooks/tutorials/boundless_DAS.ipynb", "notebooks/tutorials/dict_learning.ipynb", "notebooks/tutorials/logit_lens.ipynb", "notebooks/tutorials/walkthrough.ipynb", "start.rst", "status.rst", "tutorials.rst"], "titles": ["About NNsight", "Documentation", "nnsight.contexts", "nnsight.envoy", "nnsight.intervention", "nnsight.models", "nnsight.patching", "nnsight.schema", "nnsight.tracing", "nnsight.util", "Features", "nnsight", "Conditional Interventions", "Cross-Prompt Intervention", "Custom Functions", "Early Stopping", "Getting Values", "Gradients", "Iterative Interventions", "LoRA", "Model Editing", "Modules", "Multiple Token Generation", "Operations", "Remote Execution", "Scan and Validate", "Sessions", "Setting Values", "Activation Patching", "Attribution Patching", "Boundless DAS", "Dictionary Learning", "Logit Lens", "Walkthrough", "Getting Started", "Status", "Tutorials"], "terms": {"can": [0, 2, 3, 5, 8, 12, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35], "you": [0, 2, 5, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36], "studi": 0, "intern": [0, 11, 33, 34], "deep": [0, 33, 34], "network": [0, 11, 28, 30, 33], "too": 0, "larg": [0, 29, 33], "run": [0, 2, 4, 5, 8, 9, 15, 18, 19, 24, 25, 26, 28, 29, 33, 35], "In": [0, 2, 5, 12, 13, 15, 17, 20, 23, 24, 25, 26, 27, 29, 30, 33], "thi": [0, 2, 3, 4, 5, 7, 8, 9, 12, 13, 14, 15, 17, 18, 19, 20, 23, 24, 25, 26, 27, 29, 30, 32, 33], "era": [0, 33], "scale": [0, 18, 33], "learn": [0, 30, 33, 34, 36], "most": [0, 2, 3, 5, 15, 23, 25, 29, 33], "interest": [0, 15, 26, 28, 29, 31, 33], "model": [0, 1, 2, 3, 4, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 34, 35, 36], "ar": [0, 2, 3, 5, 8, 9, 14, 15, 16, 17, 19, 20, 23, 25, 26, 30, 32, 33, 35], "massiv": [0, 33], "hard": [0, 33], "ordinari": [0, 33], "commerci": [0, 33], "infer": [0, 19, 33], "servic": [0, 2, 33], "let": [0, 5, 8, 19, 20, 24, 25, 26, 28, 29, 36], "interact": [0, 2, 4, 5, 8, 17, 33], "huge": [0, 36], "thei": [0, 2, 3, 8, 15, 19, 25, 33], "see": [0, 2, 5, 8, 12, 13, 14, 17, 18, 19, 20, 23, 25, 26, 27, 29, 31, 33, 34], "The": [0, 2, 4, 5, 6, 8, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 32, 33, 35], "librari": [0, 8, 14, 25, 33, 35], "differ": [0, 2, 8, 26, 28, 29, 32, 33], "give": [0, 5, 9, 33, 34], "full": [0, 33, 34], "access": [0, 2, 3, 4, 5, 8, 10, 11, 15, 16, 17, 24, 26, 32, 33], "all": [0, 2, 3, 4, 5, 8, 9, 14, 17, 18, 19, 20, 24, 25, 26, 28, 29, 30, 32, 33, 35], "neural": [0, 11, 30, 33], "when": [0, 2, 3, 4, 5, 8, 13, 19, 20, 22, 24, 25, 29, 33], "togeth": [0, 2, 26, 33], "remot": [0, 2, 5, 10, 19, 26, 30, 35], "like": [0, 4, 5, 12, 17, 19, 21, 25, 29, 33], "nation": [0, 33], "fabric": [0, 33], "ndif": [0, 7, 13, 15, 24, 25, 26, 33, 34, 35], "experi": [0, 26, 28, 33, 35], "open": [0, 2, 5, 13, 19, 22, 24, 33, 34], "easili": [0, 5, 11, 33], "also": [0, 2, 5, 6, 12, 13, 14, 17, 18, 19, 21, 25, 26, 30, 33], "terrif": 0, "smaller": 0, "local": [0, 2, 5, 24, 26, 29, 32, 33, 35], "overview": 0, "pipelin": 0, "research": [0, 33], "write": [0, 30], "simpl": [0, 5, 8, 9, 14, 18, 19, 20, 24, 33], "python": [0, 8, 18, 33], "code": [0, 25, 30, 32, 33], "along": [0, 3, 4, 24, 33], "unlik": [0, 8, 20, 32, 33], "read": [0, 30, 32, 33, 34], "ani": [0, 2, 4, 5, 6, 7, 8, 9, 11, 14, 15, 21, 25, 33], "state": [0, 2, 5, 11, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 33], "being": [0, 4, 22, 26, 33], "creat": [0, 2, 3, 4, 5, 8, 18, 19, 20, 25, 27, 30, 32, 33], "comput": [0, 2, 4, 5, 8, 9, 10, 15, 21, 23, 25, 27, 29, 32, 33], "graph": [0, 2, 3, 4, 5, 7, 8, 10, 14, 18, 19, 23, 25, 33], "sent": [0, 19, 33], "interleav": [0, 4, 5, 33], "execut": [0, 2, 4, 5, 8, 10, 12, 14, 15, 17, 18, 19, 25, 26], "built": [0, 3, 8, 18, 33], "pytorch": [0, 5, 11, 14, 25, 33], "veri": [0, 19, 25, 33], "similar": [0, 30], "your": [0, 5, 20, 24, 25, 26, 32, 33], "own": [0, 19, 25, 26, 33], "workstat": 0, "fact": [0, 33], "same": [0, 2, 8, 9, 13, 24, 25, 26, 29, 32, 33], "small": [0, 29, 36], "just": [0, 5, 8, 12, 17, 19, 24, 25, 26, 28, 29, 33], "chang": [0, 19, 20, 23, 25, 27, 29, 33], "few": [0, 5, 33], "argument": [0, 2, 3, 5, 8, 9, 14, 33], "between": [0, 2, 8, 13, 20, 26, 28, 29, 30, 33], "normal": [0, 8, 17, 19, 25, 28, 32, 33], "treat": 0, "opaqu": 0, "instead": [0, 5, 9, 15, 29, 33], "set": [0, 2, 3, 4, 5, 8, 10, 12, 13, 14, 15, 17, 18, 19, 20, 22, 24, 25, 26, 29, 30, 32], "up": [0, 5, 8, 24, 28, 29, 31, 33], "context": [0, 1, 3, 4, 5, 6, 8, 12, 14, 15, 16, 17, 18, 19, 20, 24, 25, 26, 28, 30], "enabl": [0, 2, 4, 5, 8, 11, 20, 25, 26, 30, 33], "get": [0, 2, 3, 4, 5, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 36], "direct": [0, 5, 8, 33], "while": [0, 2, 9, 22, 29, 32, 33], "here": [0, 2, 5, 13, 18, 19, 21, 22, 25, 28, 29, 30, 32, 33], "look": [0, 5, 21, 26, 28, 33], "from": [0, 2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "import": [0, 5, 8, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "languagemodel": [0, 2, 5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32], "meta": [0, 2, 3, 5, 24, 25, 26, 33], "llama": [0, 24, 26, 33], "2": [0, 2, 5, 8, 12, 13, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 36], "70b": [0, 24, 26, 33], "hf": 0, "trace": [0, 1, 2, 4, 5, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 32], "eiffel": [0, 4, 5, 11, 12, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 32, 33], "tower": [0, 4, 5, 11, 12, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 32, 33], "citi": [0, 4, 5, 11, 12, 13, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 32, 33], "true": [0, 2, 5, 7, 8, 12, 13, 14, 17, 18, 19, 20, 24, 25, 26, 29, 30, 31, 32, 33], "hidden_st": [0, 4, 16, 17, 21, 23, 24, 33], "layer": [0, 15, 17, 19, 21, 22, 24, 26, 28, 29, 30, 31, 33], "10": [0, 5, 12, 13, 19, 22, 24, 25, 30, 32, 33], "input": [0, 2, 3, 4, 5, 8, 9, 11, 16, 17, 19, 25, 28, 29, 30, 32, 33], "0": [0, 3, 5, 8, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "save": [0, 2, 4, 5, 8, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "one": [0, 2, 3, 4, 5, 8, 9, 10, 12, 15, 19, 22, 24, 25, 26, 28, 29, 30, 33], "hidden": [0, 5, 11, 16, 17, 19, 20, 21, 22, 23, 25, 26, 27, 28, 33], "11": [0, 5, 17, 20, 22, 24, 25, 26, 27, 30, 32, 33], "mlp": [0, 3, 5, 11, 19, 29, 31, 32, 33], "output": [0, 2, 3, 4, 5, 8, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "modul": [0, 2, 3, 4, 5, 6, 8, 9, 10, 11, 15, 16, 19, 22, 25, 33], "print": [0, 2, 4, 5, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33], "predict": [0, 19, 20, 26, 28, 32, 33], "wa": [0, 5, 8, 12, 14, 15, 18, 19, 20, 22, 24, 25, 26, 29, 33], "easi": [0, 2, 33], "huggingfac": [0, 5, 12, 14, 18, 19, 20, 24, 25, 26, 29, 32, 33], "load": [0, 5, 24, 28, 30, 31, 32, 33], "object": [0, 2, 3, 4, 5, 6, 8, 9, 11, 14, 16, 18, 19, 26, 28, 29, 32, 33], "line": [0, 15, 25, 33], "notic": [0, 33], "we": [0, 3, 4, 5, 8, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33], "70": [0, 21], "billion": 0, "paramet": [0, 2, 3, 4, 5, 6, 8, 9, 19, 24, 30, 33], "which": [0, 2, 3, 5, 8, 9, 18, 19, 20, 21, 29, 30, 33, 35], "ordinarili": 0, "pretti": [0, 33], "difficult": 0, "regular": 0, "sinc": [0, 9, 15, 26, 29, 33], "would": [0, 5, 8, 14, 15, 17, 19, 31, 33], "take": [0, 2, 5, 9, 20, 26, 29, 33], "140": 0, "280": 0, "gigabyt": 0, "gpu": [0, 5, 33], "ram": 0, "store": [0, 2, 4, 8, 15, 26, 28, 33], "trick": [0, 33], "u": [0, 5, 17, 18, 21, 24, 25, 27, 31, 32, 33], "work": [0, 2, 13, 15, 17, 23, 24, 25, 32, 33], "3": [0, 5, 13, 15, 16, 17, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36], "flag": [0, 18, 25, 33], "indic": [0, 4, 5, 31, 33], "want": [0, 2, 8, 12, 13, 17, 18, 25, 27, 29, 33], "actual": [0, 2, 8, 19, 21, 24, 28, 33], "By": [0, 8, 23, 32, 33], "default": [0, 2, 3, 4, 5, 7, 8, 12, 14, 17, 18, 19, 20, 24, 25, 33], "If": [0, 2, 3, 4, 5, 8, 9, 10, 12, 13, 15, 17, 20, 25, 29, 33], "quickli": 0, "could": [0, 5, 13, 15, 19, 29, 32, 33], "leav": [0, 25, 30, 33], "fals": [0, 2, 3, 5, 7, 8, 9, 12, 14, 18, 19, 20, 24, 25, 26, 29, 30, 31, 32, 33], "Then": [0, 19, 25, 29, 33], "invok": [0, 2, 5, 11, 13, 25, 28, 29, 30, 31, 32, 33], "call": [0, 2, 3, 4, 5, 6, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33], "function": [0, 2, 3, 4, 5, 6, 7, 8, 9, 10, 18, 19, 29, 32, 34], "manag": [0, 2, 4, 5, 6, 35], "reason": [0, 23], "doe": [0, 2, 8, 14, 32, 33], "provid": [0, 2, 4, 5, 17, 25, 30, 32, 33, 34], "4": [0, 16, 19, 23, 24, 25, 27, 28, 30, 31, 32, 33], "6": [0, 16, 19, 23, 24, 25, 27, 30, 32, 33], "On": [0, 2, 33], "grab": [0, 8, 13, 28, 33], "5": [0, 5, 12, 15, 16, 17, 19, 23, 24, 25, 26, 27, 30, 31, 32, 33], "insid": [0, 12, 18, 33], "transform": [0, 3, 5, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 32, 33], "block": [0, 5, 13, 33], "through": [0, 2, 4, 5, 9, 25, 28, 32, 33, 34], "calcul": [0, 28], "complet": [0, 4, 8, 24, 26, 29, 30, 33], "defin": [0, 2, 7, 8, 9, 14, 15, 18, 19, 20, 26, 28, 30, 33], "server": [0, 10, 19, 26, 33, 35], "": [0, 2, 3, 4, 5, 8, 9, 15, 16, 17, 19, 20, 21, 24, 25, 26, 28, 29, 30, 31, 32, 36], "done": [0, 5, 8, 15, 29, 33], "result": [0, 2, 4, 8, 15, 18, 22, 24, 26, 27, 32, 33], "shown": [0, 13], "7": [0, 16, 19, 22, 23, 24, 25, 27, 28, 30, 33], "8": [0, 12, 16, 19, 22, 23, 24, 25, 27, 28, 30, 31, 32, 33], "help": [0, 20, 25, 33], "understand": [0, 32, 33], "oper": [0, 2, 5, 8, 10, 13, 14, 17, 18, 19, 25, 27, 29, 35], "immedi": [0, 5, 33], "add": [0, 2, 3, 4, 6, 8, 10, 14, 23, 25, 27, 28, 33], "intervent": [0, 1, 2, 3, 5, 8, 10, 11, 14, 15, 19, 20, 22, 25, 26, 28, 30, 36], "alongsid": [0, 33], "upon": [0, 2, 4, 33], "exit": [0, 2, 4, 16, 18, 26, 33], "exampl": [0, 2, 4, 5, 8, 12, 15, 17, 23, 25, 26, 27, 30, 33], "seen": 0, "below": [0, 15, 29, 30, 33], "node": [0, 2, 4, 5, 7, 8, 15, 25, 30, 33], "depend": [0, 2, 4, 5, 8, 12, 25, 33], "well": [0, 2, 5, 8, 14, 25, 33], "other": [0, 8, 14, 26, 33], "chosen": 0, "request": [0, 3, 4, 10, 25, 26, 30, 33], "inject": [0, 4, 8, 33], "basic": [0, 5, 23, 33, 34, 36], "lot": [0, 33], "insight": [0, 32, 33], "go": [0, 19, 24, 33], "For": [0, 2, 5, 9, 12, 14, 18, 19, 20, 22, 25, 29, 33], "logit": [0, 4, 5, 17, 19, 24, 28, 29, 30, 33, 36], "len": [0, 25, 28, 29, 30, 36], "text": [0, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "And": [0, 26, 33], "causal": [0, 30, 36], "path": [0, 3, 4, 5, 8, 9], "patch": [0, 1, 36], "circuit": [0, 29], "discoveri": [0, 29], "method": [0, 2, 4, 5, 8, 9, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32], "locat": [0, 13, 20, 33], "compon": [0, 29, 33], "within": [0, 2, 3, 8, 9, 12, 13, 14, 15, 17, 18, 20, 26, 28, 32, 33], "plai": 0, "decis": 0, "role": 0, "make": [0, 2, 4, 5, 10, 19, 20, 25, 28, 29, 33], "gradient": [0, 5, 8, 10, 29], "optim": [0, 19, 26, 30, 33], "out": [0, 2, 5, 6, 8, 14, 17, 18, 19, 21, 22, 25, 29, 33, 34], "order": [0, 2, 3, 4, 5, 8, 15, 21, 26, 33], "applic": [0, 14, 33], "cross": [0, 10, 19, 33], "prompt": [0, 2, 5, 10, 19, 22, 28, 29, 30, 31, 32, 33], "mani": [0, 2, 4, 8, 10, 18], "more": [0, 3, 5, 8, 12, 14, 18, 19, 20, 22, 25, 29, 30, 32, 33], "featur": [0, 20, 25, 31, 33, 34], "start": [0, 7, 11, 24, 26, 30, 36], "page": [0, 33], "inform": [0, 2, 4, 8, 25, 27, 29, 33], "project": [0, 15, 25, 29, 33, 34], "current": [0, 2, 3, 4, 8, 24, 25, 26, 33], "alpha": [0, 19, 33], "pre": [0, 2, 8, 13, 33], "releas": [0, 8, 30], "earli": [0, 8, 10, 18, 26], "user": [0, 3, 4, 5, 8, 13, 19, 25, 26, 33], "contributor": 0, "contribut": [0, 29, 33], "feedback": [0, 33], "join": [0, 33], "discord": [0, 33], "updat": [0, 2, 4, 8, 9, 12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 30, 31, 32, 33], "bug": 0, "report": 0, "opportun": 0, "effort": 0, "nnsight": [1, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34], "envoi": [1, 2, 5, 8, 19, 33], "schema": 1, "util": [1, 19, 25, 28, 30, 32, 33], "contain": [2, 4, 5, 8, 19, 30, 33], "logic": [2, 4, 8, 33], "primari": [2, 4, 5], "two": [2, 8, 12, 13, 17, 28, 29, 30, 33], "class": [2, 3, 4, 5, 6, 7, 8, 9, 11, 19, 33], "involv": [2, 4, 8, 36], "tracer": [2, 3, 5, 7, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 32, 33], "around": [2, 5, 33], "underli": [2, 3, 5, 8, 15, 33], "an": [2, 3, 4, 5, 6, 7, 8, 9, 15, 17, 18, 19, 20, 24, 25, 26, 29, 30, 31, 33, 35], "track": [2, 4, 5, 8], "perform": [2, 5, 9, 17], "said": [2, 8, 36], "expos": [2, 11, 16, 18, 33], "attribut": [2, 3, 4, 5, 6, 8, 9, 16, 17, 32, 33, 36], "To": [2, 24, 26, 30, 32, 33, 34, 35], "do": [2, 3, 5, 10, 14, 15, 17, 19, 21, 24, 25, 28, 29, 33], "need": [2, 4, 5, 9, 10, 14, 19, 20, 24, 25, 28, 29, 30, 33], "know": [2, 19, 33], "about": [2, 4, 7, 11, 30, 31, 32, 33], "so": [2, 3, 4, 5, 8, 16, 19, 24, 25, 29, 33], "each": [2, 5, 8, 18, 22, 26, 29, 30, 32, 33], "i": [2, 3, 4, 5, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 36], "keep": [2, 4, 25, 33], "batch_siz": [2, 4, 19, 30, 33], "recent": [2, 3, 15, 25, 33], "gener": [2, 3, 4, 5, 8, 10, 13, 19, 32, 33, 35], "index": [2, 4, 5, 8, 19, 25, 28, 32, 33], "multi": [2, 33], "iter": [2, 3, 4, 7, 10, 19, 28, 33], "made": [2, 12, 20, 33], "dure": [2, 8, 15, 17, 21, 27, 33], "its": [2, 5, 8, 14, 16, 20, 24, 25, 26, 29, 33], "batched_input": 2, "ad": [2, 4, 5, 8, 18, 19, 23, 33], "should": [2, 3, 4, 5, 7, 8, 9, 19, 22, 25, 33], "format": [2, 7, 30, 33], "where": [2, 5, 8, 15, 17, 25, 28, 29, 30, 33], "batch": [2, 4, 5, 19, 28, 29, 30], "allow": [2, 4, 5, 8, 18, 20, 21, 25, 33, 35], "thing": [2, 10, 17, 21, 33], "consist": 2, "valid": [2, 5, 8, 10, 24, 30, 33], "both": [2, 4, 5, 19, 33], "becom": 2, "case": [2, 5, 8, 13, 19, 29, 33], "regardless": 2, "whether": [2, 8, 30], "string": [2, 3, 5, 9, 32, 33], "process": [2, 5, 8, 17, 24, 26, 32, 33], "dictionari": [2, 4, 7, 8, 33, 36], "id": [2, 5, 7, 8, 19, 32, 33], "onli": [2, 3, 4, 5, 8, 9, 12, 15, 19, 22, 24, 25, 27, 30, 33], "us": [2, 4, 5, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35], "carri": [2, 6, 8], "what": [2, 5, 19, 25, 27, 28, 32, 33], "accept": 2, "parent": [2, 5, 6, 8], "appropri": [2, 5, 8, 30, 33], "respect": [2, 3, 29, 33], "enter": [2, 5, 13, 28, 33], "some": [2, 5, 8, 9, 19, 25, 31, 33], "leverag": [2, 5, 33], "prepar": [2, 5, 8, 33], "version": [2, 5, 8, 13, 20, 26, 29, 32, 33], "size": [2, 4, 12, 22, 25, 33], "It": [2, 12, 14, 18, 19, 20, 24, 25, 26, 31, 33], "meta_model": [2, 5], "dtype": [2, 4, 7, 24, 33], "base": [2, 4, 5, 8, 18, 20, 30, 33], "characterist": 2, "come": [2, 13, 33], "extens": 2, "remotetrac": 2, "check_for_depend": 2, "data": [2, 4, 7, 9, 19, 25, 26, 30, 33], "tupl": [2, 3, 4, 5, 7, 28, 30, 33], "bool": [2, 3, 5, 7, 8, 9, 33], "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 24, 30, 33, 34], "check": [2, 3, 4, 8, 12, 14, 18, 19, 20, 25, 29, 33, 34], "proxi": [2, 3, 4, 5, 8, 14, 15, 17, 23, 25, 28, 33], "convert": [2, 8], "them": [2, 4, 5, 8, 9, 13, 14, 23, 25, 28, 30, 33], "bridg": [2, 8], "lock": [2, 8], "later": [2, 26, 33], "valu": [2, 4, 5, 7, 8, 10, 13, 15, 17, 19, 23, 25, 26, 28, 29, 30, 31, 32, 33], "return": [2, 3, 4, 5, 8, 9, 14, 15, 19, 22, 25, 29, 30, 33], "replac": [2, 6, 7, 8, 13, 19, 25, 26, 33], "were": [2, 5, 8, 15, 28, 33], "type": [2, 3, 4, 5, 6, 7, 8, 9, 15, 25, 32, 33], "resolve_depend": [2, 33], "turn": [2, 25, 33], "find": [2, 28, 29, 30, 31, 32, 33], "resolv": 2, "backend": [2, 5, 25, 33], "none": [2, 3, 4, 5, 6, 7, 8, 19, 25, 30, 33], "return_context": [2, 5, 18, 19, 33], "kwarg": [2, 3, 4, 5, 7, 8, 9, 25, 33], "_model": [2, 5, 33], "nnsightmodel": [2, 5, 33], "th": 2, "_graph": 2, "_arg": [2, 5], "posit": [2, 3, 5, 8, 12, 19, 28, 29, 30, 32, 33], "pass": [2, 3, 4, 5, 8, 9, 10, 15, 17, 18, 20, 28, 29, 33], "list": [2, 3, 4, 5, 6, 7, 8, 9, 18, 30, 32, 33], "_kwarg": [2, 5, 33], "keyword": [2, 5, 8, 33], "dict": [2, 4, 5, 7, 8, 9, 33], "str": [2, 3, 4, 5, 6, 7, 8, 9, 15, 25, 33], "_invoker_input": 2, "invoc": [2, 13, 28], "_invok": 2, "edit_backend_execut": 2, "handl": [2, 4, 5, 6, 8, 26, 33], "editmixin": 2, "edit": [2, 4, 5, 10, 11, 27], "dor": 2, "given": [2, 4, 8, 9, 11, 25, 28, 29, 32, 33], "rais": [2, 5, 8, 15, 25, 30, 33], "except": [2, 7, 8, 33], "alreadi": [2, 3, 4, 5, 8, 24, 26, 33], "local_backend_execut": [2, 33], "remotemixin": 2, "next": [2, 8, 20, 22, 32], "increment": [2, 4, 8, 33], "int": [2, 3, 4, 5, 7, 8, 12, 19, 30, 33], "1": [2, 5, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36], "call_it": [2, 4], "how": [2, 4, 8, 19, 20, 22, 23, 25, 29, 30, 31, 32, 33], "onc": [2, 3, 16, 24, 25, 33], "remote_backend_get_model_kei": 2, "model_kei": 2, "specifi": [2, 8, 12, 14, 24, 32, 33], "kei": [2, 4, 5, 6, 24, 25, 29, 33, 35], "remote_backend_handle_result_valu": 2, "postprocess": 2, "remote_backend_postprocess_result": 2, "local_result": 2, "move": [2, 8, 26, 29, 33], "tensor": [2, 3, 4, 5, 7, 8, 10, 12, 13, 14, 16, 17, 19, 21, 22, 23, 24, 25, 27, 29, 30, 33], "cpu": [2, 29, 30, 31, 33], "detach": [2, 29, 30, 32], "etc": [2, 8, 26, 33], "post": [2, 29, 32, 33], "scan": [2, 5, 10, 19, 30, 33], "meant": 2, "tandem": 2, "initi": [2, 3, 5, 22, 33], "_prepare_input": [2, 5], "faketensor": [2, 8], "potenti": [2, 4, 19, 30, 33], "correctli": [2, 25, 33], "free": [2, 8, 30, 35], "wise": 2, "mai": [2, 33], "loop": [2, 10, 18, 19, 25], "shape": [2, 3, 4, 5, 8, 10, 17, 19, 22, 25, 27, 30, 33], "error": [2, 8, 25, 33], "have": [2, 4, 5, 8, 12, 13, 19, 25, 26, 29, 31, 33], "first": [2, 3, 4, 5, 9, 13, 15, 17, 19, 28, 36], "graphbasedcontext": [2, 25, 33], "globaltracingcontext": [2, 25, 33], "global": 2, "without": [2, 19, 20, 26, 33, 35], "refer": [2, 3, 4, 7, 8, 26, 33], "There": [2, 5, 8, 17, 33], "global_tracing_context": [2, 25, 33], "torch_handl": 2, "torch": [2, 3, 4, 5, 8, 9, 11, 12, 14, 17, 19, 21, 22, 23, 24, 27, 29, 30, 31, 32, 33], "globaltracingexit": [2, 25, 33], "globaltracingtorchhandl": [2, 25, 33], "static": 2, "deregist": 2, "graph_based_context": 2, "regist": [2, 4, 9, 35], "try_deregist": 2, "attempt": [2, 4, 8, 25, 33], "Will": 2, "w": 2, "success": [2, 33], "otherwis": [2, 3, 4, 5, 8, 25, 30, 33], "try_regist": 2, "appli": [2, 4, 5, 8, 9, 10, 14, 19, 20, 21, 22, 25, 28, 29, 32, 33], "target": [2, 7, 8, 9, 25, 33], "callabl": [2, 3, 4, 5, 8, 9, 32], "arg": [2, 3, 4, 5, 7, 8, 9, 19, 25, 33], "interventionproxi": [2, 3, 4, 5, 8], "helper": [2, 5], "directli": [2, 5, 8, 20, 25, 33], "try": [2, 8, 25, 33], "fakemod": 2, "test": [2, 5, 13, 30], "traceabl": [2, 8, 33], "bridge_backend_handl": 2, "self": [2, 5, 15, 19, 25, 33], "capac": 2, "bytearrai": [2, 33], "byte": [2, 33], "complex": [2, 8, 11, 33], "number": [2, 5, 8, 30, 31, 33], "cond": [2, 12, 18, 33], "condit": [2, 7, 8, 10], "entrypoint": [2, 5], "act": [2, 3, 5, 32, 33], "evalu": [2, 8, 30], "boolean": [2, 8, 30, 33], "bodi": [2, 18, 33], "union": [2, 4, 5, 7, 8, 25, 33], "setup": [2, 8, 36], "ex": [2, 4, 8], "sequenti": [2, 5, 7, 8, 11, 19, 26, 33], "earlystopprotocol": [2, 8, 33], "float": [2, 7, 19, 33], "log": [2, 7, 8, 12, 18, 19, 26, 33], "via": [2, 4, 5, 8, 17, 18, 24, 33], "vi": [2, 8], "visual": [2, 4, 8], "A": [2, 8, 18, 22, 25, 29, 33], "conting": 2, "_condit": 2, "conditionalmanag": [2, 8], "attach": [2, 4, 5, 8, 15, 25, 33], "_conditional_dict": 2, "map": [2, 4, 7, 8, 30], "conditionalprotocol": [2, 8], "name": [2, 3, 4, 5, 7, 8, 14, 15, 25, 29, 33], "_conditioned_nodes_dict": 2, "condition": 2, "_conditional_stack": 2, "stack": [2, 8, 31], "visit": [2, 8], "conditonalprotocol": 2, "add_conditioned_nod": [2, 8], "conditon": [2, 8], "latest": [2, 8], "is_node_condit": [2, 8], "peek": 2, "lastest": 2, "non": [2, 33], "empti": 2, "option": [2, 3, 4, 5, 8, 19, 20, 32, 33], "pop": [2, 8], "push": 2, "conditional_nod": 2, "session": [2, 5, 7, 10, 18, 19, 32], "root": [2, 3, 4, 8, 9, 33], "collect": [2, 3, 4, 5, 8, 9, 25, 30, 33], "new": [2, 4, 5, 8, 12, 13, 17, 19, 20, 25, 27, 33], "subsequ": [2, 4, 22, 33], "referenc": 2, "item": [2, 14, 18, 28, 29, 30, 31, 33], "over": [2, 5, 18, 19, 29, 33], "module_path": [3, 4, 8, 33], "tree": [3, 21], "repres": [3, 5, 6, 8, 28, 30], "rel": [3, 4, 8], "separ": [3, 8, 9, 14, 29, 33], "e": [3, 9, 26, 33], "x": [3, 5, 8, 9, 28, 30, 32, 33], "h": [3, 5, 9, 11, 14, 15, 16, 17, 19, 20, 21, 22, 23, 25, 27, 28, 29, 32, 33], "_fake_output": 3, "_scan": 3, "multipl": [3, 5, 8, 10, 20, 26, 28, 33], "than": [3, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33], "_fake_input": 3, "reset": [3, 5, 8], "forward": [3, 5, 8, 9, 15, 19, 20, 28, 29, 30, 33], "_call_it": 3, "integ": [3, 12, 33], "_tracer": 3, "must": [3, 8, 14, 33], "manual": [3, 33], "properti": [3, 4, 5, 8, 15, 33], "denot": [3, 4, 22], "wish": [3, 4, 5, 20, 33], "therefor": [3, 4, 8, 14, 15, 33], "time": [3, 4, 5, 8, 10, 12, 19, 31, 33], "include_fn": 3, "ran": [3, 33], "against": 3, "includ": [3, 17, 33], "final": [3, 5, 33], "itself": [3, 5, 8, 19, 33], "named_modul": 3, "overrid": [3, 5], "nn": [3, 4, 5, 8, 11, 19, 30, 31, 32, 33], "extend": [4, 18, 33], "easier": 4, "interven": [4, 10, 13, 27, 33], "entri": 4, "hook": [4, 5, 8, 9, 29, 33], "hookmodel": 4, "remov": [4, 5, 8, 13, 20, 33], "hookhandl": [4, 5, 33], "module_kei": 4, "input_hook": [4, 33], "output_hook": [4, 33], "__enter__": [4, 6, 25, 33], "__exit__": [4, 6, 25, 33], "design": [4, 33], "signatur": 4, "removablehandl": 4, "interventionhandl": [4, 5, 33], "batch_group": [4, 33], "interventionprotocol": [4, 33], "total": [4, 14, 33], "counter": 4, "ha": [4, 5, 8, 9, 24, 26, 30, 33], "been": [4, 5, 8, 9, 15, 19, 24, 26, 33], "count": [4, 8], "tri": [4, 33], "protocol": [4, 8, 33], "overal": 4, "classmethod": [4, 8], "proxy_valu": [4, 8, 15, 25, 33], "module1": [4, 8], "module2": [4, 8], "_description_": [4, 5], "get_intervent": [4, 33], "interventionnod": 4, "activ": [4, 5, 26, 29, 31, 32, 33, 36], "intervention_handl": [4, 33], "form": [4, 5, 8, 14, 33], "exist": [4, 5, 8, 32], "batch_start": 4, "readi": [4, 8], "yet": [4, 5, 32, 33], "continu": [4, 30, 33], "narrow": [4, 33], "select": 4, "relev": [4, 8, 33], "view": [4, 8, 25, 30, 33], "oppos": 4, "copi": [4, 5, 8, 30], "downstream": [4, 5], "origin": [4, 5, 6, 8, 11, 13, 20, 25, 26, 30, 33], "prevent": [4, 31], "effect": [4, 11, 20, 29, 33], "bath": 4, "outsid": [4, 8, 33], "preview": 4, "either": [4, 5, 24, 26, 33], "handler": 4, "modifi": [4, 20, 25, 26, 33], "style": [4, 8], "sub": [4, 5, 8, 33], "addit": [4, 19, 26, 33], "delet": [4, 16, 33], "listen": [4, 8, 33], "lm_head": [4, 5, 11, 19, 20, 21, 26, 28, 29, 32, 33], "devic": [4, 5, 8, 14, 16, 17, 21, 22, 23, 25, 27, 30, 33], "retriev": [4, 9, 19, 33], "real": [4, 5, 25, 30, 33], "grad": [4, 8, 17, 29, 33], "stop": [4, 7, 8, 10, 26], "after": [4, 5, 9, 16, 17, 19, 22, 24, 26, 28, 29, 32, 33], "creation": 4, "updateprotocol": [4, 8], "main": [5, 33], "wrap": [5, 8, 9, 11, 14, 33], "gpt2": [5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 33, 36], "repo": 5, "device_map": [5, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33], "cuda": [5, 16, 17, 21, 22, 23, 27, 28, 30, 31], "declar": 5, "entail": 5, "automodelforcausallm": [5, 33], "unus": [5, 30], "acceler": 5, "packag": [5, 9, 11, 12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 32, 33, 34], "encompass": 5, "displai": [5, 8, 32, 33], "structur": 5, "abil": [5, 29], "gpt2lmheadmodel": [5, 32, 33], "gpt2model": [5, 32, 33], "wte": [5, 13, 32, 33], "embed": [5, 13, 32, 33], "50257": [5, 32, 33], "768": [5, 19, 22, 25, 32, 33], "wpe": [5, 32, 33], "1024": [5, 19, 32, 33], "drop": [5, 32, 33], "dropout": [5, 32, 33], "p": [5, 32, 33], "inplac": [5, 9, 20, 32, 33], "modulelist": [5, 32, 33], "12": [5, 12, 14, 18, 19, 20, 21, 25, 26, 29, 30, 32, 33], "gpt2block": [5, 32, 33], "ln_1": [5, 32, 33], "layernorm": [5, 32, 33], "ep": [5, 32, 33], "1e": [5, 30, 32, 33], "05": [5, 32, 33], "elementwise_affin": [5, 32, 33], "attn": [5, 29, 32, 33], "gpt2attentionalt": 5, "c_attn": [5, 32, 33], "conv1d": [5, 32, 33], "c_proj": [5, 29, 32, 33], "attn_dropout": [5, 32, 33], "resid_dropout": [5, 32, 33], "queri": 5, "wrappermodul": [5, 9, 32, 33], "ln_2": [5, 32, 33], "gpt2mlp": [5, 32, 33], "c_fc": [5, 32, 33], "newgeluactiv": [5, 32, 33], "ln_f": [5, 21, 32, 33], "linear": [5, 11, 29, 31, 32, 33], "in_featur": [5, 31, 32, 33], "out_featur": [5, 31, 32, 33], "bia": [5, 31, 32, 33], "explicit": [5, 33], "control": [5, 33], "level": [5, 9, 15, 30, 33], "specif": [5, 29, 33], "spawn": 5, "runner": [5, 24, 33], "metadispatch": 5, "_dispatch_kei": 5, "becaus": [5, 28], "evil": 5, "ty": 5, "caden": [5, 17, 27, 31], "implement": [5, 8, 34], "wrapper": [5, 9, 33], "gain": [5, 32], "proxy_class": [5, 8, 25, 33], "_model_kei": 5, "kind": [5, 9, 18, 33], "usual": [5, 12, 21, 33], "hug": [5, 32], "face": [5, 32], "checkpoint": [5, 31], "custom": [5, 10], "_dispatch": 5, "_custom_model": 5, "repoid_path_model": 5, "_envoi": [5, 25, 33], "_session": 5, "clear_edit": [5, 20, 33], "dispatch_model": 5, "dispatch": [5, 29, 30, 32, 33], "_load": 5, "futur": 5, "place": [5, 17, 19, 20, 33], "editor": [5, 20, 33], "_execut": [5, 33], "raw": 5, "openai": [5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 32, 33], "commun": [5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 32, 33], "complexmodul": 5, "def": [5, 14, 15, 19, 25, 29, 30, 33], "__init__": [5, 8, 9, 19, 25, 33], "super": [5, 19, 25, 33], "l0": 5, "gpt2_edit": 5, "msg_prompt": 5, "clone": [5, 17, 25, 27, 33, 34], "original_output": [5, 25], "edited_output": 5, "fn": [5, 8, 9, 33], "intervention_graph": [5, 33], "re": [5, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "compil": 5, "last": [5, 8, 15, 17, 19, 20, 21, 22, 25, 26, 33], "total_batch_s": 5, "garbag": 5, "clear": [5, 20, 33], "memori": [5, 8, 25, 30, 33], "group": 5, "alia": 5, "popul": [5, 8, 15, 16, 19, 33], "fake": [5, 8, 25, 33], "tenor": 5, "dim": [5, 11, 19, 20, 21, 25, 26, 29, 30, 31, 32, 33], "noop": 5, "remotebackend": 5, "url": 5, "invoker_arg": [5, 33], "short": 5, "inspect": [5, 8, 15, 25, 33], "complic": 5, "prepare_input": [5, 8, 25, 33], "valueerror": [5, 8, 15, 33], "noth": [5, 8, 31], "wai": [5, 17, 19, 25, 28, 31, 33], "extrem": 5, "our": [5, 10, 12, 14, 19, 25, 26, 28, 29, 30, 33], "ordereddict": [5, 11, 33], "input_s": [5, 11, 33], "hidden_dim": [5, 11, 33], "output_s": [5, 11, 33], "layer1": [5, 11, 33], "sigma1": 5, "sigmoid": 5, "layer2": [5, 11, 33], "sigma2": 5, "example_input": 5, "rand": [5, 12, 33], "singl": [5, 8, 18, 26, 30, 33], "l2_input": [5, 33], "l2_output": 5, "second": [5, 13, 17, 33], "divid": 5, "scope": [5, 33], "inner": [5, 19, 32, 33], "simpli": [5, 19, 24, 33], "expect": [5, 20, 33], "example_input2": 5, "output1": 5, "output2": 5, "languag": [5, 24, 33], "token": [5, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "custom_model": 5, "generationmixin": 5, "config": [5, 7, 24, 26, 28, 30, 33], "file": [5, 15, 24, 25, 33], "repositori": 5, "pretrainedconfig": 5, "lm": 5, "pretrainedtoken": 5, "automodel": 5, "auto": [5, 12, 13, 14, 15, 17, 18, 19, 20, 25, 26, 27, 29, 31, 32, 33], "pretrainedmodel": 5, "languagemodelproxi": 5, "idx": [5, 30, 33], "t": [5, 8, 14, 19, 25, 26, 28, 29, 31, 32, 33], "pad": [5, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33], "mean": [5, 8, 25, 26, 29, 33], "shift": [5, 32], "care": [5, 9, 33], "_type_": 5, "tokenindex": 5, "dimens": [5, 19, 25, 29, 30, 31, 33], "neg": 5, "left": [5, 22, 30], "equival": 5, "aid": 5, "unifiedtransform": 5, "transformerlen": 5, "hookedtransform": 5, "constructor": 5, "from_pretrained_no_process": 5, "from_pretrain": 5, "obj": [6, 33], "restor": [6, 20, 33], "patcher": [6, 25, 33], "apiconfigmodel": 7, "host": [7, 26, 33], "dev": 7, "ssl": 7, "apikei": 7, "job_id": 7, "model_config": 7, "classvar": 7, "configdict": 7, "configur": [7, 24, 33], "conform": 7, "pydant": 7, "model_field": 7, "fieldinfo": 7, "annot": [7, 32], "nonetyp": 7, "requir": [7, 24, 29, 31, 33, 35], "metadata": 7, "field": [7, 30, 33], "__fields__": 7, "v1": 7, "appconfigmodel": 7, "remote_log": 7, "configmodel": 7, "api": [7, 24, 33, 35], "app": 7, "respons": [7, 8, 29, 30], "responsemodel": 7, "statu": [7, 33], "jobstatu": 7, "descript": 7, "receiv": [7, 24, 26, 33], "datetim": 7, "session_id": 7, "enumer": [7, 28, 30, 32], "resultmodel": 7, "basennsightmodel": 7, "type_nam": 7, "liter": 7, "arbitrary_types_allow": 7, "dictmodel": 7, "tracermodel": 7, "iteratormodel": 7, "sessionmodel": 7, "nodemodel": 7, "slicemodel": 7, "tensormodel": 7, "primitivemodel": 7, "tuplemodel": 7, "listmodel": 7, "ellipsismodel": 7, "discrimin": 7, "aftervalid": 7, "slice": 7, "strict": 7, "ellipsi": 7, "functionmodel": 7, "function_nam": 7, "functionwhitelisterror": 7, "graphmodel": 7, "forwardref": 7, "graphtyp": 7, "node_refer": 7, "nodereferencetyp": 7, "primitivetyp": 7, "valuetyp": 7, "builtin_function_or_method": 7, "method_descriptor": 7, "primit": 7, "step": [7, 19, 23, 30, 31, 32, 33], "invoker_input": [7, 33], "individu": [8, 29], "graph_id": 8, "compos": [8, 33], "preserv": [8, 20, 33], "extra": 8, "aliv": [8, 25, 33], "consid": [8, 29], "still": [8, 32, 33], "name_idx": 8, "target_nam": 8, "previou": [8, 33], "uniqu": 8, "possibl": [8, 13, 24, 26, 33], "essenti": 8, "faketensormod": [8, 25, 33], "catch": [8, 25, 33], "fulfil": [8, 33], "These": 8, "construct": 8, "recurs": 8, "newli": [8, 25, 33], "titl": [8, 28, 29, 32], "graphic": 8, "pygraphviz": 8, "param": [8, 30], "directori": 8, "content": 8, "show": [8, 19, 28, 29, 32, 33], "imag": 8, "action": [8, 33], "AND": 8, "ones": [8, 33], "datatyp": [8, 33], "set_valu": [8, 33], "bi": 8, "similarli": [8, 33], "ceas": 8, "destroi": [8, 15, 33], "remain": 8, "weak": 8, "arg_depend": [8, 33], "cond_depend": 8, "weakref": 8, "dead": 8, "clean": [8, 28, 29], "v": [8, 24, 30, 33], "assum": [8, 17, 33], "destruct": 8, "els": [8, 12, 15, 25, 29, 30, 33], "remaining_depend": [8, 33], "less": 8, "correct": [8, 19, 22, 25, 28, 29, 30, 33], "preprocess": 8, "redund": 8, "remaining_listen": [8, 33], "event": 8, "now": [8, 19, 20, 28, 32, 33], "_valu": [8, 15, 33], "_empti": [8, 15, 25, 33], "never": [8, 15, 19, 24, 25, 31, 33], "viz_graph": 8, "agraph": 8, "backend_nam": 8, "edg": 8, "inher": 8, "differenti": 8, "magic": 8, "__torch_function__": [8, 25, 33], "proxy_wrapp": 8, "problemat": 8, "sometim": 8, "applymoduleprotocol": 8, "__call__": [8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "wont": 8, "trigger": 8, "set_modul": 8, "applymodul": 8, "get_modul": 8, "bridgeprotocol": 8, "connect": 8, "anoth": [8, 21, 26, 33], "bridgeexcept": 8, "get_bridg": 8, "set_bridg": 8, "has_bridg": 8, "peek_graph": 8, "statement": [8, 12, 18, 33], "get_condit": 8, "cond_node_nam": 8, "has_condit": 8, "peek_condit": 8, "pop_condit": 8, "push_condit": 8, "earlystopexcept": [8, 33], "stop_point_nod": 8, "gradprotocol": 8, "backward": [8, 17, 19, 29, 30, 33], "register_hook": [8, 17], "backward_idx": 8, "localbackendexecuteprotocol": 8, "localmixin": [8, 33], "lockprotocol": 8, "who": [8, 11], "won": [8, 33], "might": [8, 33], "power": [8, 32, 33], "swapprotocol": [8, 33], "swap": [8, 17, 26, 30, 33], "get_swap": [8, 33], "new_valu": 8, "valueprotocol": 8, "facilit": 8, "matter": [8, 19, 33], "id_to_graph": 8, "graph_stack": 8, "bridged_nod": 8, "defaultdict": 8, "entiti": 8, "ti": [8, 15, 33], "add_bridge_proxi": 8, "bridge_proxi": 8, "correspond": [8, 32, 33], "get_bridge_proxi": 8, "get_graph": 8, "hierarch": 8, "pop_graph": 8, "throughout": [9, 25], "element": [9, 14, 33], "everi": [9, 26, 29, 31, 32, 33], "overridden": 9, "subclass": [9, 33], "although": 9, "recip": 9, "instanc": [9, 20, 30, 33], "afterward": 9, "former": [9, 33], "latter": [9, 33], "silent": 9, "ignor": [9, 33, 36], "cl": [9, 33], "member": 9, "fetch_attr": 9, "hierarchi": [9, 33], "fetch": 9, "__class__": 9, "debug": [10, 25, 33], "persist": [10, 20, 33], "lora": 10, "train": [10, 15, 19, 30], "interpret": [11, 33, 34], "\u025bn": [11, 34], "sa\u026at": [11, 34], "manipul": [11, 34], "doc": [11, 33], "tutori": [11, 29, 30, 33, 34], "capabl": [11, 33], "net": [11, 33], "39": [11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33], "walkthrough": [11, 29, 34, 36], "invent": 11, "hidden_state_output": 11, "hidden_state_input": 11, "develop": [11, 33], "measur": 11, "argmax": [11, 20, 21, 26, 30, 33], "met": [12, 33], "rand_int": [12, 33], "randint": [12, 33], "low": [12, 33], "high": [12, 30, 31, 33], "random": [12, 30, 33], "even": [12, 15, 17, 21, 33], "odd": [12, 33], "opt": [12, 14, 18, 19, 20, 25, 26, 33], "homebrew": [12, 14, 18, 19, 20, 25, 26, 33], "anaconda3": [12, 14, 18, 19, 20, 25, 26, 33], "env": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 33], "nnsight_loc": [12, 14, 18, 19, 20, 25, 26, 33], "lib": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 32, 33], "python3": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 32, 33], "site": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 33], "tqdm": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 30, 31], "py": [12, 13, 14, 15, 17, 18, 19, 20, 25, 26, 27, 31, 32, 33], "21": [12, 13, 14, 17, 18, 19, 20, 24, 25, 26, 27, 29, 31, 33], "tqdmwarn": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "iprogress": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "found": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31, 33], "pleas": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34], "jupyt": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "ipywidget": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "http": [12, 13, 14, 17, 18, 19, 20, 24, 25, 26, 27, 31, 32, 33], "readthedoc": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "io": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "en": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "stabl": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "user_instal": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "html": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "autonotebook": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "notebook_tqdm": [12, 13, 14, 17, 18, 19, 20, 25, 26, 27, 31], "tokenization_utils_bas": [12, 14, 18, 19, 20, 25, 33], "1601": [12, 14, 18, 19, 20, 25, 33], "futurewarn": [12, 13, 14, 18, 19, 20, 25, 33], "clean_up_tokenization_spac": [12, 14, 18, 19, 20, 25, 33], "behavior": [12, 14, 18, 19, 20, 25, 30, 33], "deprec": [12, 13, 14, 18, 19, 20, 25, 33], "v4": [12, 14, 18, 19, 20, 25, 33], "45": [12, 14, 15, 18, 19, 20, 25, 32, 33], "detail": [12, 14, 18, 19, 20, 25, 29, 33], "issu": [12, 14, 18, 19, 20, 25, 33], "github": [12, 14, 18, 19, 20, 25, 33, 34], "com": [12, 14, 18, 19, 20, 25, 33], "31884": [12, 14, 18, 19, 20, 25, 33], "warn": [12, 13, 14, 18, 19, 20, 24, 25, 26, 30, 32, 33], "gpt2tokenizerfast": [12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 32, 33], "note": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33], "fast": [12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "faster": [12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "encod": [12, 13, 14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 28, 29, 30, 31, 32, 33], "follow": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "abov": [12, 20, 25, 26, 29, 33], "mutual": [12, 33], "exclus": [12, 33], "nest": [12, 18, 33], "non_rand_int": [12, 33], "madison": 13, "squar": 13, "garden": 13, "rockinglikebalboa": 13, "huggingface_hub": [13, 32], "file_download": 13, "1132": 13, "resume_download": 13, "download": [13, 24, 26, 33], "alwai": [13, 19, 20, 33], "resum": 13, "forc": 13, "force_download": 13, "max_new_token": [13, 22, 33], "_": [13, 18, 19, 28, 32, 33], "batch_decod": [13, 19, 33], "pad_token_id": [13, 19, 22, 33], "eos_token_id": [13, 19, 22, 33], "50256": [13, 19, 22, 33], "end": [13, 19, 22, 28, 33], "york": 13, "everyth": [14, 33], "part": [14, 31, 33], "box": [14, 33], "support": [14, 18, 33, 34], "einop": [14, 29, 33], "don": [14, 25, 26, 28, 29, 33], "anyth": [14, 25, 33], "special": [14, 33], "sum": [14, 17, 23, 29, 30, 31, 33], "tensor_sum": [14, 33], "flat": [14, 33], "flatten": [14, 30, 33], "coma": [14, 33], "custom_sum": [14, 33], "npytorch": 14, "191": 14, "2442": 14, "mp": [14, 25, 33], "grad_fn": [14, 16, 17, 21, 23, 25, 27], "lt": [14, 16, 17, 21, 23, 24, 25, 26, 27, 30, 33], "sumbackward0": [14, 23], "gt": [14, 15, 16, 17, 21, 23, 25, 27, 30, 33], "wide": [14, 33], "intermedi": [15, 18, 26, 30, 32, 33], "halt": [15, 33], "reduc": [15, 29, 33], "runtim": [15, 17, 33], "conserv": [15, 33], "resourc": [15, 33], "One": [15, 29, 30, 33], "particularli": [15, 33], "sae": [15, 33], "l1_out": [15, 33], "l1": [15, 33], "necessarili": [15, 33], "associ": [15, 32, 33], "As": [15, 25, 33], "termin": [15, 26, 33], "link": [15, 33], "beyond": [15, 33], "point": [15, 21, 33], "skip": [15, 29, 33], "earlier": [15, 26, 33], "cannot": [15, 33], "l2_out": [15, 33], "l2": [15, 33], "traceback": [15, 25, 33], "cell": [15, 25, 32, 33], "34": [15, 21, 25, 33], "src": [15, 25, 33], "56": [15, 33], "__str__": [15, 33], "52": [15, 17, 30, 33], "54": [15, 30, 33], "58": [15, 33], "f": [15, 28, 29, 30, 33], "__name__": [15, 25, 33], "50": [15, 30, 33], "42": [15, 30, 33], "43": [15, 30, 33], "44": [15, 33], "46": [15, 33], "47": [15, 30, 33], "48": [15, 33], "182": [15, 33], "172": [15, 33], "173": [15, 33], "174": [15, 33], "178": [15, 33], "179": [15, 33], "181": [15, 33], "befor": [15, 17, 22, 24, 25, 26, 28, 31, 33], "184": [15, 24, 33], "desir": 16, "0505": [16, 23, 27], "1728": [16, 23, 27], "1690": [16, 23, 27], "0096": [16, 23, 27], "1280": [16, 23, 27], "0687": [16, 23, 27], "7494": [16, 23, 27], "9057": [16, 23, 27], "3024": [16, 23, 27], "0418": [16, 23, 27], "2964": [16, 23, 27], "8677": [16, 23, 27], "2960": [16, 23, 27], "6686": [16, 23, 27], "6642": [16, 23, 27], "2391": [16, 23, 27], "6064": [16, 23, 27], "2263": [16, 23, 27], "1537": [16, 23, 27], "8917": [16, 23, 27], "8651": [16, 23, 27], "0588": [16, 23, 27], "9866": [16, 23, 27], "9188": [16, 23, 27], "4460": [16, 23, 27], "4285": [16, 23, 27], "9": [16, 19, 23, 24, 25, 27, 30, 33], "3065": [16, 23, 27], "0528": [16, 23, 27], "7946": [16, 23, 27], "5556": [16, 23, 27], "6286": [16, 23, 27], "7258": [16, 23, 27], "7969": [16, 23, 24, 27, 33], "6714": [16, 23, 27], "0683": [16, 23, 27], "0481": [16, 23, 27], "addbackward0": [16, 17, 23], "coupl": [17, 33], "requires_grad": [17, 19, 33], "share": [17, 27, 31, 33], "conda": [17, 27, 31], "interp": [17, 27, 31], "hello": [17, 19, 33], "world": [17, 31], "5216": 17, "1755": 17, "4617": 17, "1919": 17, "0204": 17, "0075": 17, "9841": 17, "2175": 17, "5851": 17, "5212": 17, "2286": 17, "7334": 17, "retain_grad": 17, "hidden_states_grad": 17, "28": [17, 33], "7976": 17, "282": 17, "5981": 17, "868": 17, "7354": 17, "120": 17, "1743": 17, "2264": 17, "168": 17, "6449": 17, "79": [17, 26, 33], "4181": 17, "253": 17, "6225": 17, "1322": [17, 19], "1293": 17, "208": 17, "3980": 17, "19": [17, 29, 33], "5545": 17, "509": 17, "9857": 17, "better": [17, 33], "demonstr": [17, 20, 24, 25, 29, 33], "ablat": [17, 33], "zero": [17, 19, 32, 33], "hidden_states_grad_befor": 17, "hidden_states_grad_aft": 17, "scalabl": [18, 29, 33], "sequenc": [18, 33], "close": [18, 33], "mimic": [18, 33], "convent": [18, 33], "syntax": [18, 33], "li": [18, 33], "append": [18, 28, 29, 30, 31, 32, 33], "num": [18, 33], "rang": [18, 28, 29, 30, 32, 33], "li2": [18, 33], "item_2": [18, 33], "nlist": [18, 33], "pari": [19, 20, 21, 26, 33], "r": [19, 33], "init": [19, 33], "randn": [19, 27, 33], "wb": [19, 33], "much": [19, 29, 33], "alter": [19, 20, 33], "a_x": [19, 33], "matmul": [19, 33], "ba_x": [19, 33], "variabl": [19, 24, 26, 30, 33], "answer": [19, 28, 29, 33], "answer_token": [19, 33], "lora_dim": [19, 33], "fulli": [19, 33], "achiev": [19, 33], "dataload": [19, 30, 33], "isn": [19, 33], "transmit": [19, 33], "dataset": [19, 30, 32, 33], "100": [19, 24, 25, 26, 30, 33], "pair": [19, 30, 33], "blank": [19, 33], "adamw": [19, 33], "lr": [19, 30, 33], "correct_token": [19, 33], "entropi": [19, 33], "loss": [19, 30, 33], "cross_entropi": [19, 33], "arent": [19, 33], "zero_grad": [19, 30, 33], "weight": [19, 30, 31, 33], "inde": [19, 33], "5262": 19, "6452": 19, "8448": 19, "7407": 19, "4497": 19, "7200": 19, "0452": 19, "0630": 19, "7231": 19, "0991": 19, "3883": 19, "1719": 19, "0024": 19, "1490": 19, "5580": 19, "9070": 19, "1946": 19, "8469": 19, "8173": 19, "8333": 19, "1722": 19, "8518": 19, "5542": 19, "3361": 19, "6813": 19, "4550": 19, "9903": 19, "5476": 19, "3310": 19, "5932": 19, "9087": 19, "0441": 19, "7201": 19, "0849": 19, "3954": 19, "1480": 19, "1580": 19, "9589": 19, "3856": 19, "0354": 19, "3153": 19, "6950": 19, "8893": 19, "9347": 19, "4812": 19, "4821": 19, "1935": 19, "6101": 19, "2552": [19, 21], "3574": 19, "9555": 19, "4472": 19, "2370": 19, "4913": 19, "7973": 19, "8731": 19, "2148": 19, "8610": 19, "5298": 19, "0569": 19, "7628": 19, "8462": 19, "2901": 19, "9117": 19, "6102": 19, "5902": 19, "0834": 19, "0093": 19, "4495": 19, "3539": 19, "0740": 19, "3545": 19, "7871": 19, "8562": 19, "4963": 19, "9433": 19, "7392": 19, "9859": 19, "2827": 19, "3862": 19, "7453": 19, "4021": 19, "0508": 19, "5621": 19, "2794": 19, "3303": 19, "7909": 19, "4538": 19, "1313": 19, "0819": 19, "6503": 19, "5484": 19, "9757": 19, "8230": 19, "5514": 19, "9135": 19, "0300": 19, "0671": 19, "7480": 19, "1516": 19, "9534": 19, "1927": 19, "4806": 19, "6110": 19, "9870": 19, "6541": 19, "2833": 19, "7793": 19, "5076": 19, "5269": 19, "0037": 19, "7067": 19, "3638": 19, "2859": 19, "9272": 19, "7984": 19, "2132": 19, "0050": [19, 33], "7416": 19, "1828": 19, "0524": 19, "0584": 19, "7789": 19, "1404": 19, "9479": 19, "1800": 19, "4593": 19, "6158": 19, "0084": 19, "6854": 19, "2958": 19, "7769": 19, "5156": [19, 24, 33], "5044": 19, "9969": 19, "7388": 19, "3761": 19, "2705": 19, "9826": 19, "8277": 19, "2302": 19, "9683": 19, "7128": 19, "2308": 19, "8993": 19, "8751": 19, "6339": 19, "9546": 19, "7678": 19, "9929": 19, "2638": 19, "4456": 19, "8543": 19, "5411": 19, "1332": 19, "5998": 19, "3486": 19, "3077": 19, "8154": 19, "5951": 19, "2131": 19, "0807": 19, "8615": 19, "6812": 19, "0719": 19, "7578": 19, "5100": 19, "6025": 19, "5490": 19, "3451": 19, "6261": 19, "4447": 19, "6631": 19, "9259": 19, "5568": 19, "2529": 19, "8272": 19, "2799": 19, "0383": 19, "9686": 19, "4911": 19, "3074": 19, "9068": 19, "7484": 19, "5957": 19, "3908": 19, "7700": 19, "4054": 19, "1650": 19, "8296": 19, "1858": 19, "1039": 19, "9361": 19, "1787": 19, "0026": 19, "2144": 19, "4693": 19, "6995": 19, "1395": [19, 21], "8447": 19, "4018": 19, "8409": 19, "6084": 19, "5108": 19, "0477": 19, "8995": [19, 27], "4809": 19, "2972": 19, "2091": 19, "9804": 19, "3483": 19, "7015": 19, "4362": 19, "6675": 19, "5581": 19, "4253": 19, "6306": 19, "4597": 19, "6652": 19, "9124": 19, "1657": 19, "6208": 19, "3349": 19, "8752": 19, "3011": 19, "0775": 19, "9528": 19, "5035": 19, "3898": 19, "9537": 19, "7455": 19, "4682": 19, "8253": 19, "3640": 19, "1378": [19, 27], "9405": 19, "de": [19, 33], "With": [19, 24, 33], "produc": [19, 30, 33], "temporari": [20, 33], "variant": [20, 33], "across": [20, 22, 33], "compar": [20, 26, 28, 33], "explor": [20, 32, 33], "hs11": [20, 33], "model_edit": 20, "unmodifi": [20, 33], "vatican": [20, 33], "original_token": [20, 33], "modified_token": [20, 33], "norigin": [20, 25, 33], "decod": [20, 21, 22, 26, 28, 30, 31, 32, 33, 36], "rome": [20, 33], "safe": [20, 33], "experiment": [20, 33], "cautious": [20, 33], "consequ": [20, 33], "ve": [20, 33], "revert": [20, 33], "chain": 21, "vocabularli": 21, "space": [21, 28, 30], "softmax": [21, 32], "vocabulari": 21, "36": [21, 33], "2875": 21, "35": [21, 33], "0115": 21, "38": [21, 30, 33], "0794": 21, "40": [21, 33], "5164": 21, "41": [21, 33], "3760": 21, "9194": 21, "68": 21, "8886": 21, "1562": [21, 24, 33], "71": 21, "8408": 21, "80": [21, 30, 33], "4194": 21, "78": 21, "1206": 21, "82": 21, "2950": 21, "81": 21, "6519": 21, "83": [21, 30], "9940": 21, "94": [21, 25, 33], "4878": 21, "5194": 21, "85": 21, "6997": 21, "113": [21, 25, 33], "8675": 21, "111": [21, 25, 33], "8628": 21, "6634": 21, "116": 21, "7652": 21, "114": [21, 26], "8267": 21, "112": 21, "3621": 21, "8531": 21, "3007": 21, "91": [21, 25, 33], "8193": 21, "92": [21, 25, 30, 33], "9943": 21, "89": [21, 25, 33], "8382": 21, "6898": 21, "103": [21, 25, 33], "9307": 21, "102": [21, 33], "5054": 21, "105": 21, "1563": 21, "109": [21, 25, 33], "3099": 21, "110": [21, 25, 33], "4196": 21, "unsafeviewbackward0": 21, "198": [21, 33], "417": [21, 22, 33], "8765": [21, 22, 33], "318": [21, 22, 33], "257": [21, 33], "262": [21, 22, 33], "3504": [21, 33], "7372": [21, 33], "6342": [21, 22, 33], "el": 21, "middl": 21, "centr": 21, "three": 22, "hidden_states1": 22, "hidden_states2": 22, "hidden_states3": 22, "architectur": [22, 36], "right": [22, 33], "detect": 22, "padding_sid": 22, "464": [22, 33], "412": [22, 33], "733": [22, 33], "287": [22, 33], "1748": [22, 33], "286": [22, 33], "290": [22, 33], "themselv": [23, 33], "whatev": 23, "variou": [23, 32, 33], "hidden_states_pr": [23, 27], "hs_sum": 23, "hs_edit": 23, "501": 23, "2959": 23, "3464": 23, "1231": 23, "1269": 23, "500": 23, "2863": 23, "4239": 23, "2272": 23, "510": 23, "0453": 23, "504": 23, "2016": 23, "506": 23, "5983": 23, "493": 23, "2541": 23, "502": 23, "5923": 23, "498": 23, "4282": 23, "5919": 23, "505": 23, "9645": 23, "497": 23, "6317": 23, "5350": 23, "6895": 23, "5222": 23, "503": 23, "4496": 23, "508": 23, "1876": 23, "1610": 23, "3547": 23, "499": 23, "3093": 23, "507": 23, "2147": 23, "8499": 23, "7244": 23, "491": 23, "9894": 23, "3487": 23, "5013": 23, "8515": 23, "9245": 23, "0217": 23, "0928": 23, "9673": 23, "3641": 23, "3440": 23, "login": [24, 33], "sign": [24, 33], "set_default_api_kei": [24, 26, 33], "your_api_kei": [24, 26, 33], "instal": [24, 32, 33], "larger": [24, 33], "o": [24, 26, 33], "llama3": [24, 33], "gate": [24, 33], "environ": [24, 26, 33], "hf_token": [24, 26, 32, 33], "your_hugging_face_token": [24, 26, 33], "ll": [24, 32, 33], "2024": [24, 26, 33], "08": [24, 26, 33], "30": [24, 26, 33], "07": [24, 33], "150": [24, 33], "mainprocess": [24, 26, 33], "nnsight_remot": [24, 26, 33], "info": [24, 26, 33], "36ff46f0": [24, 33], "d81a": [24, 33], "4586": [24, 33], "b7e7": [24, 33], "eaf6f97d6c0b": [24, 33], "job": [24, 26, 33], "wait": [24, 26, 33], "approv": [24, 26, 33], "206": [24, 33], "398": [24, 33], "00": [24, 25, 26, 30, 33], "48m": [24, 33], "b": [24, 30, 33], "got": [24, 26, 33], "fork": [24, 26, 33], "parallel": [24, 26, 30, 33], "disabl": [24, 26, 33], "avoid": [24, 26, 33], "deadlock": [24, 26, 33], "explicitli": [24, 26, 33], "tokenizers_parallel": [24, 26, 33], "02": [24, 25, 33], "21mb": [24, 33], "4688": [24, 33], "9062": [24, 33], "2344": [24, 33], "6875": [24, 33], "9609": [24, 33], "2578": [24, 33], "5469": [24, 33], "6172": [24, 33], "4531": [24, 33], "1406": [24, 33], "1250": [24, 33], "7812": [24, 33], "8906": [24, 33], "1875": [24, 33], "1680": [24, 33], "5625": [24, 33], "9453": [24, 33], "3711": [24, 33], "3516": [24, 33], "3828": [24, 33], "9297": [24, 33], "3672": [24, 33], "2617": [24, 33], "4414": [24, 33], "6758": [24, 33], "6094": [24, 33], "0938": [24, 33], "7031": [24, 33], "8672": [24, 33], "1328": [24, 33], "5000": [24, 30, 33], "bfloat16": [24, 30, 33], "dynamiccach": [24, 33], "3750": [24, 33], "6250": [24, 33], "13": [24, 25, 29, 30, 33], "0000": [24, 29, 33], "8594": [24, 33], "9375": [24, 33], "5938": [24, 33], "5781": [24, 33], "0796": [24, 33], "8750": [24, 33], "4062": [24, 33], "9844": [24, 33], "2500": [24, 33], "7188": [24, 33], "realli": [24, 33], "techniqu": [24, 29, 33, 34], "avail": [24, 33], "encount": 25, "situat": 25, "messag": 25, "suggest": 25, "compat": 25, "tool": [25, 26, 32, 33], "number_of_token": 25, "modified_output": 25, "indexerror": [25, 33], "exc_typ": [25, 33], "exc_val": [25, 33], "exc_tb": [25, 33], "98": [25, 33], "_reset": [25, 33], "216": [25, 33], "214": [25, 33], "215": [25, 33], "218": [25, 33], "14": [25, 29, 30, 33], "16": [25, 29, 30, 31, 33], "18": [25, 29, 33], "__setitem__": [25, 33], "88": [25, 30, 32, 33], "90": [25, 33], "setitem": [25, 33], "270": [25, 33], "267": [25, 33], "269": [25, 33], "271": [25, 33], "272": [25, 28, 33], "273": [25, 33], "274": [25, 33], "275": [25, 33], "276": [25, 33], "106": [25, 33], "107": [25, 33], "108": [25, 33], "96": [25, 33], "93": [25, 30, 33], "theres": [25, 33], "131": [25, 33], "128": [25, 33], "did": [25, 33], "129": [25, 33], "133": [25, 33], "134": [25, 33], "135": [25, 33], "136": [25, 33], "isinst": [25, 30, 33], "137": [25, 33], "138": [25, 33], "20": [25, 29, 31, 33], "15": [25, 26, 29, 30, 33], "allow_non_fake_input": [25, 33], "shape_env": [25, 33], "shapeenv": [25, 33], "assume_static_by_default": [25, 33], "17": [25, 29, 33], "fake_mod": [25, 33], "fakecopymod": [25, 33], "exit_global_tracing_context": [25, 33], "22": [25, 33], "24": [25, 33], "25": [25, 30, 33], "26": [25, 33], "27": [25, 33], "330": [25, 33], "326": [25, 33], "328": [25, 33], "baseexcept": [25, 33], "312": [25, 33], "func": [25, 33], "305": [25, 33], "_variablefunctionsclass": [25, 33], "__qualname__": [25, 33], "306": [25, 33], "307": [25, 33], "308": [25, 33], "309": [25, 33], "310": [25, 33], "bound": [25, 30, 33], "ah": [25, 33], "cours": [25, 33], "abl": [25, 32, 33], "though": [25, 33], "under": [25, 33], "record": [25, 33], "doesn": [25, 33], "incur": [25, 33], "cost": [25, 30, 33], "throught": [25, 33], "least": [25, 33], "word": [25, 28, 32, 33], "caution": [25, 33], "relat": [25, 33], "effici": [25, 26, 29, 33], "off": [25, 31, 33], "best": [25, 33], "unsur": [25, 33], "again": [25, 33], "6286e": 25, "7258e": 25, "7969e": 25, "8255e": 25, "0698e": 25, "4242e": 25, "2749e": 25, "0404e": 25, "2988e": 25, "7030e": 25, "9210e": 25, "01": [25, 30], "5507e": 25, "4831e": 25, "4496e": 25, "2496e": 25, "4764e": 25, "5587e": 25, "8417e": 25, "7383e": 25, "9535e": 25, "1625e": 25, "4659e": 25, "9305e": 25, "2014e": 25, "6166e": 25, "3293e": 25, "1797e": 25, "6870e": 25, "9511e": 25, "3648e": 25, "5362e": 25, "2539e": 25, "4988e": 25, "2232e": 25, "4482e": 25, "8883e": 25, "5206e": 25, "3218e": 25, "5060e": 25, "2041e": 25, "8520e": 25, "3440e": 25, "0114e": 25, "7492e": 25, "4499e": 25, "5314e": 25, "0311e": 25, "3609e": 25, "4801e": 25, "6725e": 25, "0538e": 25, "5054e": 25, "9737e": 25, "5169e": 25, "9845e": 25, "4548e": 25, "7004e": 25, "8162e": 25, "5651e": 25, "8362e": 25, "5023e": 25, "9528e": 25, "4438e": 25, "7818e": 25, "0992e": 25, "8575e": 25, "1478e": 25, "6564e": 25, "2905e": 25, "3264e": 25, "9211e": 25, "6120e": 25, "6601e": 25, "5331e": 25, "2056e": 25, "6827e": 25, "7709e": 25, "1225e": 25, "9829e": 25, "9273e": 25, "6971e": 25, "6272e": 25, "2709e": 25, "0965e": 25, "4081e": 25, "4534e": 25, "4642e": 25, "0931e": 25, "8111e": 25, "1471e": 25, "9692e": 25, "1457e": 25, "1235e": 25, "2517e": 25, "2227e": 25, "2003e": 25, "1090e": 25, "8102e": 25, "4567e": 25, "7879e": 25, "2834e": 25, "7080e": 25, "6301e": 25, "9053e": 25, "9357e": 25, "7841e": 25, "0679e": 25, "0271e": 25, "0579e": 25, "7195e": 25, "1443e": 25, "7420e": 25, "3746e": 25, "5129e": 25, "9945e": 25, "1595e": 25, "5102e": 25, "2280e": 25, "4264e": 25, "5586e": 25, "8480e": 25, "8030e": 25, "3625e": 25, "1234e": 25, "5630e": 25, "4384e": 25, "0834e": 25, "3671e": 25, "9106e": 25, "9593e": 25, "0443e": 25, "2028e": 25, "1285e": 25, "6665e": 25, "1522e": 25, "0780e": 25, "5473e": 25, "9861e": 25, "5902e": 25, "2159e": 25, "0041e": 25, "03": 25, "4291e": 25, "5786e": 25, "3004e": 25, "3246e": 25, "4886e": 25, "1515e": 25, "5345e": 25, "1293e": 25, "2794e": 25, "1508e": 25, "1936e": 25, "7968e": 25, "2526e": 25, "0222e": 25, "4691e": 25, "1648e": 25, "6389e": 25, "7188e": 25, "1339e": 25, "8595e": 25, "7614e": 25, "3966e": 25, "0889e": 25, "5380e": 25, "0410e": 25, "5772e": 25, "4345e": 25, "2805e": 25, "1078e": 25, "2193e": 25, "4413e": 25, "2237e": 25, "5395e": 25, "3000e": 25, "7484e": 25, "1002e": 25, "5656e": 25, "1450e": 25, "1324e": 25, "2751e": 25, "7061e": 25, "3499e": 25, "0883e": 25, "2036e": 25, "4077e": 25, "0958e": 25, "4460e": 25, "6134e": 25, "8703e": 25, "2674e": 25, "2317e": 25, "0362e": 25, "1834e": 25, "3516e": 25, "0807e": 25, "0336e": 25, "0479e": 25, "9521e": 25, "9104e": 25, "0803e": 25, "2048e": 25, "7705e": 25, "8135e": 25, "4048e": 25, "3258e": 25, "1608e": 25, "2787e": 25, "8557e": 25, "1077e": 25, "0518e": 25, "6806e": 25, "2934e": 25, "4432e": 25, "5619e": 25, "1031e": 25, "2877e": 25, "0819e": 25, "9329e": 25, "8585e": 25, "9784e": 25, "1124e": 25, "2287e": 25, "7348e": 25, "0236e": 25, "4054e": 25, "5393e": 25, "5170e": 25, "5092e": 25, "3856e": 25, "0673e": 25, "6784e": 25, "3701e": 25, "4999e": 25, "3039e": 25, "5358e": 25, "9126e": 25, "1336e": 25, "2421e": 25, "4454e": 25, "0309e": 25, "3034e": 25, "0879e": 25, "4193e": 25, "5885e": 25, "5374e": 25, "4802e": 25, "9640e": 25, "6382e": 25, "5199e": 25, "1697e": 25, "1011e": 25, "9947e": 25, "5317e": 25, "3526e": 25, "4459e": 25, "6096e": 25, "6977e": 25, "5488e": 25, "9472e": 25, "5825e": 25, "1431e": 25, "7997e": 25, "4164e": 25, "7173e": 25, "5707e": 25, "2898e": 25, "0544e": 25, "1279e": 25, "0761e": 25, "0572e": 25, "4155e": 25, "1557e": 25, "0821e": 25, "4200e": 25, "1833e": 25, "3272e": 25, "4302e": 25, "4085e": 25, "8076e": 25, "1994e": 25, "6751e": 25, "7346e": 25, "0669e": 25, "9313e": 25, "0663e": 25, "6838e": 25, "5756e": 25, "8478e": 25, "4335e": 25, "1085e": 25, "5366e": 25, "3190e": 25, "4223e": 25, "6886e": 25, "7125e": 25, "6715e": 25, "9403e": 25, "6051e": 25, "9405e": 25, "9342e": 25, "0049e": 25, "0645e": 25, "4900e": 25, "7649e": 25, "0025e": 25, "6692e": 25, "1792e": 25, "7743e": 25, "0210e": 25, "8536e": 25, "3734e": 25, "2150e": 25, "1420e": 25, "3237e": 25, "1060e": 25, "8375e": 25, "4864e": 25, "0235e": 25, "7014e": 25, "0699e": 25, "2431e": 25, "2326e": 25, "2734e": 25, "1882e": 25, "0536e": 25, "6773e": 25, "9881e": 25, "4860e": 25, "0162e": 25, "5636e": 25, "0074e": 25, "6067e": 25, "3144e": 25, "1818e": 25, "4546e": 25, "0912e": 25, "1206e": 25, "3724e": 25, "7155e": 25, "4178e": 25, "2956e": 25, "6902e": 25, "5223e": 25, "4952e": 25, "7531e": 25, "1116e": 25, "8512e": 25, "7123e": 25, "6355e": 25, "8020e": 25, "8983e": 25, "3574e": 25, "3467e": 25, "8905e": 25, "3620e": 25, "8599e": 25, "2110e": 25, "5844e": 25, "4734e": 25, "9198e": 25, "9884e": 25, "7416e": 25, "6009e": 25, "6512e": 25, "0772e": 25, "8859e": 25, "4945e": 25, "9834e": 25, "2670e": 25, "6965e": 25, "0969e": 25, "9006e": 25, "9760e": 25, "3006e": 25, "3767e": 25, "9463e": 25, "3662e": 25, "5842e": 25, "1415e": 25, "5953e": 25, "7413e": 25, "7179e": 25, "1987e": 25, "8265e": 25, "9532e": 25, "1599e": 25, "9978e": 25, "8641e": 25, "0306e": 25, "1554e": 25, "0086e": 25, "8663e": 25, "8928e": 25, "1998e": 25, "5062e": 25, "2103e": 25, "7206e": 25, "5376e": 25, "5671e": 25, "2228e": 25, "6561e": 25, "8118e": 25, "8825e": 25, "8699e": 25, "3017e": 25, "3756e": 25, "2634e": 25, "6821e": 25, "7862e": 25, "6553e": 25, "7938e": 25, "6224e": 25, "7574e": 25, "0822e": 25, "9101e": 25, "3470e": 25, "4396e": 25, "8533e": 25, "3989e": 25, "3025e": 25, "0689e": 25, "5526e": 25, "0326e": 25, "0746e": 25, "0950e": 25, "1649e": 25, "4935e": 25, "1394e": 25, "0906e": 25, "1690e": 25, "2226e": 25, "2760e": 25, "4431e": 25, "0973e": 25, "3528e": 25, "9426e": 25, "5969e": 25, "5405e": 25, "7662e": 25, "4922e": 25, "4357e": 25, "8989e": 25, "2059e": 25, "9071e": 25, "3410e": 25, "0605e": 25, "5846e": 25, "7736e": 25, "0953e": 25, "5078e": 25, "7121e": 25, "4718e": 25, "8174e": 25, "7044e": 25, "0058e": 25, "1485e": 25, "8376e": 25, "5943e": 25, "8444e": 25, "8978e": 25, "0776e": 25, "0642e": 25, "3514e": 25, "2874e": 25, "2097e": 25, "6646e": 25, "6328e": 25, "2562e": 25, "4275e": 25, "6121e": 25, "4209e": 25, "1070e": 25, "9542e": 25, "7836e": 25, "0035e": 25, "0094e": 25, "7393e": 25, "4366e": 25, "8556e": 25, "2903e": 25, "5690e": 25, "6298e": 25, "2884e": 25, "0525e": 25, "3517e": 25, "1991e": 25, "9318e": 25, "2929e": 25, "2494e": 25, "4547e": 25, "6449e": 25, "0015e": 25, "5933e": 25, "1539e": 25, "7483e": 25, "9571e": 25, "6167e": 25, "1041e": 25, "1621e": 25, "2981e": 25, "2509e": 25, "9099e": 25, "9714e": 25, "3853e": 25, "2267e": 25, "2992e": 25, "8448e": 25, "9776e": 25, "0985e": 25, "9363e": 25, "0710e": 25, "9856e": 25, "9332e": 25, "8208e": 25, "6373e": 25, "4278e": 25, "3095e": 25, "1847e": 25, "4024e": 25, "2026e": 25, "0059e": 25, "7174e": 25, "0502e": 25, "2487e": 25, "4279e": 25, "2406e": 25, "9508e": 25, "2061e": 25, "5007e": 25, "5605e": 25, "6327e": 25, "6576e": 25, "1315e": 25, "5557e": 25, "7006e": 25, "6053e": 25, "9167e": 25, "5669e": 25, "4749e": 25, "2183e": 25, "4309e": 25, "5208e": 25, "1254e": 25, "7077e": 25, "9774e": 25, "3449e": 25, "4506e": 25, "2922e": 25, "2381e": 25, "1032e": 25, "7615e": 25, "3168e": 25, "8688e": 25, "5302e": 25, "0305e": 25, "4317e": 25, "4285e": 25, "6842e": 25, "0345e": 25, "0907e": 25, "3043e": 25, "8652e": 25, "4368e": 25, "0064e": 25, "9621e": 25, "6881e": 25, "6544e": 25, "9820e": 25, "2363e": 25, "4828e": 25, "5182e": 25, "0165e": 25, "8026e": 25, "3627e": 25, "1291e": 25, "0510e": 25, "2262e": 25, "6994e": 25, "1767e": 25, "2933e": 25, "8151e": 25, "8563e": 25, "1988e": 25, "6882e": 25, "8934e": 25, "4241e": 25, "5913e": 25, "1459e": 25, "3060e": 25, "9042e": 25, "1736e": 25, "4661e": 25, "1147e": 25, "0368e": 25, "1779e": 25, "8113e": 25, "0269e": 25, "9996e": 25, "8506e": 25, "3495e": 25, "3824e": 25, "6062e": 25, "2471e": 25, "6041e": 25, "8814e": 25, "3164e": 25, "5559e": 25, "3661e": 25, "7891e": 25, "9709e": 25, "2465e": 25, "9410e": 25, "3974e": 25, "8152e": 25, "7801e": 25, "4493e": 25, "0901e": 25, "9918e": 25, "8610e": 25, "2574e": 25, "8129e": 25, "2315e": 25, "0814e": 25, "8385e": 25, "2490e": 25, "4800e": 25, "8052e": 25, "3061e": 25, "8434e": 25, "5931e": 25, "2917e": 25, "9720e": 25, "3967e": 25, "4260e": 25, "1623e": 25, "1470e": 25, "2324e": 25, "5378e": 25, "0738e": 25, "3570e": 25, "2882e": 25, "0768e": 25, "7377e": 25, "5838e": 25, "1146e": 25, "9866e": 25, "3019e": 25, "8275e": 25, "4068e": 25, "7844e": 25, "6919e": 25, "9575e": 25, "8200e": 25, "8251e": 25, "5988e": 25, "7482e": 25, "0484e": 25, "6259e": 25, "5771e": 25, "8153e": 25, "3178e": 25, "6060e": 25, "5188e": 25, "0826e": 25, "3834e": 25, "7229e": 25, "6664e": 25, "6413e": 25, "0723e": 25, "3191e": 25, "4131e": 25, "6075e": 25, "2504e": 25, "3741e": 25, "7716e": 25, "4227e": 25, "3925e": 25, "5700e": 25, "7153e": 25, "3690e": 25, "1079e": 25, "3346e": 25, "9114e": 25, "0677e": 25, "0595e": 25, "8981e": 25, "1321e": 25, "9002e": 25, "9221e": 25, "1126e": 25, "5232e": 25, "5203e": 25, "8918e": 25, "8023e": 25, "7897e": 25, "6398e": 25, "3831e": 25, "3203e": 25, "7896e": 25, "1591e": 25, "2745e": 25, "0674e": 25, "1897e": 25, "5548e": 25, "0816e": 25, "4219e": 25, "2085e": 25, "0132e": 25, "1880e": 25, "2857e": 25, "3511e": 25, "3891e": 25, "3398e": 25, "5823e": 25, "1914e": 25, "7218e": 25, "5562e": 25, "9274e": 25, "1782e": 25, "9518e": 25, "3836e": 25, "5140e": 25, "8808e": 25, "9965e": 25, "6073e": 25, "4745e": 25, "4041e": 25, "8542e": 25, "0609e": 25, "0068e": 25, "6370e": 25, "4448e": 25, "0635e": 25, "6714e": 25, "0683e": 25, "0481e": 25, "selectbackward0": 25, "dispos": [25, 33], "nois": [25, 27, 33], "queue": [26, 33], "concurr": [26, 33], "offer": [26, 33], "benefit": [26, 29, 33], "back": [26, 33], "forth": [26, 33], "machin": [26, 33], "t1": [26, 33], "captur": [26, 33], "hs_79": [26, 33], "t1_tokens_out": [26, 33], "buckingham": [26, 33], "palac": [26, 33], "t2": [26, 33], "t2_tokens_out": [26, 33], "nt1": [26, 33], "49": [26, 30, 33], "072": 26, "1478bff8": 26, "622a": 26, "42cf": 26, "9ba0": 26, "78d3a0803a8b": 26, "097": 26, "423": 26, "69k": [26, 33], "20mb": 26, "strictli": [26, 33], "definit": [26, 33], "t3": [26, 33], "53": 26, "770": 26, "e794cd1a": 26, "3c4d": 26, "4300": 26, "ba68": 26, "6dcb6d8bda02": 26, "795": 26, "801": 26, "811": 26, "823": 26, "928": [26, 33], "66mb": 26, "mention": [26, 33], "vanilla": [26, 33], "instruct": [26, 30, 33], "entir": [26, 33], "often": [27, 33], "happen": [27, 28, 33], "flow": [27, 33], "assig": 27, "001": [27, 33], "hidden_states_post": 27, "clonebackward0": 27, "0244": 27, "1430": 27, "1384": 27, "0185": 27, "1173": 27, "0855": 27, "8112": 27, "3000": 27, "0057": 27, "3378": 27, "8778": 27, "2780": 27, "6427": 27, "6233": 27, "5877": 27, "2030": 27, "1590": 27, "9278": 27, "8584": 27, "0728": 27, "0145": 27, "9685": 27, "4962": 27, "4435": 27, "3371": 27, "1299": 27, "7784": 27, "5379": 27, "6941": 27, "7279": 27, "8105": 27, "6403": 27, "0599": 27, "0637": 27, "copyslic": 27, "indirect": [28, 29], "identif": 28, "task": [28, 29, 33, 36], "plotli": [28, 29], "express": [28, 29], "px": [28, 29], "corrupt": [28, 29], "clean_prompt": 28, "john": [28, 29], "mari": [28, 29], "went": [28, 29, 33], "gave": [28, 29], "bottl": 28, "milk": 28, "corrupted_prompt": 28, "That": [28, 33], "sure": [28, 33], "combin": [28, 29, 33], "correct_index": 28, "input_id": [28, 29, 30, 32], "incorrect_index": 28, "1757": 28, "5335": 28, "thank": 28, "whole": [28, 29, 33], "break": [28, 29], "n_layer": 28, "clean_token": [28, 29], "No": [28, 30], "clean_h": 28, "layer_idx": [28, 32], "clean_logit": [28, 29], "incorrect": 28, "clean_logit_diff": 28, "corrupted_logit": [28, 29], "corrupted_logit_diff": 28, "ioi_patching_result": 28, "_ioi_patching_result": 28, "token_idx": 28, "patched_logit": 28, "patched_logit_diff": 28, "improv": 28, "patched_result": 28, "3f": 28, "lambda": [28, 33], "token_label": 28, "fig": [28, 29], "imshow": [28, 29], "color_continuous_midpoint": [28, 29], "color_continuous_scal": [28, 29], "rdbu": [28, 29], "label": [28, 30, 32], "y": 28, "residu": [28, 29], "stream": [28, 29], "ioi": [28, 29], "124": 28, "adapt": 29, "neel": 29, "nanda": 29, "blog": [29, 32], "outperform": 29, "autom": 29, "colab": [29, 32, 33], "section": [29, 33], "scenario": [29, 33], "arena": 29, "sentenc": [29, 30], "shop": 29, "bag": 29, "tom": 29, "jame": 29, "park": 29, "ball": 29, "dan": 29, "sid": 29, "appl": 29, "martin": 29, "ami": 29, "drink": 29, "return_tensor": 29, "pt": [29, 31], "corrupted_token": 29, "answer_token_indic": 29, "j": 29, "get_logit_diff": 29, "correct_logit": 29, "gather": 29, "unsqueez": 29, "incorrect_logit": 29, "clean_baselin": 29, "diff": 29, "4f": 29, "corrupted_baselin": 29, "8138": 29, "metric": 29, "subject": 29, "eg": 29, "ioi_metr": 29, "baselin": 29, "approxim": [29, 36], "assumpt": 29, "corrupted_x": 29, "clean_x": 29, "corrupted_grad_x": 29, "cach": 29, "down": 29, "nice": [29, 33], "attent": 29, "head": [29, 32], "represent": [29, 30], "implicitli": 29, "per": 29, "snippet": [29, 33], "clean_out": 29, "corrupted_out": 29, "corrupted_grad": 29, "invoker_clean": 29, "attn_out": 29, "invoker_corrupt": 29, "corrupted_grad_act": 29, "clean_act": 29, "corrupted_act": 29, "rearrang": 29, "estim": 29, "rather": 29, "patching_result": 29, "zip": [29, 30], "residual_attr": 29, "64": 29, "numpi": [29, 32], "update_layout": 29, "xaxis_titl": 29, "yaxis_titl": 29, "simulatan": 29, "serv": [29, 33], "heurist": 29, "practic": [29, 33], "howev": [29, 33, 35], "decent": 29, "bad": 29, "big": [29, 33], "exclud": 29, "accur": 29, "pictur": 29, "po": 29, "adap": 30, "pyven": 30, "paper": 30, "zhengxuan": 30, "wu": 30, "et": 30, "al": 30, "trang": 30, "boundlessrotatedspaceintervent": 30, "sklearn": 30, "model_select": 30, "train_test_split": 30, "hf_dataset": 30, "get_linear_schedule_with_warmup": 30, "gc": 30, "tutorial_price_tagging_util": 30, "factual_sampl": 30, "bound_alignment_sampl": 30, "lower_bound_alignment_example_sampl": 30, "is_avail": 30, "sharpbai": 30, "alpaca": [30, 36], "7b": 30, "merg": 30, "torch_dtyp": 30, "free_unused_cuda_memori": 30, "empty_cach": 30, "runtimeerror": 30, "calculate_loss": 30, "subspace_proj": 30, "mask_weight": 30, "vocab_s": 30, "32001": 30, "shift_logit": 30, "contigu": 30, "shift_label": 30, "loss_fct": 30, "crossentropyloss": 30, "boundary_loss": 30, "intervention_boundari": 30, "compute_metr": 30, "eval_pr": 30, "eval_label": 30, "generate_output": 30, "total_count": 30, "correct_count": 30, "label_idx": 30, "ne": 30, "nonzero": 30, "squeez": 30, "actual_test_label": 30, "tolist": 30, "pred_test_label": 30, "uncom": 30, "return_dict": 30, "accuraci": 30, "round": 30, "publicli": 30, "templat": 30, "core": [30, 33], "english": 30, "sai": [30, 33], "ye": 30, "xx": 30, "dollar": 30, "amount": 30, "drawn": 30, "uniform": 30, "distribut": [30, 33], "99": 30, "hypothesi": 30, "solv": [30, 33], "boundari": 30, "higher": 30, "lower": 30, "incorpor": 30, "focu": 30, "align": 30, "raw_prealign": 30, "pricing_tag": 30, "prealign_dataset": 30, "from_dict": 30, "set_format": 30, "column": 30, "prealign_dataload": 30, "appear": 30, "describ": [30, 33], "further": 30, "n": [30, 32], "npleas": 30, "n9": 30, "76": 30, "no_grad": 30, "k": 30, "eval_metr": 30, "eval_dict": 30, "TO": 30, "BE": 30, "good": [30, 33], "625": 30, "08it": 30, "goal": 30, "sampl": 30, "counterfactu": 30, "rotat": [30, 32], "lastli": 30, "matrix": 30, "trainabl": 30, "raw_data": 30, "10000": 30, "raw_train": 30, "raw_temp": 30, "test_siz": 30, "random_st": 30, "raw_ev": 30, "raw_test": 30, "unpack": 30, "create_dataset": 30, "source_input_id": 30, "intervention_id": 30, "with_format": 30, "train_dataload": 30, "eval_dataload": 30, "test_dataload": 30, "embed_dim": 30, "hidden_s": 30, "gradient_accumulation_step": 30, "epoch": 30, "temperature_start": 30, "temperature_end": 30, "intervention_lay": 30, "t_total": 30, "warm_up_step": 30, "optimizer_param": 30, "rotate_lay": 30, "adam": 30, "schedul": 30, "num_warmup_step": 30, "num_training_step": 30, "target_total_step": 30, "temperature_schedul": 30, "linspac": 30, "total_step": 30, "set_temperatur": 30, "parametrizedrotatelay": 30, "parametr": 30, "moduledict": 30, "parametrizationlist": 30, "_orthogon": 30, "batch_subspace_swap": 30, "subspace_swap": 30, "all_ind": 30, "arang": [30, 32], "base_prompt": 30, "source_prompt": 30, "mixed_out": 30, "save_out": 30, "del": 30, "output_logit": 30, "train_iter": 30, "desc": 30, "log_dict": 30, "epoch_iter": 30, "counterfactual_output": 30, "loss_str": 30, "acc": 30, "set_postfix": 30, "1000": 30, "llamatokenizerfast": 30, "63": 30, "51": 30, "2905": 30, "125": 30, "09it": 30, "dictionary_learn": 31, "autoencod": [31, 36], "weights_path": 31, "pythia": 31, "70m": 31, "dedup": 31, "mlp_out_layer0": 31, "0_8192": 31, "ae_99000": 31, "activation_dim": 31, "512": 31, "dictionary_s": 31, "ae": 31, "load_state_dict": 31, "8192": [31, 33], "eleutherai": 31, "me": [31, 33], "ishmael": 31, "year": 31, "ago": 31, "mind": 31, "long": 31, "precis": [31, 33], "littl": [31, 33], "monei": 31, "my": 31, "purs": 31, "particular": [31, 33], "shore": 31, "thought": [31, 36], "sail": 31, "wateri": 31, "drive": 31, "spleen": 31, "regul": 31, "circul": 31, "whenev": 31, "myself": 31, "grow": 31, "grim": 31, "mouth": 31, "damp": 31, "drizzli": 31, "novemb": 31, "soul": 31, "involuntarili": 31, "paus": 31, "coffin": 31, "warehous": 31, "bring": [31, 33], "rear": 31, "funer": 31, "meet": 31, "especi": [31, 33], "hypo": 31, "upper": 31, "hand": 31, "strong": 31, "moral": 31, "principl": [31, 33], "deliber": 31, "street": 31, "knock": 31, "peopl": 31, "hat": 31, "account": [31, 35], "sea": 31, "soon": 31, "mlp_0": 31, "gpt_neox": 31, "gptneoxtokenizerfast": 31, "summed_activ": 31, "ab": 31, "sort": 31, "max": [31, 32], "top_activations_indic": 31, "topk": 31, "top": [31, 32], "compound": 31, "circuitsvi": 31, "colored_tokens_multi": 31, "str_token": 31, "grant": 32, "simplifi": 32, "glimps": 32, "evolv": 32, "stage": 32, "tradit": 32, "approach": 32, "focus": 32, "belief": 32, "spotlight": 32, "believ": [32, 33], "junctur": 32, "nostalgebraist": 32, "lesswrong": 32, "pip": [32, 33, 34], "matplotlib": 32, "pyplot": 32, "plt": 32, "seaborn": 32, "sn": 32, "np": 32, "ipython": [32, 33], "clear_output": [32, 33], "usr": 32, "dist": 32, "_token": 32, "userwarn": 32, "secret": 32, "authent": 32, "hub": 32, "tab": 32, "co": [32, 33], "googl": 32, "restart": 32, "reus": 32, "notebook": 32, "recommend": 32, "public": 32, "gpt2attent": 32, "analyz": [32, 33], "probabl": 32, "aggreg": 32, "confid": 32, "probs_lay": 32, "layer_output": 32, "obtain": [32, 35], "prob": 32, "cat": 32, "maximum": 32, "max_prob": 32, "unicode_escap": 32, "layer_token": 32, "input_word": 32, "output_word": 32, "cmap": 32, "diverging_palett": 32, "255": 32, "as_cmap": 32, "figur": 32, "figsiz": 32, "ax": 32, "heatmap": 32, "arrai": 32, "fmt": 32, "linewidth": 32, "cbar_kw": 32, "xlabel": 32, "ylabel": 32, "ytick": 32, "gca": 32, "xaxi": 32, "tick_top": 32, "set_label_posit": 32, "xtick": 32, "vertic": 32, "axi": 32, "guess": 32, "accord": 32, "color": 32, "ai": 33, "black": 33, "transpar": 33, "team": [33, 34], "lab": 33, "independ": 33, "alik": 33, "passion": 33, "collabor": 33, "profoundli": 33, "tini": 33, "upgrad": 33, "submodul": 33, "complementari": 33, "requires_grad_": 33, "tiny_model": 33, "reflect": 33, "talk": 33, "conclud": 33, "common": [33, 34], "myfil": 33, "txt": 33, "Being": 33, "enough": 33, "discuss": 33, "intuit": 33, "But": 33, "explanatori": 33, "until": 33, "defer": 33, "eventu": 33, "put": 33, "oh": 33, "why": 33, "fix": 33, "2687": 33, "3314": 33, "discov": 33, "coincident": 33, "l1_output": 33, "2341": 33, "3416": 33, "8637": 33, "5382": 33, "3792": 33, "1253": 33, "4137": 33, "5758": 33, "3158": 33, "1226": 33, "rest": 33, "analysi": 33, "highest": 33, "l1_amax": 33, "seamlessli": 33, "hold": 33, "didn": 33, "3797": 33, "those": 33, "7796": 33, "ml": 33, "exactli": 33, "influenc": 33, "l1_output_befor": 33, "0th": 33, "l1_output_aft": 33, "seem": 33, "380": 33, "379": 33, "382": 33, "caus": 33, "localbackend": 33, "147": 33, "143": 33, "145": 33, "148": 33, "149": 33, "151": 33, "152": 33, "154": 33, "155": 33, "462": 33, "454": 33, "455": 33, "456": 33, "458": 33, "459": 33, "460": 33, "463": 33, "465": 33, "466": 33, "467": 33, "468": 33, "469": 33, "470": 33, "471": 33, "472": 33, "473": 33, "574": 33, "571": 33, "573": 33, "474": 33, "475": 33, "todo": 33, "476": 33, "584": 33, "prepared_input": 33, "581": 33, "582": 33, "585": 33, "586": 33, "587": 33, "1553": 33, "_wrapped_call_impl": 33, "1551": 33, "_compiled_call_impl": 33, "misc": 33, "1552": 33, "_call_impl": 33, "1603": 33, "1600": 33, "bw_hook": 33, "backwardhook": 33, "full_backward_hook": 33, "backward_pre_hook": 33, "setup_input_hook": 33, "forward_cal": 33, "1604": 33, "_global_forward_hook": 33, "_forward_hook": 33, "1605": 33, "hook_id": 33, "1606": 33, "1607": 33, "1608": 33, "1609": 33, "mark": 33, "219": 33, "217": 33, "220": 33, "1616": 33, "1614": 33, "hook_result": 33, "1615": 33, "1618": 33, "1619": 33, "559": 33, "558": 33, "449": 33, "442": 33, "443": 33, "444": 33, "445": 33, "446": 33, "448": 33, "451": 33, "452": 33, "453": 33, "410": 33, "407": 33, "409": 33, "413": 33, "387": 33, "383": 33, "385": 33, "388": 33, "389": 33, "391": 33, "392": 33, "setitem_0": 33, "6063279136": 33, "wrong": 33, "henc": 33, "feasibl": 33, "varianc": 33, "2283": 33, "3262": 33, "8443": 33, "5498": 33, "3424": 33, "1178": 33, "4780": 33, "5522": 33, "2394": 33, "1264": 33, "backpropag": 33, "layer1_output_grad": 33, "layer2_output_grad": 33, "propag": 33, "2777": 33, "1917": 33, "1359": 33, "2426": 33, "1477": 33, "0748": 33, "1204": 33, "1260": 33, "2847": 33, "previous": 33, "doubl": 33, "23": 33, "belt": 33, "bare": 33, "bone": 33, "excit": 33, "automat": 33, "gpt": 33, "llm": 33, "gpt2sdpaattent": 33, "evenli": 33, "model_doc": 33, "aren": 33, "simpler": 33, "token_id": 33, "ntoken": 33, "338": 33, "3576": 33, "london": 33, "piec": 33, "miss": 33, "Of": 33, "behind": 33, "scene": 33, "guarante": 33, "arbitrari": 33, "broadcast": 33, "laguagemodel": 33, "max_length": 33, "truncat": 33, "29": 33, "token_ids_intervent": 33, "token_ids_origin": 33, "affect": 33, "neat": 33, "cool": 33, "transfer": 33, "placehold": 33, "onto": 33, "At": 33, "match": 33, "31": 33, "token_ids_1": 33, "token_ids_2": 33, "token_ids_3": 33, "npredict": 33, "32": 33, "llm_edit": 33, "33": 33, "democrat": 33, "half": 33, "fairli": 33, "straightforward": 33, "json": 33, "amp": 33, "37": 33, "4a6576dd": 33, "b5fd": 33, "4f1f": 33, "9836": 33, "a619f8277057": 33, "207": 33, "416": 33, "30mb": 33, "900": 33, "28ac8e47": 33, "fa48": 33, "45a1": 33, "acb0": 33, "3e17960e36b8": 33, "934": 33, "935": 33, "951": 33, "953": 33, "11mb": 33, "problem": 33, "689": 33, "667c4310": 33, "9041": 33, "451d": 33, "99a5": 33, "f713f639abb8": 33, "708": 33, "726": 33, "332": 33, "49mb": 33, "315": 33, "8734ee75": 33, "b616": 33, "4270": 33, "9d4d": 33, "7cfabd6d63a": 33, "334": 33, "342": 33, "354": 33, "06k": 33, "7mb": 33, "friendli": 33, "interfac": 33, "Ins": 33, "compl": 33, "551": 33, "5f0b434d": 33, "178d": 33, "4807": 33, "913f": 33, "331f403eb0ea": 33, "593": 33, "594": 33, "610": 33, "611": 33, "630": 33, "992": 33, "68mb": 33, "niec": 33, "bunch": 33, "someon": 33, "delv": 33, "cover": 33, "091": 33, "3e78f88a": 33, "e620": 33, "4679": 33, "ac73": 33, "abeb4f14ce8": 33, "146": 33, "166": 33, "704": 33, "6289": 33, "1172": 33, "6719": 33, "1816": 33, "2715": 33, "5547": 33, "2812": 33, "8086": 33, "5820": 33, "7070": 33, "1094": 33, "2910": 33, "6016": 33, "6602": 33, "4590": 33, "3477": 33, "3438": 33, "1797": 33, "0312": 33, "0469": 33, "7930": 33, "4141": 33, "853": 33, "0859": 33, "6523": 33, "1758": 33, "2637": 33, "5391": 33, "2422": 33, "7852": 33, "0625": 33, "5664": 33, "0781": 33, "2832": 33, "6406": 33, "4453": 33, "3379": 33, "3047": 33, "0156": 33, "7695": 33, "4023": 33, "983": 33, "5898": 33, "0547": 33, "6328": 33, "1709": 33, "2559": 33, "5234": 33, "2031": 33, "7617": 33, "5508": 33, "6680": 33, "2754": 33, "6211": 33, "4316": 33, "3281": 33, "2656": 33, "9688": 33, "7461": 33, "3906": 33, "5703": 33, "0234": 33, "6133": 33, "1660": 33, "2480": 33, "5078": 33, "1641": 33, "7383": 33, "5352": 33, "6484": 33, "2676": 33, "4180": 33, "3184": 33, "2266": 33, "9414": 33, "9531": 33, "7227": 33, "3789": 33, "9922": 33, "1611": 33, "2402": 33, "4922": 33, "7148": 33, "5195": 33, "2598": 33, "4844": 33, "3086": 33, "9141": 33, "9258": 33, "6992": 33, "374": 33, "5742": 33, "2334": 33, "4766": 33, "1016": 33, "6953": 33, "5039": 33, "2520": 33, "3945": 33, "2988": 33, "1484": 33, "8867": 33, "8984": 33, "6797": 33, "3555": 33, "755": 33, "9336": 33, "5586": 33, "1514": 33, "4629": 33, "0703": 33, "4883": 33, "2441": 33, "2891": 33, "8711": 33, "3457": 33, "757": 33, "5430": 33, "1465": 33, "2197": 33, "4492": 33, "0391": 33, "6562": 33, "4727": 33, "2363": 33, "8320": 33, "8438": 33, "3359": 33, "8789": 33, "5273": 33, "1426": 33, "2129": 33, "4355": 33, "0078": 33, "6367": 33, "2295": 33, "3594": 33, "2734": 33, "8203": 33, "8516": 33, "5117": 33, "1387": 33, "2061": 33, "4219": 33, "9766": 33, "2227": 33, "3164": 33, "901": 33, "133k": 33, "571kb": 33, "c1c6e24c": 33, "9f3f": 33, "415b": 33, "8f90": 33, "de8404fc2e74": 33, "539": 33, "572": 33, "695": 33, "31k": 33, "88mb": 33, "begin_of_text": 33, "203": 33, "88838ccd": 33, "230d": 33, "485b": 33, "8f57": 33, "8399453c2250": 33, "224": 33, "231": 33, "350": 33, "93mb": 33, "caveat": 33, "websit": 33, "twitter": 33, "ndif_team": 33, "star": 34, "walk": 34, "system": 35, "boundless": 36, "da": 36, "identifi": 36, "mechan": 36, "spars": 36, "price": 36, "tag": 36, "game": 36, "prealign": 36, "bigger": 36}, "objects": {"nnsight": [[2, 0, 0, "-", "contexts"], [3, 0, 0, "-", "envoy"], [4, 0, 0, "-", "intervention"], [5, 0, 0, "-", "models"], [6, 0, 0, "-", "patching"], [7, 0, 0, "-", "schema"], [8, 0, 0, "-", "tracing"], [9, 0, 0, "-", "util"]], "nnsight.contexts": [[2, 0, 0, "-", "Conditional"], [2, 0, 0, "-", "GraphBasedContext"], [2, 0, 0, "-", "Invoker"], [2, 0, 0, "-", "Tracer"], [2, 4, 1, "", "check_for_dependencies"], [2, 4, 1, "", "resolve_dependencies"]], "nnsight.contexts.Conditional": [[2, 1, 1, "", "Conditional"], [2, 1, 1, "", "ConditionalManager"]], "nnsight.contexts.Conditional.Conditional": [[2, 2, 1, "", "_condition"], [2, 2, 1, "", "_graph"]], "nnsight.contexts.Conditional.ConditionalManager": [[2, 2, 1, "", "_conditional_dict"], [2, 2, 1, "", "_conditional_stack"], [2, 2, 1, "", "_conditioned_nodes_dict"], [2, 3, 1, "", "add_conditioned_node"], [2, 3, 1, "", "get"], [2, 3, 1, "", "is_node_conditioned"], [2, 3, 1, "", "peek"], [2, 3, 1, "", "pop"], [2, 3, 1, "", "push"]], "nnsight.contexts.GraphBasedContext": [[2, 1, 1, "", "GlobalTracingContext"], [2, 1, 1, "", "GraphBasedContext"]], "nnsight.contexts.GraphBasedContext.GlobalTracingContext": [[2, 1, 1, "", "GlobalTracingExit"], [2, 1, 1, "", "GlobalTracingTorchHandler"], [2, 3, 1, "", "deregister"], [2, 3, 1, "", "register"], [2, 3, 1, "", "try_deregister"], [2, 3, 1, "", "try_register"]], "nnsight.contexts.GraphBasedContext.GraphBasedContext": [[2, 3, 1, "", "apply"], [2, 3, 1, "", "bool"], [2, 3, 1, "", "bridge_backend_handle"], [2, 3, 1, "", "bytearray"], [2, 3, 1, "", "bytes"], [2, 3, 1, "", "complex"], [2, 3, 1, "", "cond"], [2, 3, 1, "", "dict"], [2, 3, 1, "", "exit"], [2, 3, 1, "", "float"], [2, 3, 1, "", "int"], [2, 3, 1, "", "list"], [2, 3, 1, "", "log"], [2, 3, 1, "", "set"], [2, 3, 1, "", "str"], [2, 3, 1, "", "tuple"], [2, 3, 1, "", "vis"]], "nnsight.contexts.Invoker": [[2, 1, 1, "", "Invoker"]], "nnsight.contexts.Invoker.Invoker": [[2, 2, 1, "", "inputs"], [2, 2, 1, "", "kwargs"], [2, 2, 1, "", "scan"], [2, 2, 1, "", "scanning"], [2, 2, 1, "", "tracer"]], "nnsight.contexts.Tracer": [[2, 1, 1, "", "Tracer"]], "nnsight.contexts.Tracer.Tracer": [[2, 2, 1, "", "_args"], [2, 2, 1, "", "_graph"], [2, 2, 1, "", "_invoker"], [2, 2, 1, "", "_invoker_inputs"], [2, 2, 1, "", "_kwargs"], [2, 2, 1, "", "_model"], [2, 3, 1, "", "edit_backend_execute"], [2, 3, 1, "", "invoke"], [2, 3, 1, "", "local_backend_execute"], [2, 3, 1, "", "next"], [2, 3, 1, "", "remote_backend_get_model_key"], [2, 3, 1, "", "remote_backend_handle_result_value"], [2, 3, 1, "", "remote_backend_postprocess_result"]], "nnsight.contexts.session": [[2, 0, 0, "-", "Iterator"], [2, 0, 0, "-", "Session"]], "nnsight.contexts.session.Iterator": [[2, 1, 1, "", "Iterator"]], "nnsight.contexts.session.Session": [[2, 1, 1, "", "Session"]], "nnsight.contexts.session.Session.Session": [[2, 2, 1, "", "backend"], [2, 2, 1, "", "bridge"], [2, 2, 1, "", "graph"], [2, 3, 1, "", "iter"], [2, 3, 1, "", "local_backend_execute"], [2, 2, 1, "", "model"], [2, 3, 1, "", "remote_backend_get_model_key"], [2, 3, 1, "", "remote_backend_handle_result_value"], [2, 3, 1, "", "remote_backend_postprocess_result"]], "nnsight.envoy": [[3, 1, 1, "", "Envoy"]], "nnsight.envoy.Envoy": [[3, 2, 1, "", "_call_iter"], [3, 2, 1, "", "_fake_inputs"], [3, 2, 1, "", "_fake_outputs"], [3, 2, 1, "", "_tracer"], [3, 5, 1, "id0", "input"], [3, 5, 1, "", "inputs"], [3, 3, 1, "", "modules"], [3, 3, 1, "", "named_modules"], [3, 5, 1, "id1", "output"], [3, 2, 1, "", "path"], [3, 3, 1, "", "to"]], "nnsight.intervention": [[4, 1, 1, "", "HookHandler"], [4, 1, 1, "", "InterventionHandler"], [4, 1, 1, "", "InterventionProtocol"], [4, 1, 1, "", "InterventionProxy"]], "nnsight.intervention.HookHandler": [[4, 2, 1, "", "handles"], [4, 2, 1, "", "input_hook"], [4, 2, 1, "", "model"], [4, 2, 1, "", "modules"], [4, 2, 1, "", "output_hook"]], "nnsight.intervention.InterventionHandler": [[4, 3, 1, "", "count"]], "nnsight.intervention.InterventionProtocol": [[4, 3, 1, "", "add"], [4, 3, 1, "", "get_interventions"], [4, 3, 1, "", "intervene"], [4, 3, 1, "", "style"]], "nnsight.intervention.InterventionProxy": [[4, 5, 1, "", "device"], [4, 5, 1, "", "dtype"], [4, 5, 1, "", "grad"], [4, 3, 1, "", "save"], [4, 5, 1, "", "shape"], [4, 3, 1, "", "stop"], [4, 3, 1, "", "update"]], "nnsight.models": [[5, 0, 0, "-", "LanguageModel"], [5, 0, 0, "-", "NNsightModel"], [5, 0, 0, "-", "UnifiedTransformer"]], "nnsight.models.LanguageModel": [[5, 1, 1, "", "LanguageModel"], [5, 1, 1, "", "LanguageModelProxy"], [5, 1, 1, "", "TokenIndexer"]], "nnsight.models.LanguageModel.LanguageModel": [[5, 2, 1, "", "automodel"], [5, 2, 1, "", "config"], [5, 2, 1, "", "model"], [5, 2, 1, "", "proxy_class"], [5, 2, 1, "", "tokenizer"]], "nnsight.models.LanguageModel.LanguageModelProxy": [[5, 5, 1, "", "t"], [5, 5, 1, "", "token"]], "nnsight.models.NNsightModel": [[5, 1, 1, "", "MetaDispatcher"], [5, 1, 1, "", "NNsight"]], "nnsight.models.NNsightModel.NNsight": [[5, 2, 1, "", "_args"], [5, 2, 1, "", "_custom_model"], [5, 2, 1, "", "_dispatched"], [5, 2, 1, "", "_envoy"], [5, 2, 1, "", "_kwargs"], [5, 2, 1, "", "_model"], [5, 2, 1, "", "_model_key"], [5, 2, 1, "", "_session"], [5, 3, 1, "", "clear_edits"], [5, 3, 1, "", "dispatch_model"], [5, 3, 1, "", "edit"], [5, 3, 1, "", "interleave"], [5, 2, 1, "", "proxy_class"], [5, 3, 1, "", "scan"], [5, 3, 1, "", "session"], [5, 3, 1, "", "to"], [5, 3, 1, "", "trace"]], "nnsight.models.UnifiedTransformer": [[5, 1, 1, "", "UnifiedTransformer"]], "nnsight.patching": [[6, 1, 1, "", "Patch"], [6, 1, 1, "", "Patcher"]], "nnsight.patching.Patch": [[6, 2, 1, "", "obj"], [6, 2, 1, "", "parent"], [6, 3, 1, "", "patch"], [6, 2, 1, "", "replacement"], [6, 3, 1, "", "restore"]], "nnsight.patching.Patcher": [[6, 3, 1, "", "add"], [6, 2, 1, "", "patches"]], "nnsight.schema": [[7, 0, 0, "-", "Config"], [7, 0, 0, "-", "Response"]], "nnsight.schema.Config": [[7, 1, 1, "", "ApiConfigModel"], [7, 1, 1, "", "AppConfigModel"], [7, 1, 1, "", "ConfigModel"]], "nnsight.schema.Config.ApiConfigModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.Config.AppConfigModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.Config.ConfigModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.Response": [[7, 1, 1, "", "ResponseModel"], [7, 1, 1, "", "ResultModel"]], "nnsight.schema.Response.ResponseModel": [[7, 1, 1, "", "JobStatus"], [7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.Response.ResultModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format": [[7, 0, 0, "-", "functions"], [7, 0, 0, "-", "types"]], "nnsight.schema.format.types": [[7, 1, 1, "", "BaseNNsightModel"], [7, 1, 1, "", "DictModel"], [7, 1, 1, "", "EllipsisModel"], [7, 1, 1, "", "FunctionModel"], [7, 6, 1, "", "FunctionWhitelistError"], [7, 1, 1, "", "GraphModel"], [7, 1, 1, "", "IteratorModel"], [7, 1, 1, "", "ListModel"], [7, 1, 1, "", "NodeModel"], [7, 1, 1, "", "PrimitiveModel"], [7, 1, 1, "", "SessionModel"], [7, 1, 1, "", "SliceModel"], [7, 1, 1, "", "TensorModel"], [7, 1, 1, "", "TracerModel"], [7, 1, 1, "", "TupleModel"]], "nnsight.schema.format.types.BaseNNsightModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.DictModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.EllipsisModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.FunctionModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.GraphModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.IteratorModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.ListModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.NodeModel": [[7, 1, 1, "", "Reference"], [7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.NodeModel.Reference": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.PrimitiveModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.SessionModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.SliceModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.TensorModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.TracerModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.schema.format.types.TupleModel": [[7, 2, 1, "", "model_config"], [7, 2, 1, "", "model_fields"]], "nnsight.tracing": [[8, 0, 0, "-", "Bridge"], [8, 0, 0, "-", "Graph"], [8, 0, 0, "-", "Node"], [8, 0, 0, "-", "Proxy"], [8, 0, 0, "-", "protocols"]], "nnsight.tracing.Bridge": [[8, 1, 1, "", "Bridge"]], "nnsight.tracing.Bridge.Bridge": [[8, 3, 1, "", "add"], [8, 3, 1, "", "add_bridge_proxy"], [8, 2, 1, "", "bridged_nodes"], [8, 3, 1, "", "get_bridge_proxy"], [8, 3, 1, "", "get_graph"], [8, 2, 1, "", "graph_stack"], [8, 2, 1, "", "id_to_graph"], [8, 2, 1, "", "locks"], [8, 3, 1, "", "peek_graph"], [8, 3, 1, "", "pop_graph"]], "nnsight.tracing.Graph": [[8, 1, 1, "", "Graph"]], "nnsight.tracing.Graph.Graph": [[8, 3, 1, "", "add"], [8, 2, 1, "", "alive"], [8, 2, 1, "", "attachments"], [8, 3, 1, "", "copy"], [8, 3, 1, "", "create"], [8, 3, 1, "", "execute"], [8, 2, 1, "", "name_idx"], [8, 2, 1, "", "nodes"], [8, 3, 1, "", "reset"], [8, 2, 1, "", "sequential"], [8, 2, 1, "", "validate"], [8, 3, 1, "", "vis"]], "nnsight.tracing.Node": [[8, 1, 1, "", "Node"]], "nnsight.tracing.Node.Node": [[8, 2, 1, "", "arg_dependencies"], [8, 2, 1, "", "args"], [8, 3, 1, "", "attached"], [8, 3, 1, "", "clean"], [8, 2, 1, "", "cond_dependency"], [8, 3, 1, "", "create"], [8, 3, 1, "", "destroy"], [8, 3, 1, "", "done"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "executed"], [8, 3, 1, "", "fulfilled"], [8, 2, 1, "", "graph"], [8, 2, 1, "", "kwargs"], [8, 2, 1, "", "listeners"], [8, 2, 1, "", "name"], [8, 3, 1, "", "prepare_inputs"], [8, 3, 1, "", "preprocess"], [8, 2, 1, "", "proxy"], [8, 2, 1, "", "proxy_value"], [8, 3, 1, "", "redundant"], [8, 3, 1, "", "reset"], [8, 3, 1, "", "set_value"], [8, 2, 1, "", "target"], [8, 5, 1, "id0", "value"], [8, 3, 1, "", "visualize"]], "nnsight.tracing.Proxy": [[8, 1, 1, "", "Proxy"], [8, 4, 1, "", "proxy_wrapper"]], "nnsight.tracing.Proxy.Proxy": [[8, 2, 1, "", "node"], [8, 5, 1, "", "value"]], "nnsight.tracing.protocols": [[8, 1, 1, "", "ApplyModuleProtocol"], [8, 1, 1, "", "BridgeProtocol"], [8, 1, 1, "", "ConditionalProtocol"], [8, 1, 1, "", "EarlyStopProtocol"], [8, 1, 1, "", "GradProtocol"], [8, 1, 1, "", "LocalBackendExecuteProtocol"], [8, 1, 1, "", "LockProtocol"], [8, 1, 1, "", "Protocol"], [8, 1, 1, "", "SwapProtocol"], [8, 1, 1, "", "UpdateProtocol"], [8, 1, 1, "", "ValueProtocol"]], "nnsight.tracing.protocols.ApplyModuleProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "get_module"], [8, 3, 1, "", "set_module"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.BridgeProtocol": [[8, 6, 1, "", "BridgeException"], [8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "get_bridge"], [8, 3, 1, "", "has_bridge"], [8, 3, 1, "", "peek_graph"], [8, 3, 1, "", "set_bridge"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.ConditionalProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "add_conditioned_node"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "get_conditional"], [8, 3, 1, "", "has_conditional"], [8, 3, 1, "", "is_node_conditioned"], [8, 3, 1, "", "peek_conditional"], [8, 3, 1, "", "pop_conditional"], [8, 3, 1, "", "push_conditional"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.EarlyStopProtocol": [[8, 6, 1, "", "EarlyStopException"], [8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.GradProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "increment"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.LocalBackendExecuteProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.LockProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.Protocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.SwapProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "get_swap"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.UpdateProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.tracing.protocols.ValueProtocol": [[8, 3, 1, "", "add"], [8, 3, 1, "", "execute"], [8, 3, 1, "", "style"]], "nnsight.util": [[9, 1, 1, "", "WrapperModule"], [9, 4, 1, "", "apply"], [9, 4, 1, "", "fetch_attr"], [9, 4, 1, "", "wrap"]], "nnsight.util.WrapperModule": [[9, 3, 1, "", "forward"]]}, "objtypes": {"0": "py:module", "1": "py:class", "2": "py:attribute", "3": "py:method", "4": "py:function", "5": "py:property", "6": "py:exception"}, "objnames": {"0": ["py", "module", "Python module"], "1": ["py", "class", "Python class"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "method", "Python method"], "4": ["py", "function", "Python function"], "5": ["py", "property", "Python property"], "6": ["py", "exception", "Python exception"]}, "titleterms": {"about": 0, "nnsight": [0, 2, 3, 4, 5, 6, 7, 8, 9, 11], "an": 0, "api": 0, "transpar": 0, "scienc": 0, "black": 0, "box": 0, "ai": 0, "how": 0, "do": 0, "i": [0, 33], "us": 0, "what": 0, "happen": 0, "behind": 0, "scene": 0, "document": 1, "context": [2, 33], "envoi": 3, "intervent": [4, 12, 13, 18, 33], "model": [5, 20, 32, 33], "patch": [6, 28, 29], "schema": 7, "trace": [8, 33], "util": 9, "featur": 10, "condit": [12, 33], "cross": 13, "prompt": 13, "custom": [14, 33], "function": [14, 33], "earli": [15, 33], "stop": [15, 33], "get": [16, 33, 34], "valu": [16, 27], "gradient": [17, 33], "iter": 18, "lora": [19, 33], "edit": [20, 33], "modul": 21, "multipl": 22, "token": 22, "gener": 22, "oper": [23, 33], "remot": [24, 33], "execut": [24, 33], "scan": 25, "valid": 25, "session": [26, 33], "set": [27, 33], "activ": 28, "attribut": 29, "setup": [29, 30, 32], "ignor": [29, 30, 32], "boundless": 30, "da": 30, "price": 30, "tag": 30, "game": 30, "prealign": 30, "task": 30, "dictionari": 31, "learn": 31, "logit": 32, "len": 32, "introduct": 32, "gpt2": 32, "architectur": 32, "visual": 32, "gpt": 32, "2": [32, 33], "layer": 32, "interpret": 32, "walkthrough": 33, "1": 33, "first": [33, 34], "let": 33, "": 33, "start": [33, 34], "small": 33, "method": 33, "bigger": 33, "languagemodel": 33, "batch": 33, "next": 33, "3": 33, "thought": 33, "you": 33, "said": 33, "huge": 33, "loop": 33, "train": 33, "involv": 33, "instal": 34, "step": 34, "statu": 35, "tutori": 36}, "envversion": {"sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "nbsphinx": 4, "sphinx.ext.viewcode": 1, "sphinx": 60}, "alltitles": {"About NNsight": [[0, "about-nnsight"]], "An API for transparent science on black-box AI.": [[0, "an-api-for-transparent-science-on-black-box-ai"]], "How do I use NNsight?": [[0, "how-do-i-use-nnsight"]], "What happens behind the scenes?": [[0, "what-happens-behind-the-scenes"]], "Documentation": [[1, "documentation"]], "nnsight.contexts": [[2, "module-nnsight.contexts"]], "nnsight.envoy": [[3, "module-nnsight.envoy"]], "nnsight.intervention": [[4, "module-nnsight.intervention"]], "nnsight.models": [[5, "module-nnsight.models"]], "nnsight.patching": [[6, "module-nnsight.patching"]], "nnsight.schema": [[7, "module-nnsight.schema"]], "nnsight.tracing": [[8, "module-nnsight.tracing"]], "nnsight.util": [[9, "module-nnsight.util"]], "Features": [[10, "features"]], "nnsight": [[11, "nnsight"]], "Conditional Interventions": [[12, "Conditional-Interventions"], [33, "Conditional-Interventions"]], "Cross-Prompt Intervention": [[13, "Cross-Prompt-Intervention"]], "Custom Functions": [[14, "Custom-Functions"], [33, "Custom-Functions"]], "Early Stopping": [[15, "Early-Stopping"], [33, "Early-Stopping"]], "Getting Values": [[16, "Getting-Values"]], "Gradients": [[17, "Gradients"], [33, "Gradients"]], "Iterative Interventions": [[18, "Iterative-Interventions"]], "LoRA": [[19, "LoRA"]], "Model Editing": [[20, "Model-Editing"], [33, "Model-Editing"]], "Modules": [[21, "Modules"]], "Multiple Token Generation": [[22, "Multiple-Token-Generation"]], "Operations": [[23, "Operations"]], "Remote Execution": [[24, "Remote-Execution"]], "Scan and Validate": [[25, "Scan-and-Validate"]], "Sessions": [[26, "Sessions"], [33, "Sessions"]], "Setting Values": [[27, "Setting-Values"]], "Activation Patching": [[28, "Activation-Patching"]], "Attribution Patching": [[29, "Attribution-Patching"]], "Setup (Ignore)": [[29, "Setup-(Ignore)"], [30, "Setup-(Ignore)"], [32, "Setup-(Ignore)"]], "Boundless DAS": [[30, "Boundless-DAS"], [30, "id1"]], "Price Tagging game": [[30, "Price-Tagging-game"]], "Prealign Task": [[30, "Prealign-Task"]], "Dictionary Learning": [[31, "Dictionary-Learning"]], "Logit Lens": [[32, "Logit-Lens"]], "Introduction to Logit Lens": [[32, "Introduction-to-Logit-Lens"]], "GPT2 Model Architecture": [[32, "GPT2-Model-Architecture"]], "Visualizing GPT-2 Layer Interpretations": [[32, "Visualizing-GPT-2-Layer-Interpretations"]], "Walkthrough": [[33, "Walkthrough"]], "1\ufe0f\u20e3 First, let\u2019s start small": [[33, "1\ufe0f\u20e3-First,-let's-start-small"]], "Tracing Context": [[33, "Tracing-Context"]], "Getting": [[33, "Getting"]], "Functions, Methods, and Operations": [[33, "Functions,-Methods,-and-Operations"]], "Setting": [[33, "Setting"]], "2\ufe0f\u20e3 Bigger": [[33, "2\ufe0f\u20e3-Bigger"]], "LanguageModel": [[33, "LanguageModel"]], "Batching": [[33, "Batching"]], ".next()": [[33, ".next()"]], "3\ufe0f\u20e3 I thought you said huge models?": [[33, "3\ufe0f\u20e3-I-thought-you-said-huge-models?"]], "Remote execution": [[33, "Remote-execution"]], "Looping": [[33, "Looping"]], "Training a LoRA": [[33, "Training-a-LoRA"]], "Getting Involved!": [[33, "Getting-Involved!"]], "Getting Started": [[34, "getting-started"]], "Installation": [[34, "installation"]], "First Steps": [[34, "first-steps"]], "Status": [[35, "status"]], "Tutorials": [[36, "tutorials"]]}, "indexentries": {"conditional (class in nnsight.contexts.conditional)": [[2, "nnsight.contexts.Conditional.Conditional"]], "conditionalmanager (class in nnsight.contexts.conditional)": [[2, "nnsight.contexts.Conditional.ConditionalManager"]], "globaltracingcontext (class in nnsight.contexts.graphbasedcontext)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext"]], "globaltracingcontext.globaltracingexit (class in nnsight.contexts.graphbasedcontext)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.GlobalTracingExit"]], "globaltracingcontext.globaltracingtorchhandler (class in nnsight.contexts.graphbasedcontext)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.GlobalTracingTorchHandler"]], "graphbasedcontext (class in nnsight.contexts.graphbasedcontext)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext"]], "invoker (class in nnsight.contexts.invoker)": [[2, "nnsight.contexts.Invoker.Invoker"]], "iterator (class in nnsight.contexts.session.iterator)": [[2, "nnsight.contexts.session.Iterator.Iterator"]], "session (class in nnsight.contexts.session.session)": [[2, "nnsight.contexts.session.Session.Session"]], "tracer (class in nnsight.contexts.tracer)": [[2, "nnsight.contexts.Tracer.Tracer"]], "_args (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._args"]], "_condition (nnsight.contexts.conditional.conditional attribute)": [[2, "nnsight.contexts.Conditional.Conditional._condition"]], "_conditional_dict (nnsight.contexts.conditional.conditionalmanager attribute)": [[2, "nnsight.contexts.Conditional.ConditionalManager._conditional_dict"]], "_conditional_stack (nnsight.contexts.conditional.conditionalmanager attribute)": [[2, "nnsight.contexts.Conditional.ConditionalManager._conditional_stack"]], "_conditioned_nodes_dict (nnsight.contexts.conditional.conditionalmanager attribute)": [[2, "nnsight.contexts.Conditional.ConditionalManager._conditioned_nodes_dict"]], "_graph (nnsight.contexts.conditional.conditional attribute)": [[2, "nnsight.contexts.Conditional.Conditional._graph"]], "_graph (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._graph"]], "_invoker (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._invoker"]], "_invoker_inputs (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._invoker_inputs"]], "_kwargs (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._kwargs"]], "_model (nnsight.contexts.tracer.tracer attribute)": [[2, "nnsight.contexts.Tracer.Tracer._model"]], "add_conditioned_node() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.add_conditioned_node"]], "apply() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.apply"]], "backend (nnsight.contexts.session.session.session attribute)": [[2, "nnsight.contexts.session.Session.Session.backend"]], "bool() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.bool"]], "bridge (nnsight.contexts.session.session.session attribute)": [[2, "nnsight.contexts.session.Session.Session.bridge"]], "bridge_backend_handle() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.bridge_backend_handle"]], "bytearray() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.bytearray"]], "bytes() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.bytes"]], "check_for_dependencies() (in module nnsight.contexts)": [[2, "nnsight.contexts.check_for_dependencies"]], "complex() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.complex"]], "cond() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.cond"]], "deregister() (nnsight.contexts.graphbasedcontext.globaltracingcontext static method)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.deregister"]], "dict() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.dict"]], "edit_backend_execute() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.edit_backend_execute"]], "exit() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.exit"]], "float() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.float"]], "get() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.get"]], "graph (nnsight.contexts.session.session.session attribute)": [[2, "nnsight.contexts.session.Session.Session.graph"]], "inputs (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.inputs"]], "int() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.int"]], "invoke() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.invoke"]], "is_node_conditioned() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.is_node_conditioned"]], "iter() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.iter"]], "kwargs (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.kwargs"]], "list() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.list"]], "local_backend_execute() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.local_backend_execute"]], "local_backend_execute() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.local_backend_execute"]], "log() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.log"]], "model (nnsight.contexts.session.session.session attribute)": [[2, "nnsight.contexts.session.Session.Session.model"]], "module": [[2, "module-nnsight.contexts"], [2, "module-nnsight.contexts.Conditional"], [2, "module-nnsight.contexts.GraphBasedContext"], [2, "module-nnsight.contexts.Invoker"], [2, "module-nnsight.contexts.Tracer"], [2, "module-nnsight.contexts.session.Iterator"], [2, "module-nnsight.contexts.session.Session"], [3, "module-nnsight.envoy"], [4, "module-nnsight.intervention"], [5, "module-nnsight.models"], [5, "module-nnsight.models.LanguageModel"], [5, "module-nnsight.models.NNsightModel"], [5, "module-nnsight.models.UnifiedTransformer"], [6, "module-nnsight.patching"], [7, "module-nnsight.schema"], [7, "module-nnsight.schema.Config"], [7, "module-nnsight.schema.Response"], [7, "module-nnsight.schema.format.functions"], [7, "module-nnsight.schema.format.types"], [8, "module-nnsight.tracing"], [8, "module-nnsight.tracing.Bridge"], [8, "module-nnsight.tracing.Graph"], [8, "module-nnsight.tracing.Node"], [8, "module-nnsight.tracing.Proxy"], [8, "module-nnsight.tracing.protocols"], [9, "module-nnsight.util"]], "next() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.next"]], "nnsight.contexts": [[2, "module-nnsight.contexts"]], "nnsight.contexts.conditional": [[2, "module-nnsight.contexts.Conditional"]], "nnsight.contexts.graphbasedcontext": [[2, "module-nnsight.contexts.GraphBasedContext"]], "nnsight.contexts.invoker": [[2, "module-nnsight.contexts.Invoker"]], "nnsight.contexts.tracer": [[2, "module-nnsight.contexts.Tracer"]], "nnsight.contexts.session.iterator": [[2, "module-nnsight.contexts.session.Iterator"]], "nnsight.contexts.session.session": [[2, "module-nnsight.contexts.session.Session"]], "peek() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.peek"]], "pop() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.pop"]], "push() (nnsight.contexts.conditional.conditionalmanager method)": [[2, "nnsight.contexts.Conditional.ConditionalManager.push"]], "register() (nnsight.contexts.graphbasedcontext.globaltracingcontext static method)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.register"]], "remote_backend_get_model_key() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.remote_backend_get_model_key"]], "remote_backend_get_model_key() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.remote_backend_get_model_key"]], "remote_backend_handle_result_value() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.remote_backend_handle_result_value"]], "remote_backend_handle_result_value() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.remote_backend_handle_result_value"]], "remote_backend_postprocess_result() (nnsight.contexts.tracer.tracer method)": [[2, "nnsight.contexts.Tracer.Tracer.remote_backend_postprocess_result"]], "remote_backend_postprocess_result() (nnsight.contexts.session.session.session method)": [[2, "nnsight.contexts.session.Session.Session.remote_backend_postprocess_result"]], "resolve_dependencies() (in module nnsight.contexts)": [[2, "nnsight.contexts.resolve_dependencies"]], "scan (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.scan"]], "scanning (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.scanning"]], "set() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.set"]], "str() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.str"]], "tracer (nnsight.contexts.invoker.invoker attribute)": [[2, "nnsight.contexts.Invoker.Invoker.tracer"]], "try_deregister() (nnsight.contexts.graphbasedcontext.globaltracingcontext static method)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.try_deregister"]], "try_register() (nnsight.contexts.graphbasedcontext.globaltracingcontext static method)": [[2, "nnsight.contexts.GraphBasedContext.GlobalTracingContext.try_register"]], "tuple() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.tuple"]], "vis() (nnsight.contexts.graphbasedcontext.graphbasedcontext method)": [[2, "nnsight.contexts.GraphBasedContext.GraphBasedContext.vis"]], "envoy (class in nnsight.envoy)": [[3, "nnsight.envoy.Envoy"]], "_call_iter (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy._call_iter"]], "_fake_inputs (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy._fake_inputs"]], "_fake_outputs (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy._fake_outputs"]], "_tracer (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy._tracer"]], "input (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy.input"]], "input (nnsight.envoy.envoy property)": [[3, "id0"]], "inputs (nnsight.envoy.envoy property)": [[3, "nnsight.envoy.Envoy.inputs"]], "modules() (nnsight.envoy.envoy method)": [[3, "nnsight.envoy.Envoy.modules"]], "named_modules() (nnsight.envoy.envoy method)": [[3, "nnsight.envoy.Envoy.named_modules"]], "nnsight.envoy": [[3, "module-nnsight.envoy"]], "output (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy.output"]], "output (nnsight.envoy.envoy property)": [[3, "id1"]], "path (nnsight.envoy.envoy attribute)": [[3, "nnsight.envoy.Envoy.path"]], "to() (nnsight.envoy.envoy method)": [[3, "nnsight.envoy.Envoy.to"]], "hookhandler (class in nnsight.intervention)": [[4, "nnsight.intervention.HookHandler"]], "interventionhandler (class in nnsight.intervention)": [[4, "nnsight.intervention.InterventionHandler"]], "interventionprotocol (class in nnsight.intervention)": [[4, "nnsight.intervention.InterventionProtocol"]], "interventionproxy (class in nnsight.intervention)": [[4, "nnsight.intervention.InterventionProxy"]], "add() (nnsight.intervention.interventionprotocol class method)": [[4, "nnsight.intervention.InterventionProtocol.add"]], "count() (nnsight.intervention.interventionhandler method)": [[4, "nnsight.intervention.InterventionHandler.count"]], "device (nnsight.intervention.interventionproxy property)": [[4, "nnsight.intervention.InterventionProxy.device"]], "dtype (nnsight.intervention.interventionproxy property)": [[4, "nnsight.intervention.InterventionProxy.dtype"]], "get_interventions() (nnsight.intervention.interventionprotocol class method)": [[4, "nnsight.intervention.InterventionProtocol.get_interventions"]], "grad (nnsight.intervention.interventionproxy property)": [[4, "nnsight.intervention.InterventionProxy.grad"]], "handles (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.handles"]], "input_hook (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.input_hook"]], "intervene() (nnsight.intervention.interventionprotocol class method)": [[4, "nnsight.intervention.InterventionProtocol.intervene"]], "model (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.model"]], "modules (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.modules"]], "nnsight.intervention": [[4, "module-nnsight.intervention"]], "output_hook (nnsight.intervention.hookhandler attribute)": [[4, "nnsight.intervention.HookHandler.output_hook"]], "save() (nnsight.intervention.interventionproxy method)": [[4, "nnsight.intervention.InterventionProxy.save"]], "shape (nnsight.intervention.interventionproxy property)": [[4, "nnsight.intervention.InterventionProxy.shape"]], "stop() (nnsight.intervention.interventionproxy method)": [[4, "nnsight.intervention.InterventionProxy.stop"]], "style() (nnsight.intervention.interventionprotocol class method)": [[4, "nnsight.intervention.InterventionProtocol.style"]], "update() (nnsight.intervention.interventionproxy method)": [[4, "nnsight.intervention.InterventionProxy.update"]], "languagemodel (class in nnsight.models.languagemodel)": [[5, "nnsight.models.LanguageModel.LanguageModel"]], "languagemodelproxy (class in nnsight.models.languagemodel)": [[5, "nnsight.models.LanguageModel.LanguageModelProxy"]], "metadispatcher (class in nnsight.models.nnsightmodel)": [[5, "nnsight.models.NNsightModel.MetaDispatcher"]], "nnsight (class in nnsight.models.nnsightmodel)": [[5, "nnsight.models.NNsightModel.NNsight"]], "tokenindexer (class in nnsight.models.languagemodel)": [[5, "nnsight.models.LanguageModel.TokenIndexer"]], "unifiedtransformer (class in nnsight.models.unifiedtransformer)": [[5, "nnsight.models.UnifiedTransformer.UnifiedTransformer"]], "_args (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._args"]], "_custom_model (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._custom_model"]], "_dispatched (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._dispatched"]], "_envoy (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._envoy"]], "_kwargs (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._kwargs"]], "_model (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._model"]], "_model_key (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._model_key"]], "_session (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight._session"]], "automodel (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.automodel"]], "clear_edits() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.clear_edits"]], "config (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.config"]], "dispatch_model() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.dispatch_model"]], "edit() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.edit"]], "interleave() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.interleave"]], "model (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.model"]], "nnsight.models": [[5, "module-nnsight.models"]], "nnsight.models.languagemodel": [[5, "module-nnsight.models.LanguageModel"]], "nnsight.models.nnsightmodel": [[5, "module-nnsight.models.NNsightModel"]], "nnsight.models.unifiedtransformer": [[5, "module-nnsight.models.UnifiedTransformer"]], "proxy_class (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.proxy_class"]], "proxy_class (nnsight.models.nnsightmodel.nnsight attribute)": [[5, "nnsight.models.NNsightModel.NNsight.proxy_class"]], "scan() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.scan"]], "session() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.session"]], "t (nnsight.models.languagemodel.languagemodelproxy property)": [[5, "nnsight.models.LanguageModel.LanguageModelProxy.t"]], "to() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.to"]], "token (nnsight.models.languagemodel.languagemodelproxy property)": [[5, "nnsight.models.LanguageModel.LanguageModelProxy.token"]], "tokenizer (nnsight.models.languagemodel.languagemodel attribute)": [[5, "nnsight.models.LanguageModel.LanguageModel.tokenizer"]], "trace() (nnsight.models.nnsightmodel.nnsight method)": [[5, "nnsight.models.NNsightModel.NNsight.trace"]], "patch (class in nnsight.patching)": [[6, "nnsight.patching.Patch"]], "patcher (class in nnsight.patching)": [[6, "nnsight.patching.Patcher"]], "add() (nnsight.patching.patcher method)": [[6, "nnsight.patching.Patcher.add"]], "nnsight.patching": [[6, "module-nnsight.patching"]], "obj (nnsight.patching.patch attribute)": [[6, "nnsight.patching.Patch.obj"]], "parent (nnsight.patching.patch attribute)": [[6, "nnsight.patching.Patch.parent"]], "patch() (nnsight.patching.patch method)": [[6, "nnsight.patching.Patch.patch"]], "patches (nnsight.patching.patcher attribute)": [[6, "nnsight.patching.Patcher.patches"]], "replacement (nnsight.patching.patch attribute)": [[6, "nnsight.patching.Patch.replacement"]], "restore() (nnsight.patching.patch method)": [[6, "nnsight.patching.Patch.restore"]], "apiconfigmodel (class in nnsight.schema.config)": [[7, "nnsight.schema.Config.ApiConfigModel"]], "appconfigmodel (class in nnsight.schema.config)": [[7, "nnsight.schema.Config.AppConfigModel"]], "basennsightmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.BaseNNsightModel"]], "configmodel (class in nnsight.schema.config)": [[7, "nnsight.schema.Config.ConfigModel"]], "dictmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.DictModel"]], "ellipsismodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.EllipsisModel"]], "functionmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.FunctionModel"]], "functionwhitelisterror": [[7, "nnsight.schema.format.types.FunctionWhitelistError"]], "graphmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.GraphModel"]], "iteratormodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.IteratorModel"]], "listmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.ListModel"]], "nodemodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.NodeModel"]], "nodemodel.reference (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.NodeModel.Reference"]], "primitivemodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.PrimitiveModel"]], "responsemodel (class in nnsight.schema.response)": [[7, "nnsight.schema.Response.ResponseModel"]], "responsemodel.jobstatus (class in nnsight.schema.response)": [[7, "nnsight.schema.Response.ResponseModel.JobStatus"]], "resultmodel (class in nnsight.schema.response)": [[7, "nnsight.schema.Response.ResultModel"]], "sessionmodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.SessionModel"]], "slicemodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.SliceModel"]], "tensormodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.TensorModel"]], "tracermodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.TracerModel"]], "tuplemodel (class in nnsight.schema.format.types)": [[7, "nnsight.schema.format.types.TupleModel"]], "model_config (nnsight.schema.config.apiconfigmodel attribute)": [[7, "nnsight.schema.Config.ApiConfigModel.model_config"]], "model_config (nnsight.schema.config.appconfigmodel attribute)": [[7, "nnsight.schema.Config.AppConfigModel.model_config"]], "model_config (nnsight.schema.config.configmodel attribute)": [[7, "nnsight.schema.Config.ConfigModel.model_config"]], "model_config (nnsight.schema.response.responsemodel attribute)": [[7, "nnsight.schema.Response.ResponseModel.model_config"]], "model_config (nnsight.schema.response.resultmodel attribute)": [[7, "nnsight.schema.Response.ResultModel.model_config"]], "model_config (nnsight.schema.format.types.basennsightmodel attribute)": [[7, "nnsight.schema.format.types.BaseNNsightModel.model_config"]], "model_config (nnsight.schema.format.types.dictmodel attribute)": [[7, "nnsight.schema.format.types.DictModel.model_config"]], "model_config (nnsight.schema.format.types.ellipsismodel attribute)": [[7, "nnsight.schema.format.types.EllipsisModel.model_config"]], "model_config (nnsight.schema.format.types.functionmodel attribute)": [[7, "nnsight.schema.format.types.FunctionModel.model_config"]], "model_config (nnsight.schema.format.types.graphmodel attribute)": [[7, "nnsight.schema.format.types.GraphModel.model_config"]], "model_config (nnsight.schema.format.types.iteratormodel attribute)": [[7, "nnsight.schema.format.types.IteratorModel.model_config"]], "model_config (nnsight.schema.format.types.listmodel attribute)": [[7, "nnsight.schema.format.types.ListModel.model_config"]], "model_config (nnsight.schema.format.types.nodemodel attribute)": [[7, "nnsight.schema.format.types.NodeModel.model_config"]], "model_config (nnsight.schema.format.types.nodemodel.reference attribute)": [[7, "nnsight.schema.format.types.NodeModel.Reference.model_config"]], "model_config (nnsight.schema.format.types.primitivemodel attribute)": [[7, "nnsight.schema.format.types.PrimitiveModel.model_config"]], "model_config (nnsight.schema.format.types.sessionmodel attribute)": [[7, "nnsight.schema.format.types.SessionModel.model_config"]], "model_config (nnsight.schema.format.types.slicemodel attribute)": [[7, "nnsight.schema.format.types.SliceModel.model_config"]], "model_config (nnsight.schema.format.types.tensormodel attribute)": [[7, "nnsight.schema.format.types.TensorModel.model_config"]], "model_config (nnsight.schema.format.types.tracermodel attribute)": [[7, "nnsight.schema.format.types.TracerModel.model_config"]], "model_config (nnsight.schema.format.types.tuplemodel attribute)": [[7, "nnsight.schema.format.types.TupleModel.model_config"]], "model_fields (nnsight.schema.config.apiconfigmodel attribute)": [[7, "nnsight.schema.Config.ApiConfigModel.model_fields"]], "model_fields (nnsight.schema.config.appconfigmodel attribute)": [[7, "nnsight.schema.Config.AppConfigModel.model_fields"]], "model_fields (nnsight.schema.config.configmodel attribute)": [[7, "nnsight.schema.Config.ConfigModel.model_fields"]], "model_fields (nnsight.schema.response.responsemodel attribute)": [[7, "nnsight.schema.Response.ResponseModel.model_fields"]], "model_fields (nnsight.schema.response.resultmodel attribute)": [[7, "nnsight.schema.Response.ResultModel.model_fields"]], "model_fields (nnsight.schema.format.types.basennsightmodel attribute)": [[7, "nnsight.schema.format.types.BaseNNsightModel.model_fields"]], "model_fields (nnsight.schema.format.types.dictmodel attribute)": [[7, "nnsight.schema.format.types.DictModel.model_fields"]], "model_fields (nnsight.schema.format.types.ellipsismodel attribute)": [[7, "nnsight.schema.format.types.EllipsisModel.model_fields"]], "model_fields (nnsight.schema.format.types.functionmodel attribute)": [[7, "nnsight.schema.format.types.FunctionModel.model_fields"]], "model_fields (nnsight.schema.format.types.graphmodel attribute)": [[7, "nnsight.schema.format.types.GraphModel.model_fields"]], "model_fields (nnsight.schema.format.types.iteratormodel attribute)": [[7, "nnsight.schema.format.types.IteratorModel.model_fields"]], "model_fields (nnsight.schema.format.types.listmodel attribute)": [[7, "nnsight.schema.format.types.ListModel.model_fields"]], "model_fields (nnsight.schema.format.types.nodemodel attribute)": [[7, "nnsight.schema.format.types.NodeModel.model_fields"]], "model_fields (nnsight.schema.format.types.nodemodel.reference attribute)": [[7, "nnsight.schema.format.types.NodeModel.Reference.model_fields"]], "model_fields (nnsight.schema.format.types.primitivemodel attribute)": [[7, "nnsight.schema.format.types.PrimitiveModel.model_fields"]], "model_fields (nnsight.schema.format.types.sessionmodel attribute)": [[7, "nnsight.schema.format.types.SessionModel.model_fields"]], "model_fields (nnsight.schema.format.types.slicemodel attribute)": [[7, "nnsight.schema.format.types.SliceModel.model_fields"]], "model_fields (nnsight.schema.format.types.tensormodel attribute)": [[7, "nnsight.schema.format.types.TensorModel.model_fields"]], "model_fields (nnsight.schema.format.types.tracermodel attribute)": [[7, "nnsight.schema.format.types.TracerModel.model_fields"]], "model_fields (nnsight.schema.format.types.tuplemodel attribute)": [[7, "nnsight.schema.format.types.TupleModel.model_fields"]], "nnsight.schema": [[7, "module-nnsight.schema"]], "nnsight.schema.config": [[7, "module-nnsight.schema.Config"]], "nnsight.schema.response": [[7, "module-nnsight.schema.Response"]], "nnsight.schema.format.functions": [[7, "module-nnsight.schema.format.functions"]], "nnsight.schema.format.types": [[7, "module-nnsight.schema.format.types"]], "applymoduleprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol"]], "bridge (class in nnsight.tracing.bridge)": [[8, "nnsight.tracing.Bridge.Bridge"]], "bridgeprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.BridgeProtocol"]], "bridgeprotocol.bridgeexception": [[8, "nnsight.tracing.protocols.BridgeProtocol.BridgeException"]], "conditionalprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.ConditionalProtocol"]], "earlystopprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.EarlyStopProtocol"]], "earlystopprotocol.earlystopexception": [[8, "nnsight.tracing.protocols.EarlyStopProtocol.EarlyStopException"]], "gradprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.GradProtocol"]], "graph (class in nnsight.tracing.graph)": [[8, "nnsight.tracing.Graph.Graph"]], "localbackendexecuteprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.LocalBackendExecuteProtocol"]], "lockprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.LockProtocol"]], "node (class in nnsight.tracing.node)": [[8, "nnsight.tracing.Node.Node"]], "protocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.Protocol"]], "proxy (class in nnsight.tracing.proxy)": [[8, "nnsight.tracing.Proxy.Proxy"]], "swapprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.SwapProtocol"]], "updateprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.UpdateProtocol"]], "valueprotocol (class in nnsight.tracing.protocols)": [[8, "nnsight.tracing.protocols.ValueProtocol"]], "add() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.add"]], "add() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.add"]], "add() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.add"]], "add() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.add"]], "add() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.add"]], "add() (nnsight.tracing.protocols.earlystopprotocol class method)": [[8, "nnsight.tracing.protocols.EarlyStopProtocol.add"]], "add() (nnsight.tracing.protocols.gradprotocol class method)": [[8, "nnsight.tracing.protocols.GradProtocol.add"]], "add() (nnsight.tracing.protocols.localbackendexecuteprotocol class method)": [[8, "nnsight.tracing.protocols.LocalBackendExecuteProtocol.add"]], "add() (nnsight.tracing.protocols.lockprotocol class method)": [[8, "nnsight.tracing.protocols.LockProtocol.add"]], "add() (nnsight.tracing.protocols.protocol class method)": [[8, "nnsight.tracing.protocols.Protocol.add"]], "add() (nnsight.tracing.protocols.swapprotocol class method)": [[8, "nnsight.tracing.protocols.SwapProtocol.add"]], "add() (nnsight.tracing.protocols.updateprotocol class method)": [[8, "nnsight.tracing.protocols.UpdateProtocol.add"]], "add() (nnsight.tracing.protocols.valueprotocol class method)": [[8, "nnsight.tracing.protocols.ValueProtocol.add"]], "add_bridge_proxy() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.add_bridge_proxy"]], "add_conditioned_node() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.add_conditioned_node"]], "alive (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.alive"]], "arg_dependencies (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.arg_dependencies"]], "args (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.args"]], "attached() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.attached"]], "attachments (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.attachments"]], "bridged_nodes (nnsight.tracing.bridge.bridge attribute)": [[8, "nnsight.tracing.Bridge.Bridge.bridged_nodes"]], "clean() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.clean"]], "cond_dependency (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.cond_dependency"]], "copy() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.copy"]], "create() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.create"]], "create() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.create"]], "destroy() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.destroy"]], "done() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.done"]], "execute() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.execute"]], "execute() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.execute"]], "execute() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.execute"]], "execute() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.execute"]], "execute() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.execute"]], "execute() (nnsight.tracing.protocols.earlystopprotocol class method)": [[8, "nnsight.tracing.protocols.EarlyStopProtocol.execute"]], "execute() (nnsight.tracing.protocols.gradprotocol class method)": [[8, "nnsight.tracing.protocols.GradProtocol.execute"]], "execute() (nnsight.tracing.protocols.localbackendexecuteprotocol class method)": [[8, "nnsight.tracing.protocols.LocalBackendExecuteProtocol.execute"]], "execute() (nnsight.tracing.protocols.protocol class method)": [[8, "nnsight.tracing.protocols.Protocol.execute"]], "execute() (nnsight.tracing.protocols.swapprotocol class method)": [[8, "nnsight.tracing.protocols.SwapProtocol.execute"]], "execute() (nnsight.tracing.protocols.updateprotocol class method)": [[8, "nnsight.tracing.protocols.UpdateProtocol.execute"]], "execute() (nnsight.tracing.protocols.valueprotocol class method)": [[8, "nnsight.tracing.protocols.ValueProtocol.execute"]], "executed() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.executed"]], "fulfilled() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.fulfilled"]], "get_bridge() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.get_bridge"]], "get_bridge_proxy() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.get_bridge_proxy"]], "get_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.get_conditional"]], "get_graph() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.get_graph"]], "get_module() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.get_module"]], "get_swap() (nnsight.tracing.protocols.swapprotocol class method)": [[8, "nnsight.tracing.protocols.SwapProtocol.get_swap"]], "graph (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.graph"]], "graph_stack (nnsight.tracing.bridge.bridge attribute)": [[8, "nnsight.tracing.Bridge.Bridge.graph_stack"]], "has_bridge() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.has_bridge"]], "has_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.has_conditional"]], "id_to_graph (nnsight.tracing.bridge.bridge attribute)": [[8, "nnsight.tracing.Bridge.Bridge.id_to_graph"]], "increment() (nnsight.tracing.protocols.gradprotocol class method)": [[8, "nnsight.tracing.protocols.GradProtocol.increment"]], "is_node_conditioned() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.is_node_conditioned"]], "kwargs (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.kwargs"]], "listeners (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.listeners"]], "locks (nnsight.tracing.bridge.bridge attribute)": [[8, "nnsight.tracing.Bridge.Bridge.locks"]], "name (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.name"]], "name_idx (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.name_idx"]], "nnsight.tracing": [[8, "module-nnsight.tracing"]], "nnsight.tracing.bridge": [[8, "module-nnsight.tracing.Bridge"]], "nnsight.tracing.graph": [[8, "module-nnsight.tracing.Graph"]], "nnsight.tracing.node": [[8, "module-nnsight.tracing.Node"]], "nnsight.tracing.proxy": [[8, "module-nnsight.tracing.Proxy"]], "nnsight.tracing.protocols": [[8, "module-nnsight.tracing.protocols"]], "node (nnsight.tracing.proxy.proxy attribute)": [[8, "nnsight.tracing.Proxy.Proxy.node"]], "nodes (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.nodes"]], "peek_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.peek_conditional"]], "peek_graph() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.peek_graph"]], "peek_graph() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.peek_graph"]], "pop_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.pop_conditional"]], "pop_graph() (nnsight.tracing.bridge.bridge method)": [[8, "nnsight.tracing.Bridge.Bridge.pop_graph"]], "prepare_inputs() (nnsight.tracing.node.node class method)": [[8, "nnsight.tracing.Node.Node.prepare_inputs"]], "preprocess() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.preprocess"]], "proxy (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.proxy"]], "proxy_value (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.proxy_value"]], "proxy_wrapper() (in module nnsight.tracing.proxy)": [[8, "nnsight.tracing.Proxy.proxy_wrapper"]], "push_conditional() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.push_conditional"]], "redundant() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.redundant"]], "reset() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.reset"]], "reset() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.reset"]], "sequential (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.sequential"]], "set_bridge() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.set_bridge"]], "set_module() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.set_module"]], "set_value() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.set_value"]], "style() (nnsight.tracing.protocols.applymoduleprotocol class method)": [[8, "nnsight.tracing.protocols.ApplyModuleProtocol.style"]], "style() (nnsight.tracing.protocols.bridgeprotocol class method)": [[8, "nnsight.tracing.protocols.BridgeProtocol.style"]], "style() (nnsight.tracing.protocols.conditionalprotocol class method)": [[8, "nnsight.tracing.protocols.ConditionalProtocol.style"]], "style() (nnsight.tracing.protocols.earlystopprotocol class method)": [[8, "nnsight.tracing.protocols.EarlyStopProtocol.style"]], "style() (nnsight.tracing.protocols.gradprotocol class method)": [[8, "nnsight.tracing.protocols.GradProtocol.style"]], "style() (nnsight.tracing.protocols.localbackendexecuteprotocol class method)": [[8, "nnsight.tracing.protocols.LocalBackendExecuteProtocol.style"]], "style() (nnsight.tracing.protocols.lockprotocol class method)": [[8, "nnsight.tracing.protocols.LockProtocol.style"]], "style() (nnsight.tracing.protocols.protocol class method)": [[8, "nnsight.tracing.protocols.Protocol.style"]], "style() (nnsight.tracing.protocols.swapprotocol class method)": [[8, "nnsight.tracing.protocols.SwapProtocol.style"]], "style() (nnsight.tracing.protocols.updateprotocol class method)": [[8, "nnsight.tracing.protocols.UpdateProtocol.style"]], "style() (nnsight.tracing.protocols.valueprotocol class method)": [[8, "nnsight.tracing.protocols.ValueProtocol.style"]], "target (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.target"]], "validate (nnsight.tracing.graph.graph attribute)": [[8, "nnsight.tracing.Graph.Graph.validate"]], "value (nnsight.tracing.node.node attribute)": [[8, "nnsight.tracing.Node.Node.value"]], "value (nnsight.tracing.node.node property)": [[8, "id0"]], "value (nnsight.tracing.proxy.proxy property)": [[8, "nnsight.tracing.Proxy.Proxy.value"]], "vis() (nnsight.tracing.graph.graph method)": [[8, "nnsight.tracing.Graph.Graph.vis"]], "visualize() (nnsight.tracing.node.node method)": [[8, "nnsight.tracing.Node.Node.visualize"]], "wrappermodule (class in nnsight.util)": [[9, "nnsight.util.WrapperModule"]], "apply() (in module nnsight.util)": [[9, "nnsight.util.apply"]], "fetch_attr() (in module nnsight.util)": [[9, "nnsight.util.fetch_attr"]], "forward() (nnsight.util.wrappermodule method)": [[9, "nnsight.util.WrapperModule.forward"]], "nnsight.util": [[9, "module-nnsight.util"]], "wrap() (in module nnsight.util)": [[9, "nnsight.util.wrap"]]}}) \ No newline at end of file diff --git a/public/start/index.html b/public/start/index.html index 26b8f64..7b70eb5 100644 --- a/public/start/index.html +++ b/public/start/index.html @@ -57,8 +57,8 @@ - - + + diff --git a/public/status/index.html b/public/status/index.html index 92c4dd2..d3f7743 100644 --- a/public/status/index.html +++ b/public/status/index.html @@ -55,8 +55,8 @@ - - + + diff --git a/public/tutorials/index.html b/public/tutorials/index.html index d2dbb9e..64d5891 100644 --- a/public/tutorials/index.html +++ b/public/tutorials/index.html @@ -57,8 +57,8 @@ - - + +