
Commit 64231d0

Merge pull request #225 from stanfordnlp/olmo2
Add OLMo2 and Qwen3 models
2 parents 4f812ef + 1d83080

File tree

5 files changed: +181 -0 lines changed

pyvene/models/intervenable_modelcard.py
pyvene/models/olmo2/__init__.py
pyvene/models/olmo2/modelings_intervenable_olmo2.py
pyvene/models/qwen3/__init__.py
pyvene/models/qwen3/modelings_intervenable_qwen3.py

pyvene/models/intervenable_modelcard.py

Lines changed: 10 additions & 0 deletions

@@ -14,6 +14,8 @@
 from .llava.modelings_intervenable_llava import *
 from .qwen2.modelings_intervenable_qwen2 import *
 from .olmo.modelings_intervenable_olmo import *
+from .olmo2.modelings_intervenable_olmo2 import *
+from .qwen3.modelings_intervenable_qwen3 import *
 from .esm.modelings_intervenable_esm import *
 from .mllama.modelings_intervenable_mllama import *
 from .gpt_oss.modelings_intervenable_gpt_oss import *
@@ -67,6 +69,10 @@
     hf_models.gemma2.modeling_gemma2.Gemma2ForCausalLM: gemma2_lm_type_to_module_mapping,
     hf_models.olmo.modeling_olmo.OlmoModel: olmo_type_to_module_mapping,
     hf_models.olmo.modeling_olmo.OlmoForCausalLM: olmo_lm_type_to_module_mapping,
+    hf_models.olmo2.modeling_olmo2.Olmo2Model: olmo2_type_to_module_mapping,
+    hf_models.olmo2.modeling_olmo2.Olmo2ForCausalLM: olmo2_lm_type_to_module_mapping,
+    hf_models.qwen3.modeling_qwen3.Qwen3Model: qwen3_type_to_module_mapping,
+    hf_models.qwen3.modeling_qwen3.Qwen3ForCausalLM: qwen3_lm_type_to_module_mapping,
     hf_models.esm.modeling_esm.EsmModel: esm_type_to_module_mapping,
     hf_models.esm.modeling_esm.EsmForMaskedLM: esm_mlm_type_to_module_mapping,
     hf_models.blip.modeling_blip.BlipForQuestionAnswering: blip_type_to_module_mapping,
@@ -109,6 +115,10 @@
     hf_models.gemma2.modeling_gemma2.Gemma2ForCausalLM: gemma2_lm_type_to_dimension_mapping,
     hf_models.olmo.modeling_olmo.OlmoModel: olmo_type_to_dimension_mapping,
     hf_models.olmo.modeling_olmo.OlmoForCausalLM: olmo_lm_type_to_dimension_mapping,
+    hf_models.olmo2.modeling_olmo2.Olmo2Model: olmo2_type_to_dimension_mapping,
+    hf_models.olmo2.modeling_olmo2.Olmo2ForCausalLM: olmo2_lm_type_to_dimension_mapping,
+    hf_models.qwen3.modeling_qwen3.Qwen3Model: qwen3_type_to_dimension_mapping,
+    hf_models.qwen3.modeling_qwen3.Qwen3ForCausalLM: qwen3_lm_type_to_dimension_mapping,
     hf_models.esm.modeling_esm.EsmModel: esm_type_to_dimension_mapping,
     hf_models.esm.modeling_esm.EsmForMaskedLM: esm_mlm_type_to_dimension_mapping,
     hf_models.blip.modeling_blip.BlipForQuestionAnswering: blip_type_to_dimension_mapping,
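
A quick sketch of how these registrations get used: pyvene keys its lookups on the Hugging Face model class, so once a checkpoint is loaded the right mapping comes straight out of the dict. The dictionary name below is assumed from context (the hunks above do not show it); treat this as illustrative.

from transformers import AutoModelForCausalLM

# Assumed dict name: type_to_module_mapping (not visible in the hunks above).
from pyvene.models.intervenable_modelcard import type_to_module_mapping

model = AutoModelForCausalLM.from_pretrained("allenai/OLMo-2-1124-7B")
print(type_to_module_mapping[type(model)]["block_output"])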

pyvene/models/olmo2/__init__.py

Whitespace-only changes.

pyvene/models/olmo2/modelings_intervenable_olmo2.py

Lines changed: 94 additions & 0 deletions

@@ -0,0 +1,94 @@
"""
Each modeling file in this library is a mapping between
abstract names of intervention anchor points and the actual
model modules defined in the HuggingFace library.

We also want to let the intervention library know how to
configure the dimensions of an intervention based on the model
config defined in the HuggingFace library.
"""


import torch
from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer
from ..constants import *


olmo2_type_to_module_mapping = {
    "block_input": ("layers[%s]", CONST_INPUT_HOOK),
    "block_output": ("layers[%s]", CONST_OUTPUT_HOOK),
    "mlp_activation": ("layers[%s].mlp.act_fn", CONST_OUTPUT_HOOK),
    "mlp_output": ("layers[%s].mlp", CONST_OUTPUT_HOOK),
    "mlp_input": ("layers[%s].mlp", CONST_INPUT_HOOK),
    "attention_value_output": ("layers[%s].self_attn.o_proj", CONST_INPUT_HOOK),
    "head_attention_value_output": ("layers[%s].self_attn.o_proj", CONST_INPUT_HOOK, (split_head_and_permute, "n_head")),
    "attention_output": ("layers[%s].self_attn", CONST_OUTPUT_HOOK),
    "attention_input": ("layers[%s].self_attn", CONST_INPUT_HOOK),
    "query_output": ("layers[%s].self_attn.q_proj", CONST_OUTPUT_HOOK),
    "key_output": ("layers[%s].self_attn.k_proj", CONST_OUTPUT_HOOK),
    "value_output": ("layers[%s].self_attn.v_proj", CONST_OUTPUT_HOOK),
    "head_query_output": ("layers[%s].self_attn.q_proj", CONST_OUTPUT_HOOK, (split_head_and_permute, "n_head")),
    "head_key_output": ("layers[%s].self_attn.k_proj", CONST_OUTPUT_HOOK, (split_head_and_permute, "n_kv_head")),
    "head_value_output": ("layers[%s].self_attn.v_proj", CONST_OUTPUT_HOOK, (split_head_and_permute, "n_kv_head")),
}
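
The "%s" in each component path is a layer-index placeholder, so one entry covers every transformer block. A minimal sketch of the resolution step, under the assumption that pyvene fills the placeholder and then attaches a hook of the given type (the resolver shown is illustrative, not pyvene's internal code):

# Illustrative: resolve the "query_output" anchor at layer 3.
component, hook_type = olmo2_type_to_module_mapping["query_output"][:2]
module_path = component % 3  # -> "layers[3].self_attn.q_proj"
# pyvene then hooks the input or output of that submodule, per hook_type.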

olmo2_type_to_dimension_mapping = {
    "n_head": ("num_attention_heads",),
    "n_kv_head": ("num_key_value_heads",),
    "block_input": ("hidden_size",),
    "block_output": ("hidden_size",),
    "mlp_activation": ("intermediate_size",),
    "mlp_output": ("hidden_size",),
    "mlp_input": ("hidden_size",),
    "attention_value_output": ("hidden_size",),
    "head_attention_value_output": ("hidden_size/num_attention_heads",),
    "attention_output": ("hidden_size",),
    "attention_input": ("hidden_size",),
    "query_output": ("hidden_size",),
    "key_output": ("hidden_size",),
    "value_output": ("hidden_size",),
    "head_query_output": ("hidden_size/num_attention_heads",),
    "head_key_output": ("hidden_size/num_attention_heads",),
    "head_value_output": ("hidden_size/num_attention_heads",),
}
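
Each dimension entry is resolved against the Hugging Face model config; strings like "hidden_size/num_attention_heads" denote the per-head size. A hedged arithmetic check (the numbers in the comment are typical 7B values, not taken from this diff):

from transformers import AutoConfig

cfg = AutoConfig.from_pretrained("allenai/OLMo-2-1124-7B")
head_dim = cfg.hidden_size // cfg.num_attention_heads
# e.g. hidden_size=4096 with num_attention_heads=32 gives head_dim=128,
# the unit pyvene intervenes on for "head_query_output" and friends.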

"""olmo2 model with LM head"""
olmo2_lm_type_to_module_mapping = {}
for k, v in olmo2_type_to_module_mapping.items():
    # The CausalLM wrapper nests the base transformer under `.model`,
    # so every component path gains a "model." prefix.
    olmo2_lm_type_to_module_mapping[k] = (f"model.{v[0]}",) + v[1:]


olmo2_lm_type_to_dimension_mapping = olmo2_type_to_dimension_mapping


"""olmo2 model with classifier head"""
olmo2_classifier_type_to_module_mapping = {}
for k, v in olmo2_type_to_module_mapping.items():
    olmo2_classifier_type_to_module_mapping[k] = (f"model.{v[0]}",) + v[1:]


olmo2_classifier_type_to_dimension_mapping = olmo2_type_to_dimension_mapping

def create_olmo2(
    name="allenai/OLMo-2-1124-7B", cache_dir=None, dtype=torch.bfloat16, config=None,
    revision="main",
):
    """Creates an OLMo2 causal LM model, config, and tokenizer from the given name and revision."""
    if config is None:
        config = AutoConfig.from_pretrained(name, cache_dir=cache_dir)
        olmo2 = AutoModelForCausalLM.from_pretrained(
            name,
            config=config,
            cache_dir=cache_dir,
            torch_dtype=dtype,
            revision=revision,
        )
        tokenizer = AutoTokenizer.from_pretrained(name, cache_dir=cache_dir)
    else:
        # `AutoModelForCausalLM` cannot be instantiated directly; build an
        # uninitialized model from the supplied config instead.
        olmo2 = AutoModelForCausalLM.from_config(config)
        tokenizer = AutoTokenizer.from_pretrained(name, cache_dir=cache_dir)
    print("loaded model")
    return config, tokenizer, olmo2
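
Putting the factory to work: a minimal end-to-end sketch wiring the returned model into an IntervenableModel. The config dict follows pyvene's documented style; treat the exact keys as an assumption rather than part of this PR.

import pyvene as pv
from pyvene.models.olmo2.modelings_intervenable_olmo2 import create_olmo2

config, tokenizer, olmo2 = create_olmo2()
pv_olmo2 = pv.IntervenableModel({
    "layer": 0,
    "component": "block_output",          # resolved via the mapping above
    "intervention_type": pv.VanillaIntervention,
}, model=olmo2)

create_qwen3 below follows the same triple-return convention for Qwen3.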

pyvene/models/qwen3/__init__.py

Whitespace-only changes.

pyvene/models/qwen3/modelings_intervenable_qwen3.py

Lines changed: 77 additions & 0 deletions

@@ -0,0 +1,77 @@
"""
Each modeling file in this library is a mapping between
abstract names of intervention anchor points and the actual
model modules defined in the HuggingFace library.

We also want to let the intervention library know how to
configure the dimensions of an intervention based on the model
config defined in the HuggingFace library.
"""
import torch
from ..constants import *

qwen3_type_to_module_mapping = {
    "block_input": ("layers[%s]", CONST_INPUT_HOOK),
    "block_output": ("layers[%s]", CONST_OUTPUT_HOOK),
    "mlp_activation": ("layers[%s].mlp.act_fn", CONST_OUTPUT_HOOK),
    "mlp_output": ("layers[%s].mlp", CONST_OUTPUT_HOOK),
    "mlp_input": ("layers[%s].mlp", CONST_INPUT_HOOK),
    "attention_value_output": ("layers[%s].self_attn.o_proj", CONST_INPUT_HOOK),
    "head_attention_value_output": ("layers[%s].self_attn.o_proj", CONST_INPUT_HOOK, (split_head_and_permute, "n_head")),
    "attention_output": ("layers[%s].self_attn", CONST_OUTPUT_HOOK),
    "attention_input": ("layers[%s].self_attn", CONST_INPUT_HOOK),
    "query_output": ("layers[%s].self_attn.q_proj", CONST_OUTPUT_HOOK),
    "key_output": ("layers[%s].self_attn.k_proj", CONST_OUTPUT_HOOK),
    "value_output": ("layers[%s].self_attn.v_proj", CONST_OUTPUT_HOOK),
    "head_query_output": ("layers[%s].self_attn.q_proj", CONST_OUTPUT_HOOK, (split_head_and_permute, "n_head")),
    "head_key_output": ("layers[%s].self_attn.k_proj", CONST_OUTPUT_HOOK, (split_head_and_permute, "n_kv_head")),
    "head_value_output": ("layers[%s].self_attn.v_proj", CONST_OUTPUT_HOOK, (split_head_and_permute, "n_kv_head")),
}
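
Qwen3 uses grouped-query attention, which is why "head_key_output" and "head_value_output" split on "n_kv_head" while the query side splits on "n_head". A conceptual sketch of what a split-head transform such as split_head_and_permute does to a raw projection output (shapes illustrative; this is not pyvene's exact implementation):

import torch

batch, seq, n_kv_head, head_dim = 2, 5, 8, 128
kv = torch.randn(batch, seq, n_kv_head * head_dim)  # raw k_proj/v_proj output
heads = kv.view(batch, seq, n_kv_head, head_dim).permute(0, 2, 1, 3)
print(heads.shape)  # (2, 8, 5, 128): one addressable slice per KV head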

qwen3_type_to_dimension_mapping = {
    "n_head": ("num_attention_heads",),
    "n_kv_head": ("num_key_value_heads",),
    "block_input": ("hidden_size",),
    "block_output": ("hidden_size",),
    "mlp_activation": ("intermediate_size",),
    "mlp_output": ("hidden_size",),
    "mlp_input": ("hidden_size",),
    "attention_value_output": ("hidden_size",),
    "head_attention_value_output": ("hidden_size/num_attention_heads",),
    "attention_output": ("hidden_size",),
    "attention_input": ("hidden_size",),
    "query_output": ("hidden_size",),
    "key_output": ("hidden_size",),
    "value_output": ("hidden_size",),
    "head_query_output": ("hidden_size/num_attention_heads",),
    "head_key_output": ("hidden_size/num_attention_heads",),
    "head_value_output": ("hidden_size/num_attention_heads",),
}

"""qwen3 model with LM head"""
qwen3_lm_type_to_module_mapping = {}
for k, v in qwen3_type_to_module_mapping.items():
    qwen3_lm_type_to_module_mapping[k] = (f"model.{v[0]}",) + v[1:]
qwen3_lm_type_to_dimension_mapping = qwen3_type_to_dimension_mapping

"""qwen3 model with classifier head"""
qwen3_classifier_type_to_module_mapping = {}
for k, v in qwen3_type_to_module_mapping.items():
    qwen3_classifier_type_to_module_mapping[k] = (f"model.{v[0]}",) + v[1:]
qwen3_classifier_type_to_dimension_mapping = qwen3_type_to_dimension_mapping

def create_qwen3(
    name="Qwen/Qwen3-8B", cache_dir=None, dtype=torch.bfloat16
):
    """Creates a Qwen3 causal LM model, config, and tokenizer from the given name."""
    from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer

    config = AutoConfig.from_pretrained(name, cache_dir=cache_dir)
    tokenizer = AutoTokenizer.from_pretrained(name, cache_dir=cache_dir)
    model = AutoModelForCausalLM.from_pretrained(
        name,
        config=config,
        cache_dir=cache_dir,
        torch_dtype=dtype,
    )
    print("loaded model")
    return config, tokenizer, model
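
As a smoke test, the returned triple drops straight into the standard Hugging Face generation loop (prompt and decoding settings are illustrative):

from pyvene.models.qwen3.modelings_intervenable_qwen3 import create_qwen3

config, tokenizer, model = create_qwen3()
inputs = tokenizer("Hello, Qwen3!", return_tensors="pt").to(model.device)
output = model.generate(**inputs, max_new_tokens=20)
print(tokenizer.decode(output[0], skip_special_tokens=True))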
