pyvene.models.olmo2.modelings_intervenable_olmo2.olmo2_lm_type_to_dimension_mapping

pyvene.models.olmo2.modelings_intervenable_olmo2.olmo2_lm_type_to_dimension_mapping

olmo2_lm_type_to_dimension_mapping = {'attention_input': ('hidden_size',), 'attention_output': ('hidden_size',), 'attention_value_output': ('hidden_size',), 'block_input': ('hidden_size',), 'block_output': ('hidden_size',), 'head_attention_value_output': ('head_dim', 'hidden_size/num_attention_heads'), 'head_key_output': ('head_dim', 'hidden_size/num_attention_heads'), 'head_query_output': ('head_dim', 'hidden_size/num_attention_heads'), 'head_value_output': ('head_dim', 'hidden_size/num_attention_heads'), 'key_output': ('num_key_value_heads*hidden_size/num_attention_heads',), 'mlp_activation': ('intermediate_size',), 'mlp_input': ('hidden_size',), 'mlp_output': ('hidden_size',), 'n_head': ('num_attention_heads',), 'n_kv_head': ('num_key_value_heads',), 'query_output': ('hidden_size',), 'value_output': ('num_key_value_heads*hidden_size/num_attention_heads',)}

olmo2 model with classifier head