pyvene.models.gpt2.modelings_intervenable_gpt2.gpt2_lm_type_to_dimension_mapping
- `gpt2_lm_type_to_dimension_mapping = {'attention_input': ('n_embd',), 'attention_output': ('n_embd',), 'attention_value_output': ('n_embd',), 'attention_weight': ('max_position_embeddings',), 'block_input': ('n_embd',), 'block_output': ('n_embd',), 'head_attention_value_output': ('n_embd/n_head',), 'head_key_output': ('n_embd/n_head',), 'head_query_output': ('n_embd/n_head',), 'head_value_output': ('n_embd/n_head',), 'key_output': ('n_embd',), 'mlp_activation': ('n_inner', 'n_embd*4'), 'mlp_input': ('n_embd',), 'mlp_output': ('n_embd',), 'n_head': ('n_head',), 'query_output': ('n_embd',), 'value_output': ('n_embd',)}`
GPT-2 model with a classifier head.