|
36 | 36 | "mlp_output": ("hidden_size",), |
37 | 37 | "mlp_input": ("hidden_size",), |
38 | 38 | "attention_value_output": ("hidden_size",), |
39 | | - "head_attention_value_output": ("hidden_size/num_attention_heads",), |
| 39 | + "head_attention_value_output": ("head_dim", "hidden_size/num_attention_heads",), |
40 | 40 | "attention_output": ("hidden_size",), |
41 | 41 | "attention_input": ("hidden_size",), |
42 | 42 | "query_output": ("hidden_size",), |
43 | 43 | "key_output": ("num_key_value_heads*hidden_size/num_attention_heads",), |
44 | 44 | "value_output": ("num_key_value_heads*hidden_size/num_attention_heads",), |
45 | | - "head_query_output": ("hidden_size/num_attention_heads",), |
46 | | - "head_key_output": ("hidden_size/num_attention_heads",), |
47 | | - "head_value_output": ("hidden_size/num_attention_heads",), |
| 45 | + "head_query_output": ("head_dim", "hidden_size/num_attention_heads",), |
| 46 | + "head_key_output": ("head_dim", "hidden_size/num_attention_heads",), |
| 47 | + "head_value_output": ("head_dim", "hidden_size/num_attention_heads",), |
48 | 48 | } |
49 | 49 |
|
50 | 50 | """qwen2 model with LM head""" |
|
0 commit comments