1
+ + odict_keys ([' model.embed_tokens.weight'
2
+ ' model.layers.0.self_attn.q_proj.weight_scale'
3
+ ' model.layers.0.self_attn.q_proj.weight_zero_point'
4
+ ' model.layers.0.self_attn.q_proj.weight'
5
+ ' model.layers.0.self_attn.k_proj.weight_scale'
6
+ ' model.layers.0.self_attn.k_proj.weight_zero_point'
7
+ ' model.layers.0.self_attn.k_proj.weight'
8
+ ' model.layers.0.self_attn.v_proj.weight_scale'
9
+ ' model.layers.0.self_attn.v_proj.weight_zero_point'
10
+ ' model.layers.0.self_attn.v_proj.weight'
11
+ ' model.layers.0.self_attn.o_proj.weight_scale'
12
+ ' model.layers.0.self_attn.o_proj.weight_zero_point'
13
+ ' model.layers.0.self_attn.o_proj.weight'
14
+ ' model.layers.0.mlp.gate_proj.weight_scale'
15
+ ' model.layers.0.mlp.gate_proj.weight_zero_point'
16
+ ' model.layers.0.mlp.gate_proj.weight'
17
+ ' model.layers.0.mlp.up_proj.weight_scale'
18
+ ' model.layers.0.mlp.up_proj.weight_zero_point'
19
+ ' model.layers.0.mlp.up_proj.weight'
20
+ ' model.layers.0.mlp.down_proj.weight_scale'
21
+ ' model.layers.0.mlp.down_proj.weight_zero_point'
22
+ ' model.layers.0.mlp.down_proj.weight'
23
+ ' model.layers.0.input_layernorm.weight'
24
+ ' model.layers.0.post_attention_layernorm.weight'
25
+ ' model.layers.1.self_attn.q_proj.weight_scale'
26
+ ' model.layers.1.self_attn.q_proj.weight_zero_point'
27
+ ' model.layers.1.self_attn.q_proj.weight'
28
+ ' model.layers.1.self_attn.k_proj.weight_scale'
29
+ ' model.layers.1.self_attn.k_proj.weight_zero_point'
30
+ ' model.layers.1.self_attn.k_proj.weight'
31
+ ' model.layers.1.self_attn.v_proj.weight_scale'
32
+ ' model.layers.1.self_attn.v_proj.weight_zero_point'
33
+ ' model.layers.1.self_attn.v_proj.weight'
34
+ ' model.layers.1.self_attn.o_proj.weight_scale'
35
+ ' model.layers.1.self_attn.o_proj.weight_zero_point'
36
+ ' model.layers.1.self_attn.o_proj.weight'
37
+ ' model.layers.1.mlp.gate_proj.weight_scale'
38
+ ' model.layers.1.mlp.gate_proj.weight_zero_point'
39
+ ' model.layers.1.mlp.gate_proj.weight'
40
+ ' model.layers.1.mlp.up_proj.weight_scale'
41
+ ' model.layers.1.mlp.up_proj.weight_zero_point'
42
+ ' model.layers.1.mlp.up_proj.weight'
43
+ ' model.layers.1.mlp.down_proj.weight_scale'
44
+ ' model.layers.1.mlp.down_proj.weight_zero_point'
45
+ ' model.layers.1.mlp.down_proj.weight'
46
+ ' model.layers.1.input_layernorm.weight'
47
+ ' model.layers.1.post_attention_layernorm.weight'
48
+ ' model.layers.2.self_attn.q_proj.weight_scale'
49
+ ' model.layers.2.self_attn.q_proj.weight_zero_point'
50
+ ' model.layers.2.self_attn.q_proj.weight'
51
+ ' model.layers.2.self_attn.k_proj.weight_scale'
52
+ ' model.layers.2.self_attn.k_proj.weight_zero_point'
53
+ ' model.layers.2.self_attn.k_proj.weight'
54
+ ' model.layers.2.self_attn.v_proj.weight_scale'
55
+ ' model.layers.2.self_attn.v_proj.weight_zero_point'
56
+ ' model.layers.2.self_attn.v_proj.weight'
57
+ ' model.layers.2.self_attn.o_proj.weight_scale'
58
+ ' model.layers.2.self_attn.o_proj.weight_zero_point'
59
+ ' model.layers.2.self_attn.o_proj.weight'
60
+ ' model.layers.2.mlp.gate_proj.weight_scale'
61
+ ' model.layers.2.mlp.gate_proj.weight_zero_point'
62
+ ' model.layers.2.mlp.gate_proj.weight'
63
+ ' model.layers.2.mlp.up_proj.weight_scale'
64
+ ' model.layers.2.mlp.up_proj.weight_zero_point'
65
+ ' model.layers.2.mlp.up_proj.weight'
66
+ ' model.layers.2.mlp.down_proj.weight_scale'
67
+ ' model.layers.2.mlp.down_proj.weight_zero_point'
68
+ ' model.layers.2.mlp.down_proj.weight'
69
+ ' model.layers.2.input_layernorm.weight'
70
+ ' model.layers.2.post_attention_layernorm.weight'
71
+ ' model.layers.3.self_attn.q_proj.weight_scale'
72
+ ' model.layers.3.self_attn.q_proj.weight_zero_point'
73
+ ' model.layers.3.self_attn.q_proj.weight'
74
+ ' model.layers.3.self_attn.k_proj.weight_scale'
75
+ ' model.layers.3.self_attn.k_proj.weight_zero_point'
76
+ ' model.layers.3.self_attn.k_proj.weight'
77
+ ' model.layers.3.self_attn.v_proj.weight_scale'
78
+ ' model.layers.3.self_attn.v_proj.weight_zero_point'
79
+ ' model.layers.3.self_attn.v_proj.weight'
80
+ ' model.layers.3.self_attn.o_proj.weight_scale'
81
+ ' model.layers.3.self_attn.o_proj.weight_zero_point'
82
+ ' model.layers.3.self_attn.o_proj.weight' ' model.layers.3.mlp.gate_proj.weight_scale'
83
+ ' model.layers.3.mlp.gate_proj.weight_zero_point'
84
+ ' model.layers.3.mlp.gate_proj.weight'
85
+ ' model.layers.3.mlp.up_proj.weight_scale'
86
+ ' model.layers.3.mlp.up_proj.weight_zero_point'
87
+ ' model.layers.3.mlp.up_proj.weight'
88
+ ' model.layers.3.mlp.down_proj.weight_scale'
89
+ ' model.layers.3.mlp.down_proj.weight_zero_point'
90
+ ' model.layers.3.mlp.down_proj.weight'
91
+ ' model.layers.3.input_layernorm.weight'
92
+ ' model.layers.3.post_attention_layernorm.weight'
93
+ ' model.layers.4.self_attn.q_proj.weight_scale'
94
+ ' model.layers.4.self_attn.q_proj.weight_zero_point'
95
+ ' model.layers.4.self_attn.q_proj.weight'
96
+ ' model.layers.4.self_attn.k_proj.weight_scale'
97
+ ' model.layers.4.self_attn.k_proj.weight_zero_point'
98
+ ' model.layers.4.self_attn.k_proj.weight'
99
+ ' model.layers.4.self_attn.v_proj.weight_scale'
100
+ ' model.layers.4.self_attn.v_proj.weight_zero_point'
101
+ ' model.layers.4.self_attn.v_proj.weight'
102
+ ' model.layers.4.self_attn.o_proj.weight_scale'
103
+ ' model.layers.4.self_attn.o_proj.weight_zero_point'
104
+ ' model.layers.4.self_attn.o_proj.weight'
105
+ ' model.layers.4.mlp.gate_proj.weight_scale'
106
+ ' model.layers.4.mlp.gate_proj.weight_zero_point'
107
+ ' model.layers.4.mlp.gate_proj.weight'
108
+ ' model.layers.4.mlp.up_proj.weight_scale'
109
+ ' model.layers.4.mlp.up_proj.weight_zero_point'
110
+ ' model.layers.4.mlp.up_proj.weight'
111
+ ' model.layers.4.mlp.down_proj.weight_scale'
112
+ ' model.layers.4.mlp.down_proj.weight_zero_point'
113
+ ' model.layers.4.mlp.down_proj.weight'
114
+ ' model.layers.4.input_layernorm.weight'
115
+ ' model.layers.4.post_attention_layernorm.weight'
116
+ ' model.layers.5.self_attn.q_proj.weight_scale'
117
+ ' model.layers.5.self_attn.q_proj.weight_zero_point'
118
+ ' model.layers.5.self_attn.q_proj.weight'
119
+ ' model.layers.5.self_attn.k_proj.weight_scale'
120
+ ' model.layers.5.self_attn.k_proj.weight_zero_point'
121
+ ' model.layers.5.self_attn.k_proj.weight'
122
+ ' model.layers.5.self_attn.v_proj.weight_scale'
123
+ ' model.layers.5.self_attn.v_proj.weight_zero_point'
124
+ ' model.layers.5.self_attn.v_proj.weight'
125
+ ' model.layers.5.self_attn.o_proj.weight_scale'
126
+ ' model.layers.5.self_attn.o_proj.weight_zero_point'
127
+ ' model.layers.5.self_attn.o_proj.weight'
128
+ ' model.layers.5.mlp.gate_proj.weight_scale'
129
+ ' model.layers.5.mlp.gate_proj.weight_zero_point'
130
+ ' model.layers.5.mlp.gate_proj.weight'
131
+ ' model.layers.5.mlp.up_proj.weight_scale'
132
+ ' model.layers.5.mlp.up_proj.weight_zero_point'
133
+ ' model.layers.5.mlp.up_proj.weight'
134
+ ' model.layers.5.mlp.down_proj.weight_scale'
135
+ ' model.layers.5.mlp.down_proj.weight_zero_point'
136
+ ' model.layers.5.mlp.down_proj.weight'
137
+ ' model.layers.5.input_layernorm.weight'
138
+ ' model.layers.5.post_attention_layernorm.weight'
139
+ ' model.layers.6.self_attn.q_proj.weight_scale'
140
+ ' model.layers.6.self_attn.q_proj.weight_zero_point'
141
+ ' model.layers.6.self_attn.q_proj.weight'
142
+ ' model.layers.6.self_attn.k_proj.weight_scale'
143
+ ' model.layers.6.self_attn.k_proj.weight_zero_point'
144
+ ' model.layers.6.self_attn.k_proj.weight'
145
+ ' model.layers.6.self_attn.v_proj.weight_scale'
146
+ ' model.layers.6.self_attn.v_proj.weight_zero_point'
147
+ ' model.layers.6.self_attn.v_proj.weight'
148
+ ' model.layers.6.self_attn.o_proj.weight_scale'
149
+ ' model.layers.6.self_attn.o_proj.weight_zero_point'
150
+ ' model.layers.6.self_attn.o_proj.weight'
151
+ ' model.layers.6.mlp.gate_proj.weight_scale'
152
+ ' model.layers.6.mlp.gate_proj.weight_zero_point'
153
+ ' model.layers.6.mlp.gate_proj.weight'
154
+ ' model.layers.6.mlp.up_proj.weight_scale'
155
+ ' model.layers.6.mlp.up_proj.weight_zero_point'
156
+ ' model.layers.6.mlp.up_proj.weight'
157
+ ' model.layers.6.mlp.down_proj.weight_scale'
158
+ ' model.layers.6.mlp.down_proj.weight_zero_point'
159
+ ' model.layers.6.mlp.down_proj.weight'
160
+ ' model.layers.6.input_layernorm.weight'
161
+ ' model.layers.6.post_attention_layernorm.weight'
162
+ ' model.layers.7.self_attn.q_proj.weight_scale'
163
+ ' model.layers.7.self_attn.q_proj.weight_zero_point'
164
+ ' model.layers.7.self_attn.q_proj.weight'
165
+ ' model.layers.7.self_attn.k_proj.weight_scale'
166
+ ' model.layers.7.self_attn.k_proj.weight_zero_point'
167
+ ' model.layers.7.self_attn.k_proj.weight'
168
+ ' model.layers.7.self_attn.v_proj.weight_scale'
169
+ ' model.layers.7.self_attn.v_proj.weight_zero_point'
170
+ ' model.layers.7.self_attn.v_proj.weight'
171
+ ' model.layers.7.self_attn.o_proj.weight_scale'
172
+ ' model.layers.7.self_attn.o_proj.weight_zero_point'
173
+ ' model.layers.7.self_attn.o_proj.weight'
174
+ ' model.layers.7.mlp.gate_proj.weight_scale'
175
+ ' model.layers.7.mlp.gate_proj.weight_zero_point'
176
+ ' model.layers.7.mlp.gate_proj.weight'
177
+ ' model.layers.7.mlp.up_proj.weight_scale'
178
+ ' model.layers.7.mlp.up_proj.weight_zero_point'
179
+ ' model.layers.7.mlp.up_proj.weight'
180
+ ' model.layers.7.mlp.down_proj.weight_scale'
181
+ ' model.layers.7.mlp.down_proj.weight_zero_point'
182
+ ' model.layers.7.mlp.down_proj.weight'
183
+ ' model.layers.7.input_layernorm.weight'
184
+ ' model.layers.7.post_attention_layernorm.weight'
185
+ ' model.norm.weight'
186
+ ' lm_head.weight' ])
0 commit comments