We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent db97782, commit 2ac2d08 (Copy full SHA for 2ac2d08)
internlm/checkpoint/load_funcs.py
@@ -148,12 +148,6 @@ def load_hf_llama_pretrained_weights(folder, model):
148
if f"model.layers.{layer_ids}.self_attn.rotary_emb.inv_freq" in states:
149
states.pop(f"model.layers.{layer_ids}.self_attn.rotary_emb.inv_freq")
150
151
- if gpc.config.model_type in ("LLAMA2",):
152
- w2 = states.pop(f"layers.{i}.feed_forward.w2.weight")
153
- w3 = states.pop(f"layers.{i}.feed_forward.w3.weight")
154
- states[f"layers.{i}.feed_forward.w2.weight"] = w3
155
- states[f"layers.{i}.feed_forward.w3.weight"] = w2
156
-
157
for name in list(states.keys()):
158
if name.startswith(f"layers.{i}"):
159
current_states[name.replace(f".{i}.", f".{idx}.")] = states.pop(name)
0 commit comments