Skip to content

Commit b9c5dee

Browse files
author
tangbinhan
committed
update
1 parent ef4e9e0 commit b9c5dee

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

fastdeploy/model_executor/layers/linear.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -391,7 +391,7 @@ def load_state_dict(self, state_dict: dict):
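391 391
392 392   state_dict[self.weight_key] = weight_tensor
393 393
394     - super().load_state_dict(state_dict)
    394 + super().load_state_dict(state_dict)
395 395
396 396
397 397   class QKVParallelLinear(ColumnParallelLinear):

Note: the removed and added versions of line 394 read identically here, so the actual difference (likely whitespace-only) was not preserved in this extraction.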

fastdeploy/model_executor/model_loader/load_time_quantization_loader.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -76,12 +76,12 @@ def _get_quantized_weights(
76 76   apply_quant_action(
77 77   quant_filtered_map,
78 78   key,
79    - weight.clone(),
   79 + weight,
80 80   state_dict,
81 81   quant_layer_instance_map,
82 82   )
83 83   else:
84    - state_dict[key] = weight.clone()
   84 + state_dict[key] = weight
85 85   deal_state_dict(state_dict)
86 86   paddle.device.cuda.empty_cache()
87 87   paddle.device.cuda.synchronize()

0 commit comments

Comments
 (0)