mirror of
				https://github.com/PaddlePaddle/FastDeploy.git
				synced 2025-10-31 03:46:40 +08:00 
			
		
		
		
	support W4A8 EPLB (#3075)
This commit is contained in:
		| @@ -276,7 +276,7 @@ class GCUWeightOnlyMoEMethod(GCUFusedMoeMethod): | ||||
|         up_gate_proj_expert_weight_scale_key = layer.weight_key_map.get("up_gate_proj_expert_weight_scale_key", None) | ||||
|         down_proj_expert_weight_scale_key = layer.weight_key_map.get("down_proj_expert_weight_scale_key", None) | ||||
|  | ||||
|-        up_gate_proj_weights, down_proj_weights, _ = layer.load_experts_weight( | ||||
|+        up_gate_proj_weights, down_proj_weights, _, _ = layer.load_experts_weight( | ||||
|             state_dict, | ||||
|             up_gate_proj_expert_weight_key, | ||||
|             down_proj_expert_weight_key, | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Yuan Xiaolan
					Yuan Xiaolan