refactor rl get_name_mappings_to_training (#2847)
Some checks failed
Deploy GitHub Pages / deploy (push) Has been cancelled

* refactor rl get_name_mappings_to_training

* fix tp>1

* rename variables (ffn1 -> up_gate_proj, ffn2 -> down_proj)

* rename variables (linear_weight -> weight, linear_bias -> bias)

* add RL name mappings for VL

* fix ernie 0.3B error

* fix develop code

* fix
This commit is contained in:
Yuanle Liu
2025-07-15 22:31:42 +08:00
committed by GitHub
parent e7bcbbab52
commit 61b3997b85
47 changed files with 1591 additions and 1629 deletions

View File

@@ -311,18 +311,18 @@ def w4a8_weight_convert(state_dict):
w4a8_weight_bites_layers_map = {}
w4a8_weight_bites_layers_map["qkv_gemm_bits_map"] = []
w4a8_weight_bites_layers_map["out_gemm_bits_map"] = []
w4a8_weight_bites_layers_map["ffn1_gemm_bits_map"] = []
w4a8_weight_bites_layers_map["ffn2_gemm_bits_map"] = []
w4a8_weight_bites_layers_map["up_gate_proj_gemm_bits_map"] = []
w4a8_weight_bites_layers_map["down_proj_gemm_bits_map"] = []
for name_keys, gemm_bits in w4a8_weight_bites_name_map.items():
if "qkv_proj" in name_keys:
w4a8_weight_bites_layers_map["qkv_gemm_bits_map"].append(gemm_bits)
elif "out_proj" in name_keys:
w4a8_weight_bites_layers_map["out_gemm_bits_map"].append(gemm_bits)
elif "linear1" in name_keys:
w4a8_weight_bites_layers_map["ffn1_gemm_bits_map"].append(
w4a8_weight_bites_layers_map["up_gate_proj_gemm_bits_map"].append(
gemm_bits)
elif "linear2" in name_keys:
w4a8_weight_bites_layers_map["ffn2_gemm_bits_map"].append(
w4a8_weight_bites_layers_map["down_proj_gemm_bits_map"].append(
gemm_bits)
logger.debug(
f"w4a8_weight_bites_layers_map:{w4a8_weight_bites_layers_map}")