in picotron/checkpoint.py [0:0]
def convert_safetensors_to_hf_name(self, sft_name):
    """Rewrite a safetensors tensor name using a fixed set of substitutions.

    The rules below are applied one after another, each on the output of
    the previous one, so their order matters. Name components that no rule
    matches (for example ``input_layernorm`` and
    ``post_attention_layernorm``) pass through unchanged.

    Args:
        sft_name: Tensor name as stored in the safetensors checkpoint,
            e.g. ``"model.layers.0.self_attn.o_proj.weight"``.

    Returns:
        The renamed string, e.g.
        ``"decoder_layers.0.attention.out_proj.weight"``.
    """
    # Each pattern is a regular expression. Literal dots are escaped so that
    # "model." only matches the dotted component and not, say, "models" or
    # "model_" (an unescaped "." matches any character).
    substitutions = (
        # Must run first: the "^norm" rule relies on the prefix being gone.
        (r"model\.", ""),
        (r"layers\.", "decoder_layers."),
        (r"embed_tokens", "embedding"),
        (r"self_attn\.", "attention."),
        (r"o_proj", "out_proj"),
        (r"lm_head", "final_proj"),
        # Anchored so that "...layernorm" components are left alone and only
        # a name that starts with "norm" is renamed.
        (r"^norm", "final_norm"),
    )

    renamed = sft_name
    for pattern, replacement in substitutions:
        renamed = re.sub(pattern, replacement, renamed)
    return renamed