// Undirected graph whose nodes are bracketed source-file paths.
// Each edge carries a numeric label that matches its penwidth; the alpha
// suffix of the edge colour grows with that number (5E < 70 < 82 < 93).
// NOTE(review): the meaning of the number (e.g. coupling / co-change count)
// is not stated in this file -- confirm with whatever tool generated it.
// Statement order is kept exactly as generated, since declaration order can
// influence the layout.
graph G {
    // ---- graph-wide attributes ----
    compound="true";
    rankdir="TB";
    bgcolor="white";
    fontname="Tahoma";

    // ---- defaults applied to every node ----
    node [
        fixedsize="false",
        fontname="Tahoma",
        color="white",
        fillcolor="deepskyblue2",
        fontcolor="black",
        shape="box",
        style="filled",
        penwidth="1.0"
    ];

    // ---- defaults applied to every edge (overridden per edge below) ----
    edge [
        fontname="Arial",
        color="#00688b",
        fontcolor="black",
        fontsize="12",
        arrowsize="0.5",
        penwidth="1.0"
    ];

    // ---- edges labelled 4 ----
    "[toolkits/model_checkpoints_convertor/utils/__init__.py]" -- "[toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe.py]" [label=" 4 ", penwidth="4", color="#00688b93"];

    // ---- edges labelled 3 ----
    "[megatron_patch/data/utils.py]" -- "[megatron_patch/template/helper.py]" [label=" 3 ", penwidth="3", color="#00688b82"];
    "[megatron_patch/data/utils.py]" -- "[toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe.py]" [label=" 3 ", penwidth="3", color="#00688b82"];
    "[toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe.py]" -- "[megatron_patch/arguments.py]" [label=" 3 ", penwidth="3", color="#00688b82"];

    // ---- edges labelled 2 ----
    "[toolkits/model_checkpoints_convertor/utils/__init__.py]" -- "[megatron_patch/arguments.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[megatron_patch/arguments.py]" -- "[megatron_patch/template/helper.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[megatron_patch/model/deepseek_v2/transformer_config.py]" -- "[megatron_patch/arguments.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[megatron_patch/data/__init__.py]" -- "[megatron_patch/template/helper.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[megatron_patch/data/__init__.py]" -- "[megatron_patch/data/utils.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[toolkits/distributed_checkpoints_convertor/impl/general/synchronizer.py]" -- "[toolkits/distributed_checkpoints_convertor/impl/general/m2h_synchronizer.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[toolkits/distributed_checkpoints_convertor/impl/general/synchronizer.py]" -- "[toolkits/distributed_checkpoints_convertor/impl/general/h2m_synchronizer.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[toolkits/model_checkpoints_convertor/utils/__init__.py]" -- "[megatron_patch/template/helper.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[megatron_patch/data/utils.py]" -- "[toolkits/model_checkpoints_convertor/utils/__init__.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[toolkits/distributed_checkpoints_convertor/impl/general/m2h_synchronizer.py]" -- "[toolkits/distributed_checkpoints_convertor/impl/general/h2m_synchronizer.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[megatron_patch/data/utils.py]" -- "[megatron_patch/arguments.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe.py]" -- "[megatron_patch/template/helper.py]" [label=" 2 ", penwidth="2", color="#00688b70"];
    "[toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_vl.py]" -- "[megatron_patch/template/helper.py]" [label=" 2 ", penwidth="2", color="#00688b70"];

    // ---- edges labelled 1 ----
    "[megatron_patch/data/__init__.py]" -- "[megatron_patch/model/deepseek_v2/transformer_config.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/model_checkpoints_convertor/llama/hf2mcore_llama3_1.py]" -- "[megatron_patch/data/__init__.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/model_checkpoints_convertor/mistral/hf2mcore.py]" -- "[megatron_patch/model/qwen2_vl/layer_specs.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen2_5_vl/model.py]" -- "[megatron_patch/data/image_processing.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/multimodal_data_preprocessing/convert_llava_pretrain_to_wds.py]" -- "[megatron_patch/model/qwen2_5_vl/transformer_config.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/multimodal_data_preprocessing/build_llava_frame_dataset.py]" -- "[megatron_patch/data/dataset_helpers.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/multimodal_data_preprocessing/replace_llava_image_key.py]" -- "[megatron_patch/model/qwen2_5_vl/model.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v2_moe.py]" -- "[toolkits/model_checkpoints_convertor/utils/__init__.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen2_5_vl/transformer_block.py]" -- "[megatron_patch/model/qwen2_5_vl/visionmodel.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/multimodal_data_preprocessing/build_llava_frame_dataset.py]" -- "[megatron_patch/model/qwen2_5_vl/transformer_config.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/pretrain_data_preprocessing/preprocess_data_megatron.py]" -- "[megatron_patch/model/qwen3_moe/moe_module_specs.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/deepseek_v2/transformer_config.py]" -- "[megatron_patch/model/deepseek_v2/multi_latent_attention.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/m2h_synchronizer.py]" -- "[toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/h2m_synchronizer.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_vl.py]" -- "[megatron_patch/model/deepseek_v2/transformer_config.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen3_moe/moe_module_specs.py]" -- "[megatron_patch/model/qwen3_moe/moe/moe_layer.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen3_moe/moe_module_specs.py]" -- "[megatron_patch/model/qwen3_moe/gpt_layer_specs.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/model_checkpoints_convertor/mistral/hf2mcore.py]" -- "[megatron_patch/template/helper.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen3_moe/moe_module_specs.py]" -- "[megatron_patch/model/qwen3_moe/moe/moe_utils.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/model_checkpoints_convertor/mistral/hf2mcore.py]" -- "[toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/data/json_sft.py]" -- "[megatron_patch/template/helper.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/multimodal_data_preprocessing/convert_llava_pretrain_to_wds.py]" -- "[megatron_patch/model/qwen2_5_vl/transformer_block.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen2_vl/attention_vision.py]" -- "[toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_vl.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen2_vl/layer_specs.py]" -- "[toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_vl.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/data/json_sft.py]" -- "[megatron_patch/arguments.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/data/json_sft.py]" -- "[megatron_patch/data/__init__.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen2_vl/attention_vision.py]" -- "[megatron_patch/data/utils.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_moe.py]" -- "[megatron_patch/model/qwen3_moe/moe_module_specs.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/multimodal_data_preprocessing/convert_llava_pretrain_to_wds.py]" -- "[toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2.5_vl.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/qwen2_vl/attention.py]" -- "[toolkits/model_checkpoints_convertor/utils/__init__.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/model/deepseek_v2/transformer_config.py]" -- "[megatron_patch/template/helper.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[megatron_patch/data/json_sft.py]" -- "[toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/multimodal_data_preprocessing/convert_custom_dataset_to_wds_chatml.py]" -- "[toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2.5_vl.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
    "[toolkits/multimodal_data_preprocessing/replace_llava_image_key.py]" -- "[megatron_patch/model/qwen2_5_vl/transformer_config.py]" [label=" 1 ", penwidth="1", color="#00688b5E"];
}