in train.py [0:0]
def get_run_name(train_cfg, vlm_cfg):
    """Assemble the run-name string from the training and model configs.

    The result is ``nanoVLM`` followed by underscore-separated fields, in
    this order: the last ``/``-separated segment of
    ``vlm_cfg.vit_model_type``, ``mp`` + ``vlm_cfg.mp_pixel_shuffle_factor``,
    the last segment of ``vlm_cfg.lm_model_type``, ``<world size>xGPU``,
    the dataset tag, ``bs`` + batch figure, ``train_cfg.max_training_steps``,
    ``lr<lr_backbones>-<lr_mp>``, and a ``%m%d-%H%M%S`` local timestamp.

    Args:
        train_cfg: Object exposing ``data_cutoff_idx``, ``batch_size``,
            ``gradient_accumulation_steps``, ``max_training_steps``,
            ``lr_backbones`` and ``lr_mp``.
        vlm_cfg: Object exposing ``vit_model_type``, ``lm_model_type`` and
            ``mp_pixel_shuffle_factor``.

    Returns:
        The formatted run name as a string.
    """
    # Dataset tag: "full_ds" when no cutoff is configured, else "<idx>samples".
    cutoff = train_cfg.data_cutoff_idx
    if cutoff is None:
        data_tag = "full_ds"
    else:
        data_tag = f"{cutoff}samples"

    # batch_size * world size * gradient accumulation steps, truncated to int.
    batch_total = int(
        train_cfg.batch_size
        * get_world_size()
        * train_cfg.gradient_accumulation_steps
    )

    fields = [
        "nanoVLM",
        # Keep only the part after the last "/" of each model identifier.
        f"{vlm_cfg.vit_model_type.split('/')[-1]}",
        f"mp{vlm_cfg.mp_pixel_shuffle_factor}",
        f"{vlm_cfg.lm_model_type.split('/')[-1]}",
        f"{get_world_size()}xGPU",
        data_tag,
        f"bs{batch_total}",
        f"{train_cfg.max_training_steps}",
        f"lr{train_cfg.lr_backbones}-{train_cfg.lr_mp}",
        # Month-day and time only; the year is not part of the name.
        time.strftime("%m%d-%H%M%S"),
    ]
    return "_".join(fields)