in scripts/launcher_single.py [0:0]
def finetune_model() -> None:
    """
    Run the single-device fine-tuning workflow.

    All settings are read from the ``args`` object defined outside this
    function. The steps run in this order:

    1. Pass the Hugging Face / Weights & Biases settings to
       ``set_custom_env``.
    2. Create the model, log and model-output directories when missing.
    3. Call ``download_model`` with ``args.model_id`` and ``args.model_dir``.
    4. Build a ``tune run`` command line and pass it to ``run_command``.

    Returns:
        None
    """
    print("***** Starting model fine-tuning *****")

    # Settings handed to set_custom_env (presumably exported as environment
    # variables -- confirm against that helper).
    # Debugging tip: adding an "NCCL_DEBUG": "INFO" entry makes NCCL dump a lot
    # of debug information, which you can search online when problems are
    # reported, or attach as a log file to an issue if the output is unclear.
    env_overrides: Dict[str, str] = {
        "HF_DATASETS_TRUST_REMOTE_CODE": "TRUE",
        "HF_TOKEN": args.hf_token,
        "WANDB_API_KEY": args.wandb_api_key,
        "WANDB_PROJECT": args.wandb_project,
        "WANDB_WATCH": args.wandb_watch,
        "WANDB_DIR": args.log_dir,
    }
    set_custom_env(env_overrides)

    # Make sure every working directory exists before anything writes to it.
    # Attributes are looked up one at a time so each directory is resolved
    # right before it is created.
    for dir_attr in ("model_dir", "log_dir", "model_output_dir"):
        os.makedirs(getattr(args, dir_attr), exist_ok=True)

    # Fetch the model into the model directory.
    download_model(args.model_id, args.model_dir)

    # Assemble and launch the torchtune command line.
    print("***** Single Device Training *****")
    tune_command = f"tune run {args.tune_recipe} --config {args.tune_finetune_yaml}"
    run_command(tune_command)