Files
pretrain_kaiyuan2b/scripts/convert_megatron_weight_to_hf.sh
2026-05-06 15:06:07 +08:00

11 lines
337 B
Bash

# Run Megatron-LM's tools/checkpoint/convert.py on the smoke_gpt checkpoint
# directory and write the converted checkpoint to HF_OUT.
#
# NOTE(review): this script and the output directory are named "hf", but the
# command passes `--saver core`; presumably that emits a Megatron-core
# checkpoint rather than a Hugging Face one -- confirm this is intended.
# NOTE(review): the output name ends in "_15000", yet no iteration is passed
# to the converter; verify which iteration the loader actually picks up.

# Abort on the first failing command and on any unset variable, so a typo in
# a variable name cannot silently turn into an empty path argument.
# (No pipelines are used here, so the non-POSIX `pipefail` is not needed.)
set -eu

CKPT_DIR=/apps/yi/model_training/artifacts/checkpoints/smoke_gpt
MEGATRON_PATH=/apps/yi/model_training/Megatron-LM
HF_OUT=/apps/yi/model_training/artifacts/hf_models/smoke_gpt_15000

CONVERT_SCRIPT="${MEGATRON_PATH}/tools/checkpoint/convert.py"

# Fail fast with a clear message instead of a Python traceback later on.
if [ ! -f "${CONVERT_SCRIPT}" ]; then
  printf 'error: converter script not found: %s\n' "${CONVERT_SCRIPT}" >&2
  exit 1
fi
if [ ! -d "${CKPT_DIR}" ]; then
  printf 'error: checkpoint directory not found: %s\n' "${CKPT_DIR}" >&2
  exit 1
fi

# All expansions are quoted so the paths are passed as single arguments even
# if they ever contain whitespace or glob characters.
python "${CONVERT_SCRIPT}" \
  --model-type GPT \
  --loader core \
  --saver core \
  --load-dir "${CKPT_DIR}" \
  --save-dir "${HF_OUT}"