# JAV-Gen/scripts/bash/train.sh
# (Hugging Face page residue, kept for provenance: uploader avatar "kaiw7";
#  commit message "Upload folder using huggingface_hub"; commit e490e7e, verified)
# NOTE: "~" is not expanded inside double quotes, so $HOME is used instead.
# export CUDA_HOME="$HOME/shared/kail/workspace/envs/cuda-12.2"
# export PATH="$HOME/shared/kail/workspace/envs/cuda-12.2/bin/:$PATH"
# GPUs made visible to the training processes (device indices 6 and 7).
CUDA_VISIBLE_DEVICES="6,7"
export CUDA_VISIBLE_DEVICES

## Audio PreTrain
# Active selection for this stage: the config file handed to scripts/train.py
# and the CSV passed to it via --data-path.
cfg_path="configs/wan2.1/train/stage1_audio.py"
data_path="/root/workspace/projects/JavisDiT-dev/debug/meta/JavisDiT_train_audio_v1.csv"
# Alternative configs for this stage (uncomment one to override cfg_path):
# cfg_path="debug/cfg/stage1_audio.py"
# cfg_path="configs/wan2.1/ablation/audio_pe/interleave_window.py"
## AudioVideo PreTrain
# data_path="/mnt/HithinkOmniSSD/user_workspace/liukai4/datasets/JavisDiT/train/video_dev/TAVGBench_train_fps16_sft_120k_ths.csv"
# data_path="/mnt/HithinkOmniSSD/user_workspace/liukai4/datasets/JavisDiT/train/video/TAVGBench_train_fps16_sft_330k_ths.csv"
# cfg_path="configs/wan2.1/train/stage2_audio_video.py" # 37G-22:01-17:38
# cfg_path="configs/wan2.1/ablation/avsync/frameattn.py" # 44G-27:58-24:27
# cfg_path="configs/wan2.1/ablation/avsync/frameattnfast.py" # 44G-25:27-21:16
# cfg_path='/mnt/HithinkOmniSSD/user_workspace/liukai4/projects/JavisDiT-dev/configs/wan2.1/ablation/avsync/interleave_window.py'
# ## AudioVideo DPO
# data_path="/mnt/HithinkOmniSSD/user_workspace/liukai4/datasets/JavisDiT/train/dpo_gen/v1_interleave_330kep2/TAVGBench_train_fps16_dpo_30k_consistency_macro_ths.csv"
# cfg_path="configs/wan2.1/train/stage3_audio_video_dpo.py"
# Launch scripts/train.py through torchrun in standalone mode with 2 worker
# processes; keep --nproc_per_node in sync with the number of GPUs listed in
# CUDA_VISIBLE_DEVICES earlier in this script.
#   cfg_path  - config file passed as the positional argument
#   data_path - CSV passed via --data-path
# Both expansions are quoted so that a path containing spaces or glob
# characters reaches the trainer as one literal argument instead of being
# word-split or expanded by the shell.
torchrun --standalone --nproc_per_node 2 \
  scripts/train.py \
  "${cfg_path}" \
  --data-path "${data_path}"
# export CUDA_VISIBLE_DEVICES="1,6"
# nohup python scripts/misc/auto_resume.py >nohup.log 2>&1 &