#!/bin/bash
#
# Runs the JavisBench evaluation module (eval.javisbench.main) through torchrun
# for every `epoch*` entry found under
#   samples/audio_video_eval/<aspect>/<model>/
# and writes one JSON file per (model, epoch) pair to
#   ./evaluation_results/audio_video_eval/<aspect>/<model>_<epoch>.json
#
# All paths are relative to the current working directory.
# Exit status: 0 when every evaluation succeeded (or nothing matched),
#              1 when at least one evaluation failed.

# `-e` is intentionally NOT enabled: a failing evaluation must not abort the
# remaining runs. Failures are collected and reported at the end instead.
set -uo pipefail

# Without nullglob an unmatched pattern stays in place as a literal string and
# would be handed to torchrun as if it were a real directory.
shopt -s nullglob

export TOKENIZERS_PARALLELISM="false"
export DECORD_DUPLICATE_WARNING_THRESHOLD=1.0
# Only insert the ':' separator when LD_LIBRARY_PATH already has a value; an
# empty leading entry makes the dynamic loader search the current directory.
export LD_LIBRARY_PATH="${LD_LIBRARY_PATH:+${LD_LIBRARY_PATH}:}/home/haofei/miniconda3/envs/javisdit/lib"
# Single-GPU evaluation pinned to device 7 (loop-invariant, so set once).
export CUDA_VISIBLE_DEVICES=7

MAX_FRAMES=16
IMAGE_SIZE=224
MAX_AUDIO_LEN_S=4.0
WINDOW_SIZE_S=2.0
WINDOW_OVERLAP_S=1.5

dataset="JavisBench-mini"
INPUT_FILE="data/eval/JavisBench/${dataset}.csv"
FVD_AVCACHE_PATH="data/eval/av_cache/${dataset}-vanilla-max4s.pt"

# Metrics to calculate, one array element per metric ("all" for all metrics).
# Each element is passed as a separate argument after --metrics.
# METRICS=(fvd+kvd+fad imagebind-score cxxp-score av-align av-score)
METRICS=(desync)

# Data paths whose evaluation did not complete successfully.
failed_runs=()

for aspect in sft; do
  RESULTS_DIR="./evaluation_results/audio_video_eval/${aspect}"

  for model_dir in "samples/audio_video_eval/${aspect}"/*; do
    model="${model_dir##*/}"

    for data_path in "${model_dir}"/epoch*; do
      printf '%s\n' "${data_path}"
      step="${data_path##*/}"

      # Make sure the output directory exists before the evaluator writes.
      if ! mkdir -p -- "${RESULTS_DIR}"; then
        failed_runs+=("${data_path}")
        continue
      fi

      # Evaluation
      torchrun --nproc_per_node=1 --master_port 23456 -m eval.javisbench.main \
        --input_file "${INPUT_FILE}" \
        --infer_data_dir "${data_path}" \
        --output_file "${RESULTS_DIR}/${model}_${step}.json" \
        --max_frames "${MAX_FRAMES}" \
        --image_size "${IMAGE_SIZE}" \
        --max_audio_len_s "${MAX_AUDIO_LEN_S}" \
        --window_size_s "${WINDOW_SIZE_S}" \
        --window_overlap_s "${WINDOW_OVERLAP_S}" \
        --fvd_avcache_path "${FVD_AVCACHE_PATH}" \
        --metrics "${METRICS[@]}" --exclude cavp_score --force_eval \
        || failed_runs+=("${data_path}")
    done
  done
done

# Surface failures instead of letting only the last run decide the exit code.
if (( ${#failed_runs[@]} > 0 )); then
  printf 'Evaluation failed for %d run(s):\n' "${#failed_runs[@]}" >&2
  printf '  %s\n' "${failed_runs[@]}" >&2
  exit 1
fi