File size: 1,186 Bytes
e490e7e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
#!/bin/bash

# --- Environment handed to the evaluation processes -------------------------
# NOTE(review): presumably consumed by the HuggingFace tokenizers and decord
# libraries used by the evaluator; confirm against the evaluation code.
TOKENIZERS_PARALLELISM='false'
DECORD_DUPLICATE_WARNING_THRESHOLD=1.0
export TOKENIZERS_PARALLELISM DECORD_DUPLICATE_WARNING_THRESHOLD

# --- Evaluation settings -----------------------------------------------------
# INFER_DATA_ROOT: root that is scanned as <root>/<model>/<method>/<ep*>/<dataset>.
# RESULTS_DIR:     directory that receives one JSON result file per combination.
# METRICS:         value(s) forwarded to the evaluator's --metrics flag.
INFER_DATA_ROOT='samples/audio_eval'
RESULTS_DIR='./evaluation_results/audio_eval'
METRICS='audio-score'

# Parallel arrays: MAX_AUDIO_LENS[i] is the --max_audio_len_s value used for
# DATASETS[i] (presumably seconds, going by the flag name), so both must keep
# the same length and order.
DATASETS=('audiocaps' 'javismini')
MAX_AUDIO_LENS=(8.0 4.0)

#######################################
# Run the audio evaluation for every (model, method, epoch, dataset)
# combination found on disk.
#
# Layout scanned: ${INFER_DATA_ROOT}/<model>/<method>/<ep*>/<dataset>
# For each combination, `torchrun` launches `eval.javisbench.main` with a
# single process and writes its result to
# ${RESULTS_DIR}/<model>_<method>_<ep>_<dataset>.json.
#
# Globals:
#   INFER_DATA_ROOT, RESULTS_DIR, METRICS (read)
#   DATASETS, MAX_AUDIO_LENS (read; index-aligned arrays)
#   CUDA_VISIBLE_DEVICES (exported)
# Arguments:
#   None
# Outputs:
#   Diagnostics on stderr.
# Returns:
#   0 if every launched evaluation succeeded, 1 if at least one failed,
#   2 on invalid configuration.
#######################################
run_audio_eval() {
  local model folder method subfolder ep i dataset max_audio_len_s
  local input_file infer_data_dir output_file_path
  local gpu=0
  local failures=0
  local -a models=("Wan2.1")  # add "baseline" here to evaluate it as well
  local -a metric_args=()

  if [[ -z "${INFER_DATA_ROOT:-}" || -z "${RESULTS_DIR:-}" ]]; then
    printf 'error: INFER_DATA_ROOT and RESULTS_DIR must be set\n' >&2
    return 2
  fi

  # The two arrays are indexed together; a mismatch would silently pass an
  # empty --max_audio_len_s to the evaluator.
  if (( ${#DATASETS[@]} != ${#MAX_AUDIO_LENS[@]} )); then
    printf 'error: DATASETS (%d) and MAX_AUDIO_LENS (%d) differ in length\n' \
      "${#DATASETS[@]}" "${#MAX_AUDIO_LENS[@]}" >&2
    return 2
  fi

  # Ensure the directory for the result files exists before the first run.
  if ! mkdir -p -- "${RESULTS_DIR}"; then
    printf 'error: cannot create results dir: %s\n' "${RESULTS_DIR}" >&2
    return 2
  fi

  # Split METRICS on whitespace into separate arguments without exposing the
  # value to pathname expansion (an unquoted ${METRICS} would be globbed too).
  read -r -a metric_args <<< "${METRICS:-}"

  # The GPU selection does not vary per run, so export it once.
  export CUDA_VISIBLE_DEVICES="${gpu}"

  for model in "${models[@]}"; do
    for folder in "${INFER_DATA_ROOT}/${model}"/*; do
      # Without nullglob an unmatched pattern stays literal; this also skips
      # stray regular files sitting next to the method folders.
      [[ -d "${folder}" ]] || continue
      method=${folder##*/}

      for subfolder in "${folder}"/ep*; do
        [[ -d "${subfolder}" ]] || continue
        ep=${subfolder##*/}

        for i in "${!DATASETS[@]}"; do
          dataset=${DATASETS[$i]}
          max_audio_len_s=${MAX_AUDIO_LENS[$i]}

          # Debug overrides: uncomment to pin a single combination.
          # model="baseline"
          # method="audioldm2"
          # ep="ep-1"
          # dataset="javismini"
          # max_audio_len_s="4.0"

          input_file="data/meta/audio_eval/${dataset}.csv"
          infer_data_dir="${INFER_DATA_ROOT}/${model}/${method}/${ep}/${dataset}"
          output_file_path="${RESULTS_DIR}/${model}_${method}_${ep}_${dataset}.json"

          # Keep going after a failed run so one bad combination does not
          # block the rest, but remember it for the final status.
          if ! torchrun --nproc_per_node=1 -m eval.javisbench.main \
            --input_file "${input_file}" \
            --infer_data_dir "${infer_data_dir}" \
            --output_file "${output_file_path}" \
            --max_audio_len_s "${max_audio_len_s}" \
            --metrics "${metric_args[@]}"; then
            printf 'warning: evaluation failed for %s/%s/%s/%s\n' \
              "${model}" "${method}" "${ep}" "${dataset}" >&2
            failures=$(( failures + 1 ))
          fi
        done
      done
    done
  done

  if (( failures > 0 )); then
    printf 'error: %d evaluation run(s) failed\n' "${failures}" >&2
    return 1
  fi
  return 0
}

run_audio_eval