File size: 1,203 Bytes
a84a65c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# Music generation from a text prompt.
#   -r  checkpoint file, -b  YAML config, --outdir  where results are written.
# NOTE(review): no --prompt flag is passed in this invocation (unlike the audio
# prompt command in this file); presumably the script falls back to a default
# prompt — TODO confirm.
python3 scripts/txt2audio_for_2cap_flow.py \
  --outdir output_dir_text \
  -r useful_ckpts/music_generation/119.ckpt \
  -b configs/txt2music-cfm1-cfg-LargeDiT3.yaml \
  --scale 3.0 \
  --vocoder-ckpt useful_ckpts/bigvnat

# Music generation over the test dataset.
# Same checkpoint/config as the music prompt run, but passes
# --test-dataset testset and writes to results/music/dataset.
python3 scripts/txt2audio_for_2cap_flow.py \
  --outdir results/music/dataset \
  -r useful_ckpts/music_generation/119.ckpt \
  -b configs/txt2music-cfm1-cfg-LargeDiT3.yaml \
  --scale 3.0 \
  --vocoder-ckpt useful_ckpts/bigvnat \
  --test-dataset testset

# Audio generation from a single text prompt.
# The prompt is single-quoted so the shell passes it as one literal argument.
# NOTE(review): the output directory is spelled "auido" — looks like a typo for
# "audio"; kept as-is because other tooling may read from this path. Confirm
# before renaming.
python3 scripts/txt2audio_for_2cap_flow.py \
  --prompt 'A train running on a railroad track followed by a vehicle door closing and a man talking in the distance while a train horn honks and railroad crossing warning signals ring' \
  --outdir results/auido/text \
  -r useful_ckpts/audio_generation/324.ckpt \
  -b configs/txt2audio-cfm1-cfg-LargeDiT3.yaml \
  --scale 3.0 \
  --vocoder-ckpt useful_ckpts/bigvnat

# Audio generation over the test dataset.
# Same checkpoint/config as the audio prompt run, but passes
# --test-dataset testset instead of --prompt.
# NOTE(review): the output directory is spelled "auido" — looks like a typo for
# "audio"; kept as-is because other tooling may read from this path. Confirm
# before renaming.
python3 scripts/txt2audio_for_2cap_flow.py \
  --outdir results/auido/dataset \
  -r useful_ckpts/audio_generation/324.ckpt \
  -b configs/txt2audio-cfm1-cfg-LargeDiT3.yaml \
  --scale 3.0 \
  --vocoder-ckpt useful_ckpts/bigvnat \
  --test-dataset testset