#!/bin/bash
# Copyright 2015 David Snyder
# Apache 2.0.
#
# This script, called by ../run.sh, creates the MUSAN
# data directory. The required dataset is freely available at
# http://www.openslr.org/17/
#
# Usage: <this-script> <musan-root-dir> <data-dir>
#
# Arguments:
#   $1 - directory holding the MUSAN corpus; passed to local/make_musan.py.
#   $2 - directory under which the output data directories are created.
#
# Outputs (all under <data-dir>):
#   musan         - the directory populated by local/make_musan.py
#   musan_music   - subset of musan whose utt2spk lines contain "music"
#   musan_speech  - subset of musan whose utt2spk lines contain "speech"
#   musan_noise   - subset of musan whose utt2spk lines contain "noise"
#
# Relative paths (local/, utils/) are resolved against the current working
# directory, so the script must be started from the directory that contains
# them.

set -euo pipefail

if [ $# -lt 2 ] || [ -z "$1" ] || [ -z "$2" ]; then
  echo "Usage: $0 <musan-root-dir> <data-dir>" >&2
  exit 1
fi

in_dir=$1
data_dir=$2
# Third argument of local/make_musan.py.
# NOTE(review): presumably controls whether music with vocals is kept --
# confirm against local/make_musan.py.
use_vocals='Y'
# Scratch directory for the per-category utterance lists.
tmp_dir=local/musan.tmp

if [ ! -d "${in_dir}" ]; then
  echo "$0: input directory '${in_dir}' does not exist" >&2
  exit 1
fi

# Remove the scratch directory on every exit path, including failures
# triggered by 'set -e'.
trap 'rm -rf -- "${tmp_dir}"' EXIT
mkdir -p "${tmp_dir}"

echo "Preparing ${data_dir}/musan..."
mkdir -p "${data_dir}/musan"
local/make_musan.py "${in_dir}" "${data_dir}/musan" "${use_vocals}"

utils/fix_data_dir.sh "${data_dir}/musan"

# Build all utterance lists first so that a missing category is detected
# before any subset directory is written.
for category in music speech noise; do
  if ! grep "${category}" "${data_dir}/musan/utt2spk" \
      > "${tmp_dir}/utt2spk_${category}"; then
    echo "$0: no '${category}' entries found in ${data_dir}/musan/utt2spk" >&2
    exit 1
  fi
done

for category in music speech noise; do
  utils/subset_data_dir.sh --utt-list "${tmp_dir}/utt2spk_${category}" \
    "${data_dir}/musan" "${data_dir}/musan_${category}"
done

for category in music speech noise; do
  utils/fix_data_dir.sh "${data_dir}/musan_${category}"
done