#!/bin/bash
# Copyright 2015   David Snyder
#           2019   Phani Sankar Nidadavolu
# Apache 2.0.
#
# This script creates the MUSAN data directory, which consists of
# speech (babble), music and noise files, and splits it into one
# subset per category. The result is used to create augmented data.
# The required dataset is freely available at http://www.openslr.org/17/

# The corpus can be cited as follows:
# @misc{musan2015,
#  author = {David Snyder and Guoguo Chen and Daniel Povey},
#  title = {{MUSAN}: {A} {M}usic, {S}peech, and {N}oise {C}orpus},
#  year = {2015},
#  eprint = {1510.08484},
#  note = {arXiv:1510.08484v1}
# }

# Stop at the first command that fails.
set -o errexit

# Default option values. They are assigned before parse_options.sh is sourced
# so that it can replace them from the command line (the usage text below
# advertises --sampling-rate and --use-vocals). 'stage' is not read anywhere
# else in this script.
stage=0
sampling_rate=16000
use_vocals=true

# Record the exact invocation in the log.
echo "$0 $*"

# Load the environment set-up from the current directory when it is present,
# then let parse_options.sh consume the leading --option arguments.
if [ -f path.sh ]; then
    . ./path.sh
fi
. parse_options.sh || exit 1

# Exactly two positional arguments (input_dir, output_dir) must remain after
# option parsing; otherwise print the usage text and exit with status 1.
# The text is emitted from a here-document so "$0" is never word-split or
# glob-expanded, and it goes to stderr because it reports an invocation error.
if [ "$#" -ne 2 ]; then
    cat >&2 <<EOF
USAGE: $0 input_dir output_dir
input_dir is the path where the MUSAN corpus is located
e.g: $0 /export/corpora/JHU/musan data
main options (for others, see top of script file)
  --sampling-rate <sampling frequency>        # Sampling frequency of source dir
  --use-vocals <true/false>        # Use vocals from music portion of MUSAN corpus
EOF
    exit 1
fi

# Positional arguments: where the MUSAN corpus lives, and the directory under
# which the musan, musan_music, musan_speech and musan_noise data directories
# are written.
in_dir=$1
data_dir=$2

# Scratch space for the per-category utterance lists. A uniquely named
# directory under local/ keeps concurrent runs from the same working directory
# from clobbering each other, and the EXIT trap removes it even when one of
# the steps below fails. NOTE: this replaces any EXIT trap set earlier.
mkdir -p local
tmp_dir=$(mktemp -d local/musan.tmp.XXXXXX) || exit 1
trap 'rm -rf -- "${tmp_dir}"' EXIT

# Build the combined data directory ${data_dir}/musan from the corpus.
steps/data/make_musan.py --use-vocals "${use_vocals}" \
                        --sampling-rate "${sampling_rate}" \
                        "${in_dir}" "${data_dir}/musan" || exit 1

utils/fix_data_dir.sh "${data_dir}/musan" || exit 1

# Select the utt2spk lines of each category: any line containing the category
# name is kept. grep returns non-zero when nothing is selected (or the file
# cannot be read); report that explicitly instead of dying silently.
for name in music speech noise; do
    grep "${name}" "${data_dir}/musan/utt2spk" \
        > "${tmp_dir}/utt2spk_${name}" || {
        echo "$0: could not select any '${name}' entries from" \
             "${data_dir}/musan/utt2spk" >&2
        exit 1
    }
done

# Carve one subset data directory per category out of the combined one.
for name in music speech noise; do
    utils/subset_data_dir.sh --utt-list "${tmp_dir}/utt2spk_${name}" \
        "${data_dir}/musan" "${data_dir}/musan_${name}" || exit 1
done

for name in music speech noise; do
    utils/fix_data_dir.sh "${data_dir}/musan_${name}" || exit 1
done

# The utterance lists are no longer needed; clean up now and drop the trap.
rm -rf -- "${tmp_dir}"
trap - EXIT

# Run utils/data/get_reco2dur.sh on each per-category data directory
# (presumably to generate its reco2dur file -- confirm against that script).
# The path is quoted so a data_dir containing spaces or glob characters is
# passed through as a single argument.
for name in speech noise music; do
    utils/data/get_reco2dur.sh "${data_dir}/musan_${name}"
done