NeMo / scripts /freesound_download_resample /download_resample_freesound.sh
camenduru's picture
thanks to NVIDIA ❤
7934b29
# Copyright (c) 2020, NVIDIA CORPORATION. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#!/bin/bash
# This is bash script actually run the downloading and resampling script.
# See instructions in freesound_download.py
# Change this arguments if you want
page_size=100 # Number of sounds per page
max_samples=200 # Maximum number of sound samples
min_filesize=0 # Minimum filesize allowed (in MB)
max_filesize=100 # Maximum filesize allowed (in MB)
if [[ $# -ne 3 ]]; then
echo "Require number of all files | data directory | resample data directory as arguments to the script"
exit 2
fi
NUM_ALL_FILES=$1
DATADIR=$2
RESAMPLE_DATADIR=$3
if [ ! -d "$DATADIR" ]; then
echo "Creating dir $DATADIR"
mkdir -p "$DATADIR"
fi
if [ ! -d "$RESAMPLE_DATADIR" ]; then
echo "Creating dir $RESAMPLE_DATADIR"
mkdir -p "$RESAMPLE_DATADIR"
fi
# we just need background categories for constructing dataset, feel free to include other (speech) categories for testing and training your VAD model
# background
categories=(
"Air brake"
"Static"
"Acoustic environment"
"Distortion"
"Tape hiss"
"Hubbub"
"Vibration"
"Cacophony"
"Throbbing"
"Reverberation"
"Inside, public space"
"Inside, small room"
"Echo"
"Outside, rural"
"Outside, natural"
"Outside, urban"
"Outside, manmade"
"Car"
"Bus"
"Traffic noise"
"Roadway noise"
"Truck"
"Emergency vehicle"
"Motorcycle"
"Aircraft engine"
"Aircraft"
"Helicopter"
"Bicycle"
"Skateboard"
"Subway, metro, underground"
"Railroad car"
"Train wagon"
"Train"
"Sailboat"
"Rowboat"
"Ship"
)
WAV_FILECOUNT="$(find $DATADIR -name '*.wav' -type f | wc -l)"
FLAC_FILECOUNT="$(find $DATADIR -name '*.flac' -type f | wc -l)"
FILECOUNT="$((WAV_FILECOUNT + FLAC_FILECOUNT))"
echo "File count: " $FILECOUNT
while((FILECOUNT <= NUM_ALL_FILES))
do
for category in "${categories[@]}"
do
python freesound_download.py --data_dir "${DATADIR}" --category "${category}" --page_size "${page_size}" --max_samples "${max_samples}" --min_filesize "${min_filesize}" --max_filesize "${max_filesize}"
ret=$?
if [ $ret -ne 0 ]; then
exit 1
fi
done
WAV_FILECOUNT="$(find $DATADIR -name '*.wav' -type f | wc -l)"
FLAC_FILECOUNT="$(find $DATADIR -name '*.flac' -type f | wc -l)"
FILECOUNT="$((WAV_FILECOUNT + FLAC_FILECOUNT))"
echo "Current file count is: " $FILECOUNT
done
# RESAMPLE
echo "Got enough data. Start resample!"
python freesound_resample.py --data_dir="${DATADIR}" --resampled_dir="${RESAMPLE_DATADIR}"
echo "Done resample data!"