Skip to content
Snippets Groups Projects
Select Git revision
  • 6bae84358382a12eebdc3cfac96143e68fb8b0f4
  • master default protected
  • r1.8
  • r1.6
  • r1.9
  • r1.5
  • r1.7
  • r1.3
  • r1.4
  • r1.2
  • v1.6.0
  • v1.5.0
12 results

preprocess_librispeech.sh

Blame
  • preprocess_librispeech.sh 2.30 KiB
    #!/usr/bin/env bash
    # Copyright 2022 Huawei Technologies Co., Ltd
    #
    # Licensed under the Apache License, Version 2.0 (the "License");
    # you may not use this file except in compliance with the License.
    # You may obtain a copy of the License at
    #
    # http://www.apache.org/licenses/LICENSE-2.0
    #
    # Unless required by applicable law or agreed to in writing, software
    # distributed under the License is distributed on an "AS IS" BASIS,
    # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    # See the License for the specific language governing permissions and
    # limitations under the License.
    # ============================================================================
    # Usage: preprocess_librispeech.sh [SPEEDS]
    #
    # Runs ./utils/convert_librispeech.py once per LibriSpeech subset found
    # under /datasets/LibriSpeech. For a subset <name> the converter receives:
    #   --input_dir    /datasets/LibriSpeech/<name>
    #   --dest_dir     /datasets/LibriSpeech/<name>-wav
    #   --output_json  /datasets/LibriSpeech/librispeech-<name>-wav.json
    #
    # Arguments:
    #   SPEEDS  Optional. When non-empty, "--speed <SPEEDS>" is appended to the
    #           converter command line for the train-* subsets only. The value
    #           is split on whitespace, so several values may be passed as one
    #           quoted argument (e.g. "0.9 1.1").
    #
    # Exit status:
    #   0 if every conversion succeeded, 1 if at least one failed. Every subset
    #   is attempted regardless of earlier failures.
    SPEEDS=${1:-}

    DATA_ROOT=/datasets/LibriSpeech

    # Extra converter arguments for the training subsets. Initialised
    # explicitly so that nothing inherited from the calling environment can
    # end up on the command line when SPEEDS is empty.
    speed_args=()
    if [[ -n "$SPEEDS" ]]; then
        speed_values=()
        # Split SPEEDS on whitespace into separate words without triggering
        # pathname expansion. With -d '' the whole value is consumed (newlines
        # count as separators); read then reports end-of-input with a non-zero
        # status, which is expected and therefore ignored.
        read -r -d '' -a speed_values <<< "$SPEEDS" || true
        speed_args=(--speed "${speed_values[@]}")
    fi

    #######################################
    # Convert one LibriSpeech subset.
    # Globals:   DATA_ROOT (read)
    # Arguments: $1   - subset directory name, e.g. train-clean-100
    #            $2.. - extra arguments forwarded verbatim to the converter
    # Outputs:   an error line on stderr if the converter fails
    # Returns:   0 on success, 1 if the converter exited non-zero
    #######################################
    convert_subset() {
        local subset=$1
        shift
        if ! python ./utils/convert_librispeech.py \
            --input_dir "${DATA_ROOT}/${subset}" \
            --dest_dir "${DATA_ROOT}/${subset}-wav" \
            --output_json "${DATA_ROOT}/librispeech-${subset}-wav.json" \
            "$@"; then
            printf 'error: conversion of %s failed\n' "$subset" >&2
            return 1
        fi
    }

    # Remember whether any conversion failed so the caller gets a meaningful
    # exit status, while the remaining subsets are still processed.
    failed=0

    # Training subsets: these are the only ones that receive the --speed option.
    for subset in train-clean-100 train-clean-360 train-other-500; do
        convert_subset "$subset" "${speed_args[@]}" || failed=1
    done

    # Evaluation subsets: converted without any extra options.
    for subset in dev-clean dev-other test-clean test-other; do
        convert_subset "$subset" || failed=1
    done

    exit "$failed"