# Copyright 2021 Fangjun Kuang (csukuangfj@gmail.com) # See ../../LICENSE for clarification regarding multiple authors # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. name: run-pre-trained-trandsucer-stateless-multi-datasets-librispeech-100h on: push: branches: - master pull_request: types: [labeled] schedule: # minute (0-59) # hour (0-23) # day of the month (1-31) # month (1-12) # day of the week (0-6) # nightly build at 15:50 UTC time every day - cron: "50 15 * * *" jobs: run_pre_trained_transducer_stateless_multi_datasets_librispeech_100h: if: github.event.label.name == 'ready' || github.event.label.name == 'run-decode' || github.event_name == 'push' || github.event_name == 'schedule' runs-on: ${{ matrix.os }} strategy: matrix: os: [ubuntu-18.04] python-version: [3.7, 3.8, 3.9] fail-fast: false steps: - uses: actions/checkout@v2 with: fetch-depth: 0 - name: Setup Python ${{ matrix.python-version }} uses: actions/setup-python@v2 with: python-version: ${{ matrix.python-version }} cache: 'pip' cache-dependency-path: '**/requirements-ci.txt' - name: Install Python dependencies run: | grep -v '^#' ./requirements-ci.txt | xargs -n 1 -L 1 pip install - name: Cache kaldifeat id: my-cache uses: actions/cache@v2 with: path: | ~/tmp/kaldifeat key: cache-tmp-${{ matrix.python-version }} - name: Install kaldifeat if: steps.my-cache.outputs.cache-hit != 'true' shell: bash run: | .github/scripts/install-kaldifeat.sh - name: Cache LibriSpeech test-clean and test-other datasets id: libri-test-clean-and-test-other-data uses: actions/cache@v2 with: path: | ~/tmp/download key: cache-libri-test-clean-and-test-other - name: Download LibriSpeech test-clean and test-other if: steps.libri-test-clean-and-test-other-data.outputs.cache-hit != 'true' shell: bash run: | .github/scripts/download-librispeech-test-clean-and-test-other-dataset.sh - name: Prepare manifests for LibriSpeech test-clean and test-other shell: bash run: | .github/scripts/prepare-librispeech-test-clean-and-test-other-manifests.sh - name: Cache LibriSpeech test-clean and test-other fbank features id: libri-test-clean-and-test-other-fbank uses: actions/cache@v2 with: path: | ~/tmp/fbank-libri key: cache-libri-fbank-test-clean-and-test-other - name: Compute fbank for LibriSpeech test-clean and test-other if: steps.libri-test-clean-and-test-other-fbank.outputs.cache-hit != 'true' shell: bash run: | .github/scripts/compute-fbank-librispeech-test-clean-and-test-other.sh - name: Inference with pre-trained model shell: bash env: GITHUB_EVENT_NAME: ${{ github.event_name }} GITHUB_EVENT_LABEL_NAME: ${{ github.event.label.name }} run: | mkdir -p egs/librispeech/ASR/data ln -sfv ~/tmp/fbank-libri egs/librispeech/ASR/data/fbank ls -lh egs/librispeech/ASR/data/* sudo apt-get -qq install git-lfs tree sox export PYTHONPATH=$PWD:$PYTHONPATH export PYTHONPATH=~/tmp/kaldifeat/kaldifeat/python:$PYTHONPATH export PYTHONPATH=~/tmp/kaldifeat/build/lib:$PYTHONPATH .github/scripts/run-pre-trained-transducer-stateless-librispeech-100h.sh - name: Display decoding results for transducer_stateless_multi_datasets if: github.event_name == 'schedule' || github.event.label.name == 'run-decode' shell: bash run: | cd egs/librispeech/ASR/ tree ./transducer_stateless_multi_datasets/exp cd transducer_stateless_multi_datasets echo "results for transducer_stateless_multi_datasets" echo "===greedy search===" find exp/greedy_search -name "log-*" -exec grep -n --color "best for test-clean" {} + | sort -n -k2 find exp/greedy_search -name "log-*" -exec grep -n --color "best for test-other" {} + | sort -n -k2 echo "===fast_beam_search===" find exp/fast_beam_search -name "log-*" -exec grep -n --color "best for test-clean" {} + | sort -n -k2 find exp/fast_beam_search -name "log-*" -exec grep -n --color "best for test-other" {} + | sort -n -k2 echo "===modified beam search===" find exp/modified_beam_search -name "log-*" -exec grep -n --color "best for test-clean" {} + | sort -n -k2 find exp/modified_beam_search -name "log-*" -exec grep -n --color "best for test-other" {} + | sort -n -k2 - name: Upload decoding results for transducer_stateless_multi_datasets uses: actions/upload-artifact@v2 if: github.event_name == 'schedule' || github.event.label.name == 'run-decode' with: name: torch-${{ matrix.torch }}-python-${{ matrix.python-version }}-ubuntu-18.04-cpu-transducer_stateless_multi_datasets-100h-2022-02-21 path: egs/librispeech/ASR/transducer_stateless_multi_datasets/exp/