mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-09 18:12:19 +00:00
175 lines
8.2 KiB
YAML
175 lines
8.2 KiB
YAML
# Copyright 2021 Fangjun Kuang (csukuangfj@gmail.com)
|
|
|
|
# See ../../LICENSE for clarification regarding multiple authors
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
name: run-pre-trained-trandsucer-stateless-multi-datasets-librispeech-960h
|
|
|
|
on:
|
|
push:
|
|
branches:
|
|
- master
|
|
pull_request:
|
|
types: [labeled]
|
|
|
|
jobs:
|
|
run_pre_trained_transducer_stateless_multi_datasets_librispeech_960h:
|
|
if: github.event.label.name == 'ready' || github.event_name == 'push'
|
|
runs-on: ${{ matrix.os }}
|
|
strategy:
|
|
matrix:
|
|
os: [ubuntu-18.04]
|
|
python-version: [3.7, 3.8, 3.9]
|
|
|
|
fail-fast: false
|
|
|
|
steps:
|
|
- uses: actions/checkout@v2
|
|
with:
|
|
fetch-depth: 0
|
|
|
|
- name: Install graphviz
|
|
shell: bash
|
|
run: |
|
|
sudo apt-get -qq install graphviz
|
|
|
|
- name: Setup Python ${{ matrix.python-version }}
|
|
uses: actions/setup-python@v2
|
|
with:
|
|
python-version: ${{ matrix.python-version }}
|
|
cache: 'pip'
|
|
cache-dependency-path: '**/requirements-ci.txt'
|
|
|
|
- name: Install Python dependencies
|
|
run: |
|
|
grep -v '^#' ./requirements-ci.txt | xargs -n 1 -L 1 pip install
|
|
|
|
- name: Cache kaldifeat
|
|
id: my-cache
|
|
uses: actions/cache@v2
|
|
with:
|
|
path: |
|
|
~/tmp/kaldifeat
|
|
key: cache-tmp-${{ matrix.python-version }}
|
|
|
|
- name: Install kaldifeat
|
|
if: steps.my-cache.outputs.cache-hit != 'true'
|
|
shell: bash
|
|
run: |
|
|
mkdir -p ~/tmp
|
|
cd ~/tmp
|
|
git clone https://github.com/csukuangfj/kaldifeat
|
|
cd kaldifeat
|
|
mkdir build
|
|
cd build
|
|
cmake -DCMAKE_BUILD_TYPE=Release ..
|
|
make -j2 _kaldifeat
|
|
|
|
- name: Download pre-trained model
|
|
shell: bash
|
|
run: |
|
|
sudo apt-get -qq install git-lfs tree sox
|
|
cd egs/librispeech/ASR
|
|
mkdir tmp
|
|
cd tmp
|
|
git lfs install
|
|
git clone https://huggingface.co/csukuangfj/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01
|
|
|
|
|
|
cd ..
|
|
tree tmp
|
|
soxi tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/*.wav
|
|
ls -lh tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/*.wav
|
|
|
|
- name: Run greedy search decoding (max-sym-per-frame 1)
|
|
shell: bash
|
|
run: |
|
|
export PYTHONPATH=$PWD:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/kaldifeat/python:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/build/lib:$PYTHONPATH
|
|
cd egs/librispeech/ASR
|
|
./transducer_stateless_multi_datasets/pretrained.py \
|
|
--method greedy_search \
|
|
--max-sym-per-frame 1 \
|
|
--checkpoint ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/exp/pretrained.pt \
|
|
--bpe-model ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/data/lang_bpe_500/bpe.model \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1089-134686-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0002.wav
|
|
|
|
- name: Run greedy search decoding (max-sym-per-frame 2)
|
|
shell: bash
|
|
run: |
|
|
export PYTHONPATH=$PWD:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/kaldifeat/python:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/build/lib:$PYTHONPATH
|
|
cd egs/librispeech/ASR
|
|
./transducer_stateless_multi_datasets/pretrained.py \
|
|
--method greedy_search \
|
|
--max-sym-per-frame 2 \
|
|
--checkpoint ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/exp/pretrained.pt \
|
|
--bpe-model ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/data/lang_bpe_500/bpe.model \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1089-134686-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0002.wav
|
|
|
|
- name: Run greedy search decoding (max-sym-per-frame 3)
|
|
shell: bash
|
|
run: |
|
|
export PYTHONPATH=$PWD:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/kaldifeat/python:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/build/lib:$PYTHONPATH
|
|
cd egs/librispeech/ASR
|
|
./transducer_stateless_multi_datasets/pretrained.py \
|
|
--method greedy_search \
|
|
--max-sym-per-frame 3 \
|
|
--checkpoint ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/exp/pretrained.pt \
|
|
--bpe-model ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/data/lang_bpe_500/bpe.model \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1089-134686-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0002.wav
|
|
|
|
- name: Run beam search decoding
|
|
shell: bash
|
|
run: |
|
|
export PYTHONPATH=$PWD:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/kaldifeat/python:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/build/lib:$PYTHONPATH
|
|
cd egs/librispeech/ASR
|
|
./transducer_stateless_multi_datasets/pretrained.py \
|
|
--method beam_search \
|
|
--beam-size 4 \
|
|
--checkpoint ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/exp/pretrained.pt \
|
|
--bpe-model ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/data/lang_bpe_500/bpe.model \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1089-134686-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0002.wav
|
|
|
|
|
|
- name: Run modified beam search decoding
|
|
shell: bash
|
|
run: |
|
|
export PYTHONPATH=$PWD:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/kaldifeat/python:$PYTHONPATH
|
|
export PYTHONPATH=~/tmp/kaldifeat/build/lib:$PYTHONPATH
|
|
cd egs/librispeech/ASR
|
|
./transducer_stateless_multi_datasets/pretrained.py \
|
|
--method modified_beam_search \
|
|
--beam-size 4 \
|
|
--checkpoint ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/exp/pretrained.pt \
|
|
--bpe-model ./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/data/lang_bpe_500/bpe.model \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1089-134686-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0001.wav \
|
|
./tmp/icefall-asr-librispeech-transducer-stateless-multi-datasets-bpe-500-2022-03-01/test_wavs/1221-135766-0002.wav
|