From c5796e3f9afd96a3b70d701e88de891d415cd893 Mon Sep 17 00:00:00 2001
From: csukuangfj
Date: Fri, 14 Oct 2022 02:18:34 +0000
Subject: [PATCH] deploy: 11bff575863064b0d0ee6792b1505a82bff0a5fd
---
_sources/index.rst.txt | 1 +
.../export-model-state-dict.rst.txt | 135 +++++++++
_sources/model-export/export-ncnn.rst.txt | 12 +
_sources/model-export/export-onnx.rst.txt | 69 +++++
.../export-with-torch-jit-script.rst.txt | 58 ++++
.../export-with-torch-jit-trace.rst.txt | 69 +++++
_sources/model-export/index.rst.txt | 14 +
.../lstm_pruned_stateless_transducer.rst.txt | 2 +
contributing/code-style.html | 1 +
contributing/doc.html | 1 +
contributing/how-to-create-a-recipe.html | 1 +
contributing/index.html | 1 +
genindex.html | 1 +
huggingface/index.html | 1 +
huggingface/pretrained-models.html | 1 +
huggingface/spaces.html | 1 +
index.html | 9 +
installation/index.html | 5 +-
model-export/export-model-state-dict.html | 262 ++++++++++++++++++
model-export/export-ncnn.html | 125 +++++++++
model-export/export-onnx.html | 182 ++++++++++++
.../export-with-torch-jit-script.html | 172 ++++++++++++
model-export/export-with-torch-jit-trace.html | 183 ++++++++++++
model-export/index.html | 148 ++++++++++
objects.inv | Bin 719 -> 908 bytes
recipes/aishell/conformer_ctc.html | 1 +
recipes/aishell/index.html | 1 +
recipes/aishell/stateless_transducer.html | 1 +
recipes/aishell/tdnn_lstm_ctc.html | 1 +
recipes/index.html | 5 +-
recipes/librispeech/conformer_ctc.html | 1 +
recipes/librispeech/index.html | 1 +
.../lstm_pruned_stateless_transducer.html | 7 +-
recipes/librispeech/tdnn_lstm_ctc.html | 1 +
recipes/timit/index.html | 1 +
recipes/timit/tdnn_ligru_ctc.html | 1 +
recipes/timit/tdnn_lstm_ctc.html | 1 +
recipes/yesno/index.html | 1 +
recipes/yesno/tdnn.html | 1 +
search.html | 1 +
searchindex.js | 2 +-
41 files changed, 1473 insertions(+), 8 deletions(-)
create mode 100644 _sources/model-export/export-model-state-dict.rst.txt
create mode 100644 _sources/model-export/export-ncnn.rst.txt
create mode 100644 _sources/model-export/export-onnx.rst.txt
create mode 100644 _sources/model-export/export-with-torch-jit-script.rst.txt
create mode 100644 _sources/model-export/export-with-torch-jit-trace.rst.txt
create mode 100644 _sources/model-export/index.rst.txt
create mode 100644 model-export/export-model-state-dict.html
create mode 100644 model-export/export-ncnn.html
create mode 100644 model-export/export-onnx.html
create mode 100644 model-export/export-with-torch-jit-script.html
create mode 100644 model-export/export-with-torch-jit-trace.html
create mode 100644 model-export/index.html
diff --git a/_sources/index.rst.txt b/_sources/index.rst.txt
index 29491e3dc..be9977ca9 100644
--- a/_sources/index.rst.txt
+++ b/_sources/index.rst.txt
@@ -21,6 +21,7 @@ speech recognition recipes using `k2 `_.
:caption: Contents:
installation/index
+ model-export/index
recipes/index
contributing/index
huggingface/index
diff --git a/_sources/model-export/export-model-state-dict.rst.txt b/_sources/model-export/export-model-state-dict.rst.txt
new file mode 100644
index 000000000..c3bbd5708
--- /dev/null
+++ b/_sources/model-export/export-model-state-dict.rst.txt
@@ -0,0 +1,135 @@
+Export model.state_dict()
+=========================
+
+When to use it
+--------------
+
+During model training, we save checkpoints periodically to disk.
+
+A checkpoint contains the following information:
+
+ - ``model.state_dict()``
+ - ``optimizer.state_dict()``
+ - and some other information related to training
+
+When we need to resume the training process from some point, we need a checkpoint.
+However, if we want to publish the model for inference, then only
+``model.state_dict()`` is needed. In this case, we need to strip all other information
+except ``model.state_dict()`` to reduce the file size of the published model.
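+
+The snippet below is a minimal sketch of that stripping step, assuming the
+training checkpoint stores the weights under the key ``"model"`` (the same key
+used in the exported ``pretrained.pt`` described later); the file names are
+for illustration only:
+
+.. code-block:: python
+
+   import torch
+
+   # Load the full training checkpoint (file name is hypothetical).
+   checkpoint = torch.load("epoch-20.pt", map_location="cpu")
+
+   # Keep only the model weights; drop optimizer state and other
+   # training-related information to shrink the published file.
+   torch.save({"model": checkpoint["model"]}, "pretrained.pt")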
+
+How to export
+-------------
+
+Every recipe contains a file ``export.py`` that you can use to
+export ``model.state_dict()`` from one or more checkpoints.
+
+.. hint::
+
+ Each ``export.py`` contains well-documented usage information.
+
+In the following, we use
+`<https://github.com/k2-fsa/icefall/blob/master/egs/librispeech/ASR/pruned_transducer_stateless3/export.py>`_
+as an example.
+
+.. note::
+
+ The steps for other recipes are almost the same.
+
+.. code-block:: bash
+
+ cd egs/librispeech/ASR
+
+ ./pruned_transducer_stateless3/export.py \
+ --exp-dir ./pruned_transducer_stateless3/exp \
+ --bpe-model data/lang_bpe_500/bpe.model \
+ --epoch 20 \
+ --avg 10
+
+will generate a file ``pruned_transducer_stateless3/exp/pretrained.pt``, which
+is a dict containing ``{"model": model.state_dict()}`` saved by ``torch.save()``.
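+
+To consume such a file, an inference script only needs to rebuild the model
+and load the saved state dict. The following is a rough sketch; constructing
+the model itself is assumed to happen elsewhere (as ``pretrained.py`` does):
+
+.. code-block:: python
+
+   import torch
+
+   def load_pretrained(model: torch.nn.Module, filename: str) -> torch.nn.Module:
+       """Load weights exported by export.py into an already-built model."""
+       checkpoint = torch.load(filename, map_location="cpu")
+       model.load_state_dict(checkpoint["model"])
+       model.eval()
+       return model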
+
+How to use the exported model
+-----------------------------
+
+For each recipe, we provide pretrained models hosted on Hugging Face.
+You can find links to the pretrained models in the ``RESULTS.md`` file of each dataset.
+
+In the following, we demonstrate how to use the pretrained model from
+`<https://huggingface.co/csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13>`_.
+
+.. code-block:: bash
+
+ cd egs/librispeech/ASR
+
+ git lfs install
+ git clone https://huggingface.co/csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13
+
+After cloning the repo with ``git lfs``, you will find several files in the folder
+``icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/exp``
+that have a prefix ``pretrained-``. Those files contain ``model.state_dict()``
+exported by the above ``export.py``.
+
+In each recipe, there is also a file ``pretrained.py``, which can load
+``pretrained-xxx.pt`` and use it to decode sound files. The following is an example:
+
+.. code-block:: bash
+
+ cd egs/librispeech/ASR
+
+ ./pruned_transducer_stateless3/pretrained.py \
+ --checkpoint ./icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/exp/pretrained-iter-1224000-avg-14.pt \
+ --bpe-model ./icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/data/lang_bpe_500/bpe.model \
+ --method greedy_search \
+ ./icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/test_wavs/1089-134686-0001.wav \
+ ./icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/test_wavs/1221-135766-0001.wav \
+ ./icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/test_wavs/1221-135766-0002.wav
+
+The above commands show how to use the exported model with ``pretrained.py`` to
+decode multiple sound files. Its output is given as follows for reference:
+
+.. literalinclude:: ./code/export-model-state-dict-pretrained-out.txt
+
+Use the exported model to run decode.py
+---------------------------------------
+
+When we publish the model, we always note down its WERs on some test
+dataset in ``RESULTS.md``. This section describes how to use the
+pretrained model to reproduce the WER.
+
+.. code-block:: bash
+
+ cd egs/librispeech/ASR
+ git lfs install
+ git clone https://huggingface.co/csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13
+
+ cd icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/exp
+ ln -s pretrained-iter-1224000-avg-14.pt epoch-9999.pt
+ cd ../..
+
+We create a symlink named ``epoch-9999.pt`` that points to ``pretrained-iter-1224000-avg-14.pt``,
+so that we can pass ``--epoch 9999 --avg 1`` to ``decode.py`` in the following
+command:
+
+.. code-block:: bash
+
+ ./pruned_transducer_stateless3/decode.py \
+ --epoch 9999 \
+ --avg 1 \
+ --exp-dir ./icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/exp \
+ --lang-dir ./icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/data/lang_bpe_500 \
+ --max-duration 600 \
+ --decoding-method greedy_search
+
+You will find the decoding results in
+``./icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13/exp/greedy_search``.
+
+.. caution::
+
+ For some recipes, you also need to pass ``--use-averaged-model False``
+ to ``decode.py``. The reason is that the exported pretrained model is already
+ the averaged one.
+
+.. hint::
+
+ Before running ``decode.py``, we assume that you have already run
+ ``prepare.sh`` to prepare the test dataset.
diff --git a/_sources/model-export/export-ncnn.rst.txt b/_sources/model-export/export-ncnn.rst.txt
new file mode 100644
index 000000000..3dbb8b514
--- /dev/null
+++ b/_sources/model-export/export-ncnn.rst.txt
@@ -0,0 +1,12 @@
+Export to ncnn
+==============
+
+We support exporting LSTM transducer models to `ncnn <https://github.com/tencent/ncnn>`_.
+
+Please refer to :ref:`export-model-for-ncnn` for details.
+
+We also provide `sherpa-ncnn <https://github.com/k2-fsa/sherpa-ncnn>`_,
+which performs speech recognition using ``ncnn`` with exported models.
+It has been tested on Linux, macOS, Windows, and Raspberry Pi. The project is
+self-contained and can be statically linked to produce a binary containing
+everything needed.
diff --git a/_sources/model-export/export-onnx.rst.txt b/_sources/model-export/export-onnx.rst.txt
new file mode 100644
index 000000000..dd4b3437a
--- /dev/null
+++ b/_sources/model-export/export-onnx.rst.txt
@@ -0,0 +1,69 @@
+Export to ONNX
+==============
+
+In this section, we describe how to export models to ONNX.
+
+.. hint::
+
+ Only non-streaming conformer transducer models are tested.
+
+
+When to use it
+--------------
+
+If you want to run the pretrained model with an inference framework
+that supports ONNX, you can export the model to ONNX format.
+
+
+How to export
+-------------
+
+We use
+`<https://github.com/k2-fsa/icefall/blob/master/egs/librispeech/ASR/pruned_transducer_stateless3/export.py>`_
+as an example in the following.
+
+.. code-block:: bash
+
+ cd egs/librispeech/ASR
+ epoch=14
+ avg=2
+
+ ./pruned_transducer_stateless3/export.py \
+ --exp-dir ./pruned_transducer_stateless3/exp \
+ --bpe-model data/lang_bpe_500/bpe.model \
+ --epoch $epoch \
+ --avg $avg \
+ --onnx 1
+
+It will generate the following files inside ``pruned_transducer_stateless3/exp``:
+
+ - ``encoder.onnx``
+ - ``decoder.onnx``
+ - ``joiner.onnx``
+ - ``joiner_encoder_proj.onnx``
+ - ``joiner_decoder_proj.onnx``
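+
+If you have the ``onnx`` Python package installed, you can optionally
+sanity-check the exported graphs before using them; this is only an extra
+check, not part of the export itself, and the path below is an example:
+
+.. code-block:: python
+
+   import onnx
+
+   # Load and validate one of the exported graphs.
+   model = onnx.load("pruned_transducer_stateless3/exp/encoder.onnx")
+   onnx.checker.check_model(model)
+
+   # Print a human-readable summary of the graph.
+   print(onnx.helper.printable_graph(model.graph))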
+
+You can use ``./pruned_transducer_stateless3/onnx_pretrained.py`` to decode
+sound files with the generated files:
+
+.. code-block:: bash
+
+ ./pruned_transducer_stateless3/onnx_pretrained.py \
+ --bpe-model ./data/lang_bpe_500/bpe.model \
+ --encoder-model-filename ./pruned_transducer_stateless3/exp/encoder.onnx \
+ --decoder-model-filename ./pruned_transducer_stateless3/exp/decoder.onnx \
+ --joiner-model-filename ./pruned_transducer_stateless3/exp/joiner.onnx \
+ --joiner-encoder-proj-model-filename ./pruned_transducer_stateless3/exp/joiner_encoder_proj.onnx \
+ --joiner-decoder-proj-model-filename ./pruned_transducer_stateless3/exp/joiner_decoder_proj.onnx \
+ /path/to/foo.wav \
+ /path/to/bar.wav \
+ /path/to/baz.wav
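+
+If you want to load the exported files directly with ``onnxruntime``, the
+sketch below creates a CPU session for the encoder and lists its inputs and
+outputs; it is only an illustration, since feature extraction and decoding
+are handled by ``onnx_pretrained.py``:
+
+.. code-block:: python
+
+   import onnxruntime as ort
+
+   # Create a CPU inference session for the exported encoder (path is an example).
+   session = ort.InferenceSession(
+       "pruned_transducer_stateless3/exp/encoder.onnx",
+       providers=["CPUExecutionProvider"],
+   )
+
+   # Inspect the expected inputs and produced outputs of the graph.
+   for node in session.get_inputs():
+       print("input:", node.name, node.shape)
+   for node in session.get_outputs():
+       print("output:", node.name, node.shape)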
+
+
+How to use the exported model
+-----------------------------
+
+We also provide ``_, which performs
+speech recognition using `onnxruntime <https://github.com/microsoft/onnxruntime>`_
+with exported models.
+It has been tested on Linux, macOS, and Windows.
diff --git a/_sources/model-export/export-with-torch-jit-script.rst.txt b/_sources/model-export/export-with-torch-jit-script.rst.txt
new file mode 100644
index 000000000..a041dc1d5
--- /dev/null
+++ b/_sources/model-export/export-with-torch-jit-script.rst.txt
@@ -0,0 +1,58 @@
+.. _export-model-with-torch-jit-script:
+
+Export model with torch.jit.script()
+=====================================
+
+In this section, we describe how to export a model via
+``torch.jit.script()``.
+
+When to use it
+--------------
+
+If we want to use our trained model with TorchScript,
+we can use ``torch.jit.script()``.
+
+.. hint::
+
+ See :ref:`export-model-with-torch-jit-trace`
+ if you want to use ``torch.jit.trace()``.
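+
+As a toy illustration (this is not icefall code), ``torch.jit.script()``
+compiles the Python code of ``forward()``, so data-dependent control flow is
+preserved in the exported module:
+
+.. code-block:: python
+
+   import torch
+
+   class Toy(torch.nn.Module):
+       def forward(self, x: torch.Tensor) -> torch.Tensor:
+           # This branch depends on the input value; scripting keeps it.
+           if x.sum() > 0:
+               return x
+           return -x
+
+   scripted = torch.jit.script(Toy())
+   scripted.save("toy_scripted.pt")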
+
+How to export
+-------------
+
+We use
+`<https://github.com/k2-fsa/icefall/blob/master/egs/librispeech/ASR/pruned_transducer_stateless3/export.py>`_
+as an example in the following.
+
+.. code-block:: bash
+
+ cd egs/librispeech/ASR
+ epoch=14
+ avg=1
+
+ ./pruned_transducer_stateless3/export.py \
+ --exp-dir ./pruned_transducer_stateless3/exp \
+ --bpe-model data/lang_bpe_500/bpe.model \
+ --epoch $epoch \
+ --avg $avg \
+ --jit 1
+
+It will generate a file ``cpu_jit.pt`` in ``pruned_transducer_stateless3/exp``.
+
+.. caution::
+
+ Don't be confused by ``cpu`` in ``cpu_jit.pt``. We move all parameters
+ to CPU before saving it into a ``pt`` file; that's why we use ``cpu``
+ in the filename.
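+
+Once exported, ``cpu_jit.pt`` can be loaded without the original Python model
+definition, either from C++ with libtorch or from Python as in the minimal
+sketch below (the path follows the command above):
+
+.. code-block:: python
+
+   import torch
+
+   # Load the scripted model produced by export.py --jit 1.
+   model = torch.jit.load("pruned_transducer_stateless3/exp/cpu_jit.pt")
+   model.eval()
+
+   # Move it to another device if needed, e.g.:
+   # model = model.to("cuda")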
+
+How to use the exported model
+-----------------------------
+
+Please refer to the following pages for usage:
+
+- ``_
+- ``_
+- ``_
+- ``_
+- ``_
+- ``_
diff --git a/_sources/model-export/export-with-torch-jit-trace.rst.txt b/_sources/model-export/export-with-torch-jit-trace.rst.txt
new file mode 100644
index 000000000..506459909
--- /dev/null
+++ b/_sources/model-export/export-with-torch-jit-trace.rst.txt
@@ -0,0 +1,69 @@
+.. _export-model-with-torch-jit-trace:
+
+Export model with torch.jit.trace()
+===================================
+
+In this section, we describe how to export a model via
+``torch.jit.trace()``.
+
+When to use it
+--------------
+
+If we want to use our trained model with TorchScript,
+we can use ``torch.jit.trace()``.
+
+.. hint::
+
+ See :ref:`export-model-with-torch-jit-script`
+ if you want to use ``torch.jit.script()``.
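+
+As a toy illustration (this is not icefall code), ``torch.jit.trace()`` runs
+the model once on example inputs and records the operations it executes:
+
+.. code-block:: python
+
+   import torch
+
+   model = torch.nn.Linear(4, 2)
+   example = torch.randn(1, 4)
+
+   # Record the operations executed for this example input.
+   traced = torch.jit.trace(model, example)
+   traced.save("linear_traced.pt")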
+
+How to export
+-------------
+
+We use
+`<https://github.com/k2-fsa/icefall/blob/master/egs/librispeech/ASR/lstm_transducer_stateless2/export.py>`_
+as an example in the following.
+
+.. code-block:: bash
+
+ iter=468000
+ avg=16
+
+ cd egs/librispeech/ASR
+
+ ./lstm_transducer_stateless2/export.py \
+ --exp-dir ./lstm_transducer_stateless2/exp \
+ --bpe-model data/lang_bpe_500/bpe.model \
+ --iter $iter \
+ --avg $avg \
+ --jit-trace 1
+
+It will generate three files inside ``lstm_transducer_stateless2/exp``:
+
+ - ``encoder_jit_trace.pt``
+ - ``decoder_jit_trace.pt``
+ - ``joiner_jit_trace.pt``
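+
+Each of these files is a standalone TorchScript module. Roughly speaking,
+``jit_pretrained.py`` loads them as in the sketch below (a simplified
+illustration, not the script's actual code; paths follow the export command
+above):
+
+.. code-block:: python
+
+   import torch
+
+   encoder = torch.jit.load("lstm_transducer_stateless2/exp/encoder_jit_trace.pt")
+   decoder = torch.jit.load("lstm_transducer_stateless2/exp/decoder_jit_trace.pt")
+   joiner = torch.jit.load("lstm_transducer_stateless2/exp/joiner_jit_trace.pt")
+
+   encoder.eval()
+   decoder.eval()
+   joiner.eval()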
+
+You can use
+`<https://github.com/k2-fsa/icefall/blob/master/egs/librispeech/ASR/lstm_transducer_stateless2/jit_pretrained.py>`_
+to decode sound files with the following commands:
+
+.. code-block:: bash
+
+ cd egs/librispeech/ASR
+ ./lstm_transducer_stateless2/jit_pretrained.py \
+ --bpe-model ./data/lang_bpe_500/bpe.model \
+ --encoder-model-filename ./lstm_transducer_stateless2/exp/encoder_jit_trace.pt \
+ --decoder-model-filename ./lstm_transducer_stateless2/exp/decoder_jit_trace.pt \
+ --joiner-model-filename ./lstm_transducer_stateless2/exp/joiner_jit_trace.pt \
+ /path/to/foo.wav \
+ /path/to/bar.wav \
+ /path/to/baz.wav
+
+How to use the exported models
+------------------------------
+
+Please refer to
+``_
+for its usage in `sherpa <https://github.com/k2-fsa/sherpa>`_.
+You can also find pretrained models there.
diff --git a/_sources/model-export/index.rst.txt b/_sources/model-export/index.rst.txt
new file mode 100644
index 000000000..9b7a2ee2d
--- /dev/null
+++ b/_sources/model-export/index.rst.txt
@@ -0,0 +1,14 @@
+Model export
+============
+
+In this section, we describe various ways to export models.
+
+
+
+.. toctree::
+
+ export-model-state-dict
+ export-with-torch-jit-trace
+ export-with-torch-jit-script
+ export-onnx
+ export-ncnn
diff --git a/_sources/recipes/librispeech/lstm_pruned_stateless_transducer.rst.txt b/_sources/recipes/librispeech/lstm_pruned_stateless_transducer.rst.txt
index b9d5bdcba..643855cc2 100644
--- a/_sources/recipes/librispeech/lstm_pruned_stateless_transducer.rst.txt
+++ b/_sources/recipes/librispeech/lstm_pruned_stateless_transducer.rst.txt
@@ -515,6 +515,8 @@ To use the generated files with ``./lstm_transducer_stateless2/jit_pretrained``:
Please see ``_
for how to use the exported models in ``sherpa``.
+.. _export-model-for-ncnn:
+
Export model for ncnn
~~~~~~~~~~~~~~~~~~~~~