14 Commits

Author SHA1 Message Date
root
7cc366d82d add en data, cosy2 token for training 2025-05-08 07:23:22 +00:00
root
2dd40b62ef add vocalnet en data 2025-05-08 06:29:46 +00:00
root
11bd3c9ad8 lint 2025-04-29 09:46:44 +00:00
root
448a4eeea7 update hf dataset loading into lhotse 2025-04-29 07:33:34 +00:00
root
71a0a442a6 add history cache 2025-04-25 10:05:07 +00:00
root
3642dfd8c3 refactor code 2025-04-25 05:36:18 +00:00
root
2e9be46703 debug 2025-04-24 08:24:11 +00:00
root
478d56efd8 fix bugs when padding right 2025-04-23 07:33:27 +00:00
root
bdb60f6ddc add codec lm 2025-04-21 01:00:06 +00:00
root
0c02da82ac refine decoding method 2025-04-15 06:53:20 +00:00
root
3ad075af60 s2t training 2025-04-15 02:16:03 +00:00
root
6b69276b19 add training stage 2025-04-11 06:51:51 +00:00
root
e6897b10fa make asr decode results align 2025-04-11 06:51:51 +00:00
root
cca562d538 migrate from speech llm 2025-04-11 06:51:50 +00:00