1023 Commits

Author SHA1 Message Date
root
559f9e2def fix repeat bos and pad id 2025-06-04 10:02:42 +00:00
root
80677a55f8 remove stats 2025-06-03 00:48:39 -07:00
root
5becf6927d remove concat three items 2025-06-03 00:18:21 -07:00
root
4c0396f8f2 support text2speech ultrachat 2025-06-02 23:16:03 -07:00
root
49256fa917 fix tts stage decode 2025-05-28 02:34:07 +00:00
root
5a7c72cb47 add tts task decode 2025-05-27 02:12:22 -07:00
root
1281d7a515 add tts training 2025-05-27 00:18:23 -07:00
root
39700d5c94 refactor train to reuse code 2025-05-26 19:53:16 -07:00
root
e6e1f3fa4f add tts stage 2025-05-23 01:53:05 -07:00
root
dd858f0cd1 support instruct s2s 2025-05-22 23:16:33 -07:00
root
9fff18edec refactor code 2025-05-22 19:14:52 -07:00
root
7a12d88d6c update 2025-05-21 22:18:57 -07:00
root
7aa6c80ddb add multi gpu processing 2025-05-21 21:54:59 -07:00
root
ca84aff5d6 remove cosyvoice lib 2025-05-20 00:52:09 -07:00
root
9cdd393f43 add server url 2025-05-20 07:48:49 +00:00
root
50fc1aba60 add multi-node 2025-05-18 18:47:22 -07:00
root
4a29430349 add loss type 2025-05-19 01:31:21 +00:00
root
e52581e69b support local_rank for multi-node 2025-05-16 00:02:12 -07:00
root
0e8c1db4d0 fix speed perturb issue 2025-05-15 22:45:04 -07:00
root
bfb4ebeb83 remove triton 2025-05-15 14:32:49 +00:00
root
f81363d324 add speech continuation pretraining 2025-05-15 14:16:51 +00:00
root
e65725810c fix mmsu 2025-05-13 09:13:12 +00:00
root
cbf3af31fd add voicebench eval 2025-05-13 05:37:11 +00:00
root
89781b9bb1 add cosyvoice2 decode 2025-05-12 10:06:59 +00:00
root
b20a0d0e35 add on the fly feature 2025-05-08 19:21:41 -07:00
root
bd2df570ad add debug script 2025-05-08 03:37:26 -07:00
root
37db65984c remove k2 dependency 2025-05-08 03:02:34 -07:00
root
e41c1cabd5 add dependency 2025-05-08 07:56:14 +00:00
root
7cc366d82d add en data, cosy2 token for training 2025-05-08 07:23:22 +00:00
root
2dd40b62ef add vocalnet en data 2025-05-08 06:29:46 +00:00
root
08be51a91f change pic 2025-04-29 10:09:57 +00:00
root
11bd3c9ad8 lint 2025-04-29 09:46:44 +00:00
root
360f0aa397 update README 2025-04-29 08:49:12 +00:00
root
448a4eeea7 update hf dataset loading into lhotse 2025-04-29 07:33:34 +00:00
Yuekai Zhang
d742043e75 refactor decode part 2025-04-25 18:31:43 +08:00
root
71a0a442a6 add history cache 2025-04-25 10:05:07 +00:00
Yuekai Zhang
47920c2336 add gradio demo 2025-04-25 16:05:37 +08:00
Yuekai Zhang
72addd40f5 change place 2025-04-25 14:22:16 +08:00
Yuekai Zhang
9a07363a8d remove unsed 2025-04-25 14:21:50 +08:00
Yuekai Zhang
6ea7ec8543 remove offline tab 2025-04-25 14:10:30 +08:00
Yuekai Zhang
6955639d22 add qwen omni web demo 2025-04-25 14:08:25 +08:00
root
3642dfd8c3 refactor code 2025-04-25 05:36:18 +00:00
root
2e9be46703 debug 2025-04-24 08:24:11 +00:00
root
478d56efd8 fix bugs when padding right 2025-04-23 07:33:27 +00:00
Yuekai Zhang
23fdef2fd3 add codec decode 2025-04-21 17:57:57 +08:00
Yuekai Zhang
09d81b44a7 change padding side name 2025-04-21 17:10:25 +08:00
Yuekai Zhang
7db40052d6 add flash attn support 2025-04-21 14:54:28 +08:00
root
b305cdacc0 fix padding side 2025-04-21 06:23:10 +00:00
root
bdb60f6ddc add codec lm 2025-04-21 01:00:06 +00:00
root
458d697acc fix batch_size>1 decoding bug 2025-04-15 13:41:33 +00:00