Merge 7cdc0da3391e5c3cdd8b7ee9a9db52a7a1d6e641 into 693f069de73fd91d7c2009571245d97221cc3a3f

This commit is contained in:
Peter Ross 2025-10-08 21:44:26 +05:30 committed by GitHub
commit 62abcc8f6f
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -55,6 +55,12 @@ def get_args():
help="Vocabulary size for BPE training",
)
# Optional surface string for the unknown symbol. No default is declared, so
# args.unk_surface is None when the flag is omitted; main() forwards it as the
# `unk_surface` keyword only when it holds a non-empty value.
parser.add_argument(
"--unk-surface",
type=str,
help="Unknown symbol surface",
)
return parser.parse_args()
@ -101,6 +107,7 @@ def main():
unk_id=unk_id,
bos_id=-1,
eos_id=-1,
**(dict(unk_surface=args.unk_surface) if args.unk_surface else dict()),
)
else:
print(f"{model_file} exists - skipping")