Update tokenizer.py to fix erroneous Javanese language code

The ISO 639-1 code for Javanese is `jv`, not `jw` as given here.
It should be listed as `jv`.
This commit is contained in:
Kathy Reid 2025-10-08 22:43:54 +11:00 committed by GitHub
parent c0d2f624c0
commit bd9d47a977
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -105,7 +105,7 @@ LANGUAGES = {
"ln": "lingala", "ln": "lingala",
"ha": "hausa", "ha": "hausa",
"ba": "bashkir", "ba": "bashkir",
"jw": "javanese", "jv": "javanese",
"su": "sundanese", "su": "sundanese",
"yue": "cantonese", "yue": "cantonese",
} }