diff --git a/tokenizer_for_indian_languages_on_files.py b/tokenizer_for_indian_languages_on_files.py index f439cf72bf85772448f284e1427dbf1d473eb8be..52bb3d5ce40a73f71d763fbdc20af7950d65e3b4 100644 --- a/tokenizer_for_indian_languages_on_files.py +++ b/tokenizer_for_indian_languages_on_files.py @@ -137,7 +137,7 @@ def main(): os.makedirs(args.out) if args.lang in ['hi', 'or', 'mn', 'as', 'bn', 'pa']: lang = 0 - elif args.lang == 'ur': + elif args.lang in ['ur', 'ks']: lang = 1 elif args.lang in ['en', 'gu', 'mr', 'ml', 'kn', 'te', 'ta']: lang = 2