From 45fdcead04a3bd7259e142fbbd4d76836908a45d Mon Sep 17 00:00:00 2001
From: Alexandra Antonova
Date: Mon, 13 Nov 2023 14:04:36 +0300
Subject: [PATCH] fix path in comment

Signed-off-by: Alexandra Antonova
---
 .../en_spellmapper/dataset_preparation/build_training_data.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/scripts/nlp/en_spellmapper/dataset_preparation/build_training_data.sh b/scripts/nlp/en_spellmapper/dataset_preparation/build_training_data.sh
index 4c211f2..2f2e985 100644
--- a/scripts/nlp/en_spellmapper/dataset_preparation/build_training_data.sh
+++ b/scripts/nlp/en_spellmapper/dataset_preparation/build_training_data.sh
@@ -20,7 +20,7 @@ YAGO_ENTITIES=yago.uniq2
 WIKIPEDIA_FOLDER=../yago_wikipedia
 
 ## Articles with these titles will be skipped (as they are reserved for testing)
-## To generate this file use ${NEMO_PATH}/examples/nlp/spellchecking_asr_customization/evaluation/get_all_titles_from_spoken_wikipedia.py --input_folder en/en/english --output_file spoken_wiki_titles.txt
+## To generate this file use ${NEMO_COMPATIBLE_PATH}/scripts/nlp/en_spellmapper/evaluation/get_all_titles_from_spoken_wikipedia.py --input_folder en/en/english --output_file spoken_wiki_titles.txt
 EXCLUDE_TITLES=spoken_wiki_titles.txt
 
 ## Vocabulary of aligned YAGO subphrases, allows to use not only Wikipedia titles as whole phrases, but also their parts.