diff --git a/language_translation/src/data.py b/language_translation/src/data.py index 0ab83f6c6d..a3893a8fae 100644 --- a/language_translation/src/data.py +++ b/language_translation/src/data.py @@ -24,7 +24,7 @@ def get_data(opts): multi30k.URL["train"] = "https://raw.githubusercontent.com/neychev/small_DL_repo/master/datasets/Multi30k/training.tar.gz" multi30k.URL["valid"] = "https://raw.githubusercontent.com/neychev/small_DL_repo/master/datasets/Multi30k/validation.tar.gz" - # Define a token "unkown", "padding", "beginning of sentence", and "end of sentence" + # Define a token "unknown", "padding", "beginning of sentence", and "end of sentence" special_symbols = { "":0, "":1,