From f8ffebb8039342c24e5a7ed16298aeb44912aa08 Mon Sep 17 00:00:00 2001
From: CharlesCNorton <135471798+CharlesCNorton@users.noreply.github.com>
Date: Sat, 8 Jun 2024 17:22:53 -0400
Subject: [PATCH] typo: Correct "nornmalized" to "normalized" in SentencePieceTokenizer

Corrected a typo in the SentencePieceTokenizer implementation. The word "nornmalized" was misspelled and has been changed to "normalized" to ensure proper spelling in the assertion message "Message content must be normalized".
---
 src/mistral_common/tokens/tokenizers/sentencepiece.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/mistral_common/tokens/tokenizers/sentencepiece.py b/src/mistral_common/tokens/tokenizers/sentencepiece.py
index 3fff97d..3dc2f9d 100644
--- a/src/mistral_common/tokens/tokenizers/sentencepiece.py
+++ b/src/mistral_common/tokens/tokenizers/sentencepiece.py
@@ -236,7 +236,7 @@ def encode_user_message(
         system_prompt: Optional[str] = None,
     ) -> List[int]:
         assert message.content is not None
-        assert isinstance(message.content, str), "Message content must be nornmalized"
+        assert isinstance(message.content, str), "Message content must be normalized"
         content = ""
         tools_tokens: List[int] = []
         if is_last and available_tools: