review comment

tabergma · tabergma · commit 95fe8da931fe · 2019-10-18T16:13:30.000+02:00
diff --git a/rasa/nlu/tokenizers/spacy_tokenizer.py b/rasa/nlu/tokenizers/spacy_tokenizer.py
@@ -40,7 +40,8 @@ def train(
 
                 if attribute_doc is not None:
                     example.set(
-                        MESSAGE_TOKENS_NAMES[attribute], self.tokenize(attribute_doc)
+                        MESSAGE_TOKENS_NAMES[attribute],
+                        self.tokenize(attribute_doc, attribute),
                     )
 
     def get_doc(self, message: Message, attribute: Text) -> "Doc":
@@ -49,10 +50,12 @@ def get_doc(self, message: Message, attribute: Text) -> "Doc":
     def process(self, message: Message, **kwargs: Any) -> None:
         message.set(
             MESSAGE_TOKENS_NAMES[MESSAGE_TEXT_ATTRIBUTE],
-            self.tokenize(self.get_doc(message, MESSAGE_TEXT_ATTRIBUTE)),
+            self.tokenize(
+                self.get_doc(message, MESSAGE_TEXT_ATTRIBUTE), MESSAGE_TEXT_ATTRIBUTE
+            ),
         )
 
-    def tokenize(self, doc: "Doc") -> List[Token]:
+    def tokenize(self, doc: "Doc", attribute: Text) -> List[Token]:
         tokens = [Token(t.text, t.idx) for t in doc]
-        self.add_cls_token(tokens)
+        self.add_cls_token(tokens, attribute)
         return tokens