We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 9ae3319, commit 053412b (Copy full SHA for 053412b)
1 file changed
text_preprocessing/preprocessor.py
@@ -17,7 +17,7 @@
17
from spacy.tokens import Doc, Token
18
19
from .modernizer import Modernizer
20
-from .spacy_helpers import load_language_model, Tokens, PreprocessorToken
+from .spacy_helpers import PreprocessorToken, Tokens, load_language_model
21
22
Doc.set_extension("metadata", default={})
23
Doc.set_extension("char_num", default=0)
@@ -176,8 +176,8 @@ def process_texts(
176
if self.ngram_config is not None:
177
tokens = generate_ngrams(**self.ngram_config, tokens=tokens)
178
if self.post_func is not None:
179
- processed_doc = self.post_func(tokens)
180
- yield processed_doc
+ tokens = self.post_func(tokens)
+ yield tokens
181
elif isinstance(tokens, Doc):
182
tokens = Tokens(tokens, keep_all=keep_all)
183
0 commit comments