Hi there,
When running `python3 -m prodigy ner.correct poc_en_parties en_core_web_sm ./input.csv --label ORG,PERSON --unsegmented`, I get the following output:
Using 2 label(s): ORG, PERSON
Traceback (most recent call last):
File "/usr/lib/python3.7/runpy.py", line 193, in _run_module_as_main
"__main__", mod_spec)
File "/usr/lib/python3.7/runpy.py", line 85, in _run_code
exec(code, run_globals)
File "/home/forge/.local/lib/python3.7/site-packages/prodigy/__main__.py", line 61, in <module>
controller = recipe(*args, use_plac=True)
File "cython_src/prodigy/core.pyx", line 335, in prodigy.core.recipe.recipe_decorator.recipe_proxy
File "cython_src/prodigy/core.pyx", line 362, in prodigy.core._components_to_ctrl
File "cython_src/prodigy/core.pyx", line 123, in prodigy.core.Controller.__init__
File "cython_src/prodigy/components/feeds.pyx", line 168, in prodigy.components.feeds.Feed.__init__
File "cython_src/prodigy/components/stream.pyx", line 110, in prodigy.components.stream.Stream.__init__
File "cython_src/prodigy/components/stream.pyx", line 116, in prodigy.components.stream.Stream._start_count
File "cython_src/prodigy/components/stream.pyx", line 135, in prodigy.components.stream.Stream._get_buffer
File "/home/forge/.local/lib/python3.7/site-packages/prodigy/recipes/ner.py", line 244, in make_tasks
for doc, eg in nlp.pipe(texts, as_tuples=True, batch_size=10):
File "/home/forge/.local/lib/python3.7/site-packages/spacy/language.py", line 1488, in pipe
for doc, context in zip(docs, contexts):
File "/home/forge/.local/lib/python3.7/site-packages/spacy/language.py", line 1521, in pipe
for doc in docs:
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1488, in _pipe
yield from proc.pipe(docs, **kwargs)
File "spacy/pipeline/transition_parser.pyx", line 227, in pipe
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1443, in minibatch
batch = list(itertools.islice(items, int(batch_size)))
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1488, in _pipe
yield from proc.pipe(docs, **kwargs)
File "spacy/pipeline/pipe.pyx", line 53, in pipe
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1488, in _pipe
yield from proc.pipe(docs, **kwargs)
File "spacy/pipeline/pipe.pyx", line 53, in pipe
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1488, in _pipe
yield from proc.pipe(docs, **kwargs)
File "spacy/pipeline/transition_parser.pyx", line 227, in pipe
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1443, in minibatch
batch = list(itertools.islice(items, int(batch_size)))
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1488, in _pipe
yield from proc.pipe(docs, **kwargs)
File "spacy/pipeline/trainable_pipe.pyx", line 73, in pipe
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1443, in minibatch
batch = list(itertools.islice(items, int(batch_size)))
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1488, in _pipe
yield from proc.pipe(docs, **kwargs)
File "spacy/pipeline/trainable_pipe.pyx", line 73, in pipe
File "/home/forge/.local/lib/python3.7/site-packages/spacy/util.py", line 1443, in minibatch
batch = list(itertools.islice(items, int(batch_size)))
File "/home/forge/.local/lib/python3.7/site-packages/spacy/language.py", line 1518, in <genexpr>
docs = (self.make_doc(text) for text in texts)
File "/home/forge/.local/lib/python3.7/site-packages/spacy/language.py", line 1479, in <genexpr>
texts = (tc[0] for tc in text_context1)
File "/home/forge/.local/lib/python3.7/site-packages/prodigy/recipes/ner.py", line 243, in <genexpr>
texts = ((eg["text"], eg) for eg in stream)
File "cython_src/prodigy/components/preprocess.pyx", line 164, in add_tokens
File "/home/forge/.local/lib/python3.7/site-packages/spacy/language.py", line 1488, in pipe
for doc, context in zip(docs, contexts):
File "/home/forge/.local/lib/python3.7/site-packages/spacy/language.py", line 1521, in pipe
for doc in docs:
File "/home/forge/.local/lib/python3.7/site-packages/spacy/language.py", line 1518, in <genexpr>
docs = (self.make_doc(text) for text in texts)
File "/home/forge/.local/lib/python3.7/site-packages/spacy/language.py", line 1479, in <genexpr>
texts = (tc[0] for tc in text_context1)
File "cython_src/prodigy/components/preprocess.pyx", line 157, in genexpr
File "cython_src/prodigy/components/loaders.pyx", line 29, in _add_attrs
File "cython_src/prodigy/components/filters.pyx", line 46, in filter_duplicates
File "cython_src/prodigy/components/filters.pyx", line 18, in filter_empty
File "cython_src/prodigy/components/loaders.pyx", line 23, in _rehash_stream
File "cython_src/prodigy/components/loaders.pyx", line 195, in CSV
AttributeError: 'NoneType' object has no attribute 'lower'
The exact same command with the exact same input worked before I upgraded to 1.11.0. Am I doing something wrong, or did something break in the upgrade?