Skip to content
Snippets Groups Projects
Commit 72657010 authored by Piotr Wątorski
Browse files

Sentence/chunk generators - fix

parent d46fe12a
No related branches found
No related tags found
1 merge request: !1 Sentence/chunk generators
...@@ -162,13 +162,14 @@ def get_tagset(tagset): ...@@ -162,13 +162,14 @@ def get_tagset(tagset):
def read_chunks_it(filepath, tagset='nkjp'): def read_chunks_it(filepath, tagset='nkjp'):
""" Returns a iterable sentence generator. """ Returns a iterable chunk generator.
Args: Args:
filepath: a path to CCL file filepath: a path to CCL file
tagset: the name of the tagset that is used in the document or a tagset object itself. tagset: the name of the tagset that is used in the document or a tagset object itself.
Returns: a iterable sentence generator. Returns:
a iterable chunk generator.
""" """
tagset = get_tagset(tagset) tagset = get_tagset(tagset)
reader = corpus2.TokenReader_create_path_reader('ccl', tagset, filepath) reader = corpus2.TokenReader_create_path_reader('ccl', tagset, filepath)
...@@ -176,10 +177,9 @@ def read_chunks_it(filepath, tagset='nkjp'): ...@@ -176,10 +177,9 @@ def read_chunks_it(filepath, tagset='nkjp'):
while True: while True:
chunk = reader.get_next_chunk() chunk = reader.get_next_chunk()
if chunk: if not chunk:
yield chunk
else:
break break
yield chunk
del reader del reader
...@@ -201,10 +201,9 @@ def read_sentences_it(filepath, tagset='nkjp'): ...@@ -201,10 +201,9 @@ def read_sentences_it(filepath, tagset='nkjp'):
while True: while True:
sentence = reader.get_next_sentence() sentence = reader.get_next_sentence()
if sentence: if not sentence:
yield sentence
else:
break break
yield sentence
del reader del reader
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment