Analysers
cclutils

Repository

pip install cclutils --extra-index-url https://pypi.clarin-pl.eu/
import cclutils

filepath = './example.xml'
document = cclutils.read(filepath)

cclpath = './example.xml'
relpath = './example.rel.xml'
document = cclutils.read(cclpath, relpath)
document = cclutils.read(cclpath, relpath, 'nkjp')
document = cclutils.read(filepath)
...
cclutils.write(document, './out.xml')
cclutils.write(document, './out.xml', rel_path='./out.rel.xml')
cclutils.write(document, './out.xml', rel_path='./out.rel.xml', tagset='spacy')
tagset = cclutils.get_tagset('nkjp')
tagset = cclutils.get_tagset('spacy')
...
document = cclutils.read('./example.xml')
for paragraph in document.paragraphs():
    ...
    for sentence in paragraph.sentences():
        ...
        for token in sentence.tokens():
            ...
document = cclutils.read('./example.xml')

# tokens is a generator:
tokens = (token for paragraph in document.paragraphs()
    for sentence in paragraph.sentences()
    for token in sentence.tokens())
it = read_chunks_it(ccl_path)
for paragraph in it:
    pass

it = read_sentences_it(ccl_path)
for sentence in it:
    pass
tagset = cclutils.get_tagset('nkjp')
...
pos = get_pos(token, tagset)