# worker.py -- last committed by Bartłomiej Koptyra
"""Implementation of nlp_worker."""
import logging

import nlp_ws


from src.anonymizer import Anonymizer

# Module-level logger, named after this module via ``__name__``.
_log = logging.getLogger(__name__)


class Worker(nlp_ws.NLPWorker):
    """Implements nlp_worker for anonymizer service."""

    @classmethod
    def static_init(cls, config):
        """One time static initialisation.

        ``config`` is accepted but not read here; the method only emits a
        diagnostic marker.
        """
        # Diagnostic marker goes through the module logger instead of stdout,
        # so it can be filtered by log level.
        _log.debug("siema")

    def process(self, input_file, task_options, output_file):
        """Anonymizes input text.

        It is assumed input_file is encoded in UTF-8.

        Options:
        method - 'delete'/'tag'/'pseudo' - 'delete' deletes selected tokens,
                'tag' replaces selected tokens with arbitrary tags, 'pseudo'
                replaces selected tokens with a random token.

        Args:
            input_file: path of the text file to read (opened as UTF-8).
            task_options: options passed unchanged to ``Anonymizer``.
            output_file: path of the text file to write (opened as UTF-8;
                created or truncated when opened).

        NOTE(review): the original description of 'pseudo' was cut off
        mid-sentence, so the exact replacement rule still needs confirming.
        NOTE(review): nothing is read from the input or written to the
        output yet, and the anonymizer is never applied; the body looks
        unfinished.
        """
        # Constructed up front so any option handling done by Anonymizer
        # still runs; the instance is not used further yet.
        anon = Anonymizer(task_options)
        # Distinct stream names keep the path parameters from being shadowed.
        with open(input_file, 'rt', encoding='utf-8') as in_stream, \
                open(output_file, 'wt', encoding='utf-8') as out_stream:
            _log.debug("elo")