From 0af58c5514ce1679b2d373ad051c3026bb330dd1 Mon Sep 17 00:00:00 2001 From: pwalkow <pawel.walkowiak@hotmail.com> Date: Thu, 23 Nov 2023 12:07:39 +0100 Subject: [PATCH] Random letters --- src/dictionaries/morphosyntactic/ner_file.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/src/dictionaries/morphosyntactic/ner_file.py b/src/dictionaries/morphosyntactic/ner_file.py index ef051f5..e2c323a 100644 --- a/src/dictionaries/morphosyntactic/ner_file.py +++ b/src/dictionaries/morphosyntactic/ner_file.py @@ -1,6 +1,7 @@ """Module responsible for Morphosyntactic dict that uses a tsv file with NER tags.""" import random +import string from collections import defaultdict from typing import List, Optional, Type, Dict @@ -115,7 +116,10 @@ class NERFileMorphosyntacticDictionary(MorphosyntacticDictionary): word = self._dictionary[entry_type][morpho_tag][lemma] elif morpho_tag == "ign": # unknown form - lemma = "ABC" + letters = string.ascii_lowercase + size = random.randint(3, 5) + lemma = "".join(random.sample( + list(letters), size)).upper() word = lemma else: morpho_tag = random.choice( -- GitLab