From 50ea5469b0fc6af570ef4ab4b22f30b27bb31c34 Mon Sep 17 00:00:00 2001
From: Mateusz Klimaszewski <mk.klimaszewski@gmail.com>
Date: Fri, 4 Dec 2020 11:49:15 +0100
Subject: [PATCH] Sort feats case-insensitively to match the IWPT script.

---
 combo/predict.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/combo/predict.py b/combo/predict.py
index 42e8bed..e262b70 100644
--- a/combo/predict.py
+++ b/combo/predict.py
@@ -173,7 +173,9 @@ class SemanticMultitaskPredictor(predictor.Predictor):
                         if len(features) == 0:
                             field_value = "_"
                         else:
-                            field_value = "|".join(sorted(features))
+                            lowercase_features = [f.lower() for f in features]
+                            arg_indices = sorted(range(len(lowercase_features)), key=lowercase_features.__getitem__)
+                            field_value = "|".join(np.array(features)[arg_indices].tolist())
 
                         token[field_name] = field_value
                     elif field_name == "lemma":
-- 
GitLab