|
|
# Konfiguracja
|
|
|
## elinker
|
|
|
### Plik konfiguracyjny
|
|
|
```ini
|
|
|
[general]
|
|
|
tagset = nkjp
|
|
|
[parser]
|
|
|
named_entity_chan_name = nam
|
|
|
mwe_chan_name = mwe
|
|
|
mwe_base_prop_key = mwe_base
|
|
|
synset_prop_key = sense:ukb:syns_id
|
|
|
stop_list_file = nkjp_idf_dict_plwn_nouns_stop_list.txt
|
|
|
ignored_pos = interp,prep,fin,pact,pcon,inf,praet,ppas,qub,conj,adj,xxx
|
|
|
|
|
|
[linker]
|
|
|
url_key_format = %s:url_%d
|
|
|
ignore_shorter_than = 5
|
|
|
mark_without_ann = false
|
|
|
without_ann_only_mono = false
|
|
|
use_wsd_toks = true
|
|
|
use_wsd_synsets = true
|
|
|
|
|
|
[filter]
|
|
|
exclude_ignored = true
|
|
|
kw_ignored_ann = kw_ignored
|
|
|
|
|
|
[database]
|
|
|
default_langs = pl,en
|
|
|
```
|
|
|
## kwazon
|
|
|
### Plik konfiguracyjny
|
|
|
```ini
|
|
|
graph_file_path = /home/gkostkowski/WORKING_REPOS/kwazon/keyword_assignment_tool/data/keyword_assignment_tool/data/graph-2018-11-13-categories-broader-narrower-weighted-001-filtered-meaningless.graphml
|
|
|
concepts_categories_mapping = /home/gkostkowski/WORKING_REPOS/kwazon/keyword_assignment_tool/data/concept_category_index_all_sources_extended_reduced_at_least_one_v7.bin.zip
|
|
|
categories_vectors = /home/gkostkowski/WORKING_REPOS/kwazon/keyword_assignment_tool/data/categories_keyed_vectors_v2.bin.zip
|
|
|
concepts_vectors = /home/gkostkowski/WORKING_REPOS/kwazon/keyword_assignment_tool/data/concepts_keyed_vectors.bin.zip
|
|
|
|
|
|
edge_weights_prop = 'rel_w'
|
|
|
orth_idf_weights = idf-dict2_norm_sorted.tsv
|
|
|
[results]
|
|
|
as_json = true
|
|
|
cats_labels = /home/gkostkowski/WORKING_REPOS/kwazon/keyword_assignment_tool/data/categories_pl_labels_lowercase_v4.txt
|
|
|
n_best_keywords = 10
|
|
|
score_min_threshold = 0.0003
|
|
|
|
|
|
[algorithm]
|
|
|
iterations = 100
|
|
|
damping_factor = 0.1
|
|
|
init_personalisation = 1.0
|
|
|
```
|
|
|
|
|
|
### Opis konfiguracji
|
|
|
- graf
|
|
|
- skierowany, z relacjami broader i narrower
|
|
|
- **z wagami krawędzi broader: 1.0, narrower: 0.01**
|
|
|
- z usuniętymi zbędnymi kategoriami
|
|
|
|
|
|
# Wyniki
|
|
|
```
|
|
|
|
|
|
```