Commit a50073f4 authored by Grzegorz Kostkowski

Changes in config

parent 85965e20
Pipeline #535 failed with stage
in 16 seconds
; Top-level settings: names of the files that hold the resource definitions.
[general]
; disabled: explicit data directory built from `project_dir` via interpolation
; data_dir = %(project_dir)s/data
; file with the static resource definitions
resources_config = resources.ini
; file with the definitions of resources derived at runtime
derived_resources_config = derived_resources.ini
; Selection of the ranking algorithm and its parameters.
[algorithm]
; NOTE(review): presumably <module>.<class> of the implementation - confirm
; against the loader.
algo_class = gt_pprmc.GTPPRMC
; Comma-separated resource types. VERTEX_WEIGHT and WATCHER match the `type` of
; [v-id-v-weight-mapping] and [doc-context-debug-log].
; NOTE(review): no resource section visible here declares type EDGE_WEIGHT -
; confirm it is provided elsewhere (e.g. by the graph itself).
required_rtypes = EDGE_WEIGHT,VERTEX_WEIGHT,WATCHER
iterations = 50
; NOTE(review): 0.1 is low if this is a PageRank-style "follow link"
; probability (commonly ~0.85) - confirm the convention GTPPRMC uses.
damping_factor = 0.1
init_personalisation = 1.0
use_entropy = true
normalize = true
method = normal
; Cypher HTTP endpoint and credentials (presumably a Neo4j server - confirm).
; NOTE(review): the password is stored in plain text and the endpoint is a
; hard-coded IP address; consider supplying both from the environment or an
; untracked override file.
[database]
; used only when concepts_categories_mapping is not specified
endpoint = http://10.108.41.103:8080/db/data/cypher
user = neo4j
password = neodb
; Definitions of resources generated during runtime, based on loaded resources
; defined in resources.ini file
;
; Compulsory properties for each resource:
; - name
; - type - conceptual type of resource (one from set of available types defined
; in keyword_assignment_tool.config.resource_types module)
; - required_resources - list of resources (names) required for initialization of this
; resource: static resources (resources.ini) or other derived resources (this
; file). Dependencies on other derived resources will be resolved by
; ResourceManager; avoid declaring derived resources in a way that causes a
; circular reference (such cases will be detected).
; - resource_class - name of class from resource.resources module used to create
; instance of this resource.
; Vertex index built from dbpedia-graph, keyed by the vertex property lod_url.
; NOTE(review): differs from [v-lod-url-mapping] only in name, type and
; `inverted`; presumably this is the id -> vertex direction - confirm.
[lod-url-v-mapping]
name = lod-url-v-mapping
type = VERTEX_ID_VERTEX
required_resources = dbpedia-graph
resource_class = GraphVertexIndexResource
key_prop_name = lod_url
inverted = true
; Vertex index built from dbpedia-graph, keyed by the vertex property lod_url.
; NOTE(review): differs from [lod-url-v-mapping] only in name, type and
; `inverted`; presumably this is the vertex -> id direction - confirm.
[v-lod-url-mapping]
name = v-lod-url-mapping
type = VERTEX_VERTEX_ID
required_resources = dbpedia-graph
resource_class = GraphVertexIndexResource
key_prop_name = lod_url
inverted = false
; Concept-to-vertex resource derived from two other resources.
[concept-node-mapping]
name = concept-node-mapping
type = CONCEPT_VERTEX
; concepts-dbpedia-categories-mapping is the `name` declared under the
; [concepts_categories_mapping] section
required_resources = lod-url-v-mapping,concepts-dbpedia-categories-mapping
resource_class = TextGraphVertexIndexResource
; [v_id_vector_map]
; name = v_id_vector_map
; type = VERTEX_VECTOR
; required_resources = dbpedia-graph,categories-vectors
; resource_class = GraphVertexVectorIndexResource
; vprop_name = lod_url
; ============ late-initialized resources ============
; Input document resource; it depends on no other resource.
[document]
name = document
type = DOCUMENT
; intentionally empty: no dependencies
required_resources =
resource_class = CclDocumentResource
; NOTE(review): presumably defers creation until the input is supplied at run
; time - confirm in ResourceManager.
late_init = true
; Document context built from the document and the concept mappings.
[document-context]
name = document-context
type = DOCUMENT_CONTEXT
required_resources = document,concepts-dbpedia-categories-mapping,concept-node-mapping
; orth_idf_w_map is the `name` declared under the [concept-weights] section.
; NOTE(review): spacing after commas is inconsistent in this list; presumably
; the loader strips whitespace around each entry - confirm.
optional_resources = v-lod-url-mapping, categories-vectors, concepts-vectors, orth_idf_w_map,doc-context-debug-log
resource_class = CclDocumentContextResource
late_init = true
; Vertex weights; VERTEX_WEIGHT is one of the types listed in
; [algorithm] required_rtypes.
[v-id-v-weight-mapping]
name = v-id-v-weight-mapping
type = VERTEX_WEIGHT
required_resources = document-context,lod-url-v-mapping,categories-vectors
resource_class = GraphVertexWeightIndexResource
late_init = true
; NOTE(review): the meaning of batches_no and set_zeros is defined by
; GraphVertexWeightIndexResource, which is not visible here.
batches_no = 8
set_zeros = true
; Ranking produced by the algorithm; it declares no dependencies.
[gtpprmc-ranking]
name = gtpprmc-ranking
type = ALGO_RANKING
; intentionally empty: no dependencies
required_resources =
resource_class = AlgoRankingResource
late_init = true
; NOTE(review): presumably means the resource is created explicitly by the
; caller rather than by ResourceManager - confirm.
manual_init = true
[output-keywords-path]
; The output path is declared as a resource only so that results are not
; created automatically when no path is passed to a run.
name = output-keywords-path
type = OUTPUT
; intentionally empty: no dependencies
required_resources =
resource_class = StringResource
late_init = true
; Final results resource; it depends on the ranking, the mappings, the labels
; and the output path.
[results]
name = results
type = RESULTS
required_resources = document-context,gtpprmc-ranking,doc-context-debug-log,lod-url-v-mapping,v-lod-url-mapping,category-label,output-keywords-path
resource_class = ResultsResource
late_init = true
manual_init = true
as_json = true
; disabled: score threshold
; min_score_threshold = 0.0003
; NOTE(review): presumably the number of top-ranked keywords kept - confirm.
n_best_keywords = 10
; disabled: fixed output location, superseded by output_path_suffix below
; output_ranking = %(data_dir)s/ranking.tsv
; NOTE(review): presumably appended to the value of output-keywords-path -
; confirm in ResultsResource.
output_path_suffix = ranking.tsv
; Debug log of the document context; WATCHER is one of the types listed in
; [algorithm] required_rtypes.
[doc-context-debug-log]
name = doc-context-debug-log
type = WATCHER
required_resources = output-keywords-path
resource_class = DocumentContextLogResource
late_init = true
; NOTE(review): presumably appended to the value of output-keywords-path -
; confirm in DocumentContextLogResource.
output_path_suffix = doc-context.log
; disabled: fixed output location, superseded by output_path_suffix above
; output_path = %(data_dir)s/doc-context-debug.log
with_labels = true
; config for static resources
; description:
; Every section represents each resource
; (from keyword_assignment_tool.resource.resources module) to load by ResourceManager.
; Compulsory properties for each resource:
; - name
; - type - conceptual type of resource (one from set of available types defined
; in keyword_assignment_tool.config.resource_types module)
; - resource_class (class specified in resource package)
; Note that if implementation of certain resource will require additional
; properties, then such must be provided by declaring them in certain section
; Note about paths:
; by default, every path in this file should either name a file in the
; 'keyword_assignment_tool.data' module, be an absolute path, or use an
; interpolation variable. The path to the data directory can also be passed as a
; parameter to the constructor of KwConfig.
; Keep in mind that only files included in the installation setup.py file will be
; available in the mentioned module directory.
; Static graph resource loaded from a GraphML file.
[dbpedia-graph]
name = dbpedia-graph
type = GRAPH
resource_class = GraphResource
; bare file name; see the "Note about paths" in this file's header comment
path = graph-2018-11-13-categories-broader-narrower-weighted-001-filtered-meaningless.graphml
; the same property name (lod_url) is used as key_prop_name by the derived
; vertex index sections
v_id_prop_name = lod_url
; Static concept-to-category index.
; NOTE(review): the section header (concepts_categories_mapping) differs from
; `name`; other sections reference this resource by its `name` value.
[concepts_categories_mapping]
name = concepts-dbpedia-categories-mapping
type = CONCEPT_VERTEX_ID
resource_class = ZippedTextIndexResource
path = concept_category_index_all_sources_extended_reduced_at_least_one_v7.bin.zip
; Static vectors resource typed VERTEX_ID_VECTOR; required by
; [v-id-v-weight-mapping].
[categories-vectors]
name = categories-vectors
type = VERTEX_ID_VECTOR
resource_class = VectorsResource
path = cats_keyed_vectors_v2.bin.zip
; Static vectors resource typed CONCEPT_VECTOR; listed as optional by
; [document-context].
[concepts-vectors]
name = concepts-vectors
type = CONCEPT_VECTOR
resource_class = VectorsResource
path = concepts_keyed_vectors.bin.zip
; Static concept weights loaded from a delimited text file.
; NOTE(review): the section header (concept-weights) differs from `name`;
; [document-context] references this resource as orth_idf_w_map.
[concept-weights]
name = orth_idf_w_map
type = CONCEPT_WEIGHT
resource_class = IndexValueResource
path = idf-dict2_norm_sorted.tsv
need_normalisation = true
; %(...)s interpolation: `tabulation` is not defined in this section;
; presumably the loader injects it as a tab character - confirm.
delimiter = %(tabulation)s
; Static vertex labels loaded from a delimited text file; required by [results].
[category-label]
name = category-label
type = VERTEX_LABEL
resource_class = IndexResource
path = categories_pl_labels_lowercase_v4.txt
; %(...)s interpolation: `tabulation` is not defined in this section;
; presumably the loader injects it as a tab character - confirm.
delimiter = %(tabulation)s
; Top-level settings: names of the files that hold the resource definitions.
[general]
; disabled: explicit data directory built from `project_dir` via interpolation
; data_dir = %(project_dir)s/data
; file with the static resource definitions
resources_config = resources.ini
; file with the definitions of resources derived at runtime
derived_resources_config = derived_resources.ini
; Selection of the ranking algorithm and its parameters.
[algorithm]
; NOTE(review): presumably <module>.<class> of the implementation - confirm
; against the loader.
algo_class = gt_pprmc.GTPPRMC
; Comma-separated resource types. VERTEX_WEIGHT and WATCHER match the `type` of
; [v-id-v-weight-mapping] and [doc-context-debug-log].
; NOTE(review): no resource section visible here declares type EDGE_WEIGHT -
; confirm it is provided elsewhere (e.g. by the graph itself).
required_rtypes = EDGE_WEIGHT,VERTEX_WEIGHT,WATCHER
iterations = 50
; NOTE(review): 0.1 is low if this is a PageRank-style "follow link"
; probability (commonly ~0.85) - confirm the convention GTPPRMC uses.
damping_factor = 0.1
init_personalisation = 1.0
use_entropy = true
normalize = true
method = normal
; Cypher HTTP endpoint and credentials (presumably a Neo4j server - confirm).
; NOTE(review): the password is stored in plain text and the endpoint is a
; hard-coded IP address; consider supplying both from the environment or an
; untracked override file.
[database]
; used only when concepts_categories_mapping is not specified
endpoint = http://10.108.41.103:8080/db/data/cypher
user = neo4j
password = neodb
; Definitions of resources generated during runtime, based on loaded resources
; defined in resources.ini file
;
; Compulsory properties for each resource:
; - name
; - type - conceptual type of resource (one from set of available types defined
; in keyword_assignment_tool.config.resource_types module)
; - required_resources - list of resources (names) required for initialization of this
; resource: static resources (resources.ini) or other derived resources (this
; file). Dependencies on other derived resources will be resolved by
; ResourceManager; avoid declaring derived resources in a way that causes a
; circular reference (such cases will be detected).
; - resource_class - name of class from resource.resources module used to create
; instance of this resource.
; Vertex index built from dbpedia-graph, keyed by the vertex property lod_url.
; NOTE(review): differs from [v-lod-url-mapping] only in name, type and
; `inverted`; presumably this is the id -> vertex direction - confirm.
[lod-url-v-mapping]
name = lod-url-v-mapping
type = VERTEX_ID_VERTEX
required_resources = dbpedia-graph
resource_class = GraphVertexIndexResource
key_prop_name = lod_url
inverted = true
; Vertex index built from dbpedia-graph, keyed by the vertex property lod_url.
; NOTE(review): differs from [lod-url-v-mapping] only in name, type and
; `inverted`; presumably this is the vertex -> id direction - confirm.
[v-lod-url-mapping]
name = v-lod-url-mapping
type = VERTEX_VERTEX_ID
required_resources = dbpedia-graph
resource_class = GraphVertexIndexResource
key_prop_name = lod_url
inverted = false
; Concept-to-vertex resource derived from two other resources.
[concept-node-mapping]
name = concept-node-mapping
type = CONCEPT_VERTEX
; concepts-dbpedia-categories-mapping is the `name` declared under the
; [concepts_categories_mapping] section
required_resources = lod-url-v-mapping,concepts-dbpedia-categories-mapping
resource_class = TextGraphVertexIndexResource
; Vertex-to-vector index derived from the graph and the category vectors.
; NOTE(review): this section and its `name` use underscores while the other
; resources use hyphens, and it sets `vprop_name` where the other graph index
; sections set `key_prop_name` - confirm that both are intended.
[v_id_vector_map]
name = v_id_vector_map
type = VERTEX_VECTOR
required_resources = dbpedia-graph,categories-vectors
resource_class = GraphVertexVectorIndexResource
vprop_name = lod_url
; ============ late-initialized resources ============
; Input document resource; it depends on no other resource.
[document]
name = document
type = DOCUMENT
; intentionally empty: no dependencies
required_resources =
resource_class = CclDocumentResource
; NOTE(review): presumably defers creation until the input is supplied at run
; time - confirm in ResourceManager.
late_init = true
; Document context built from the document and the concept mappings.
[document-context]
name = document-context
type = DOCUMENT_CONTEXT
required_resources = document,concepts-dbpedia-categories-mapping,concept-node-mapping
; orth_idf_w_map is the `name` declared under the [concept-weights] section.
; NOTE(review): spacing after commas is inconsistent in this list; presumably
; the loader strips whitespace around each entry - confirm.
optional_resources = v-lod-url-mapping, categories-vectors, concepts-vectors, orth_idf_w_map,doc-context-debug-log
resource_class = CclDocumentContextResource
late_init = true
; Vertex weights; VERTEX_WEIGHT is one of the types listed in
; [algorithm] required_rtypes.
[v-id-v-weight-mapping]
name = v-id-v-weight-mapping
type = VERTEX_WEIGHT
required_resources = document-context,lod-url-v-mapping,categories-vectors
resource_class = GraphVertexWeightIndexResource
late_init = true
; NOTE(review): the meaning of batches_no and set_zeros is defined by
; GraphVertexWeightIndexResource, which is not visible here.
batches_no = 8
set_zeros = true
; Ranking produced by the algorithm; it declares no dependencies.
[gtpprmc-ranking]
name = gtpprmc-ranking
type = ALGO_RANKING
; intentionally empty: no dependencies
required_resources =
resource_class = AlgoRankingResource
late_init = true
; NOTE(review): presumably means the resource is created explicitly by the
; caller rather than by ResourceManager - confirm.
manual_init = true
[output-keywords-path]
; The output path is declared as a resource only so that results are not
; created automatically when no path is passed to a run.
name = output-keywords-path
type = OUTPUT
; intentionally empty: no dependencies
required_resources =
resource_class = StringResource
late_init = true
; Final results resource; it depends on the ranking, the mappings, the labels
; and the output path.
[results]
name = results
type = RESULTS
required_resources = document-context,gtpprmc-ranking,doc-context-debug-log,lod-url-v-mapping,v-lod-url-mapping,category-label,output-keywords-path
resource_class = ResultsResource
late_init = true
manual_init = true
as_json = true
; disabled: score threshold
; min_score_threshold = 0.0003
; NOTE(review): presumably the number of top-ranked keywords kept - confirm.
n_best_keywords = 10
; disabled: fixed output location, superseded by output_path_suffix below
; output_ranking = %(data_dir)s/ranking.tsv
; NOTE(review): presumably appended to the value of output-keywords-path -
; confirm in ResultsResource.
output_path_suffix = ranking.tsv
; Debug log of the document context; WATCHER is one of the types listed in
; [algorithm] required_rtypes.
[doc-context-debug-log]
name = doc-context-debug-log
type = WATCHER
required_resources = output-keywords-path
resource_class = DocumentContextLogResource
late_init = true
; NOTE(review): presumably appended to the value of output-keywords-path -
; confirm in DocumentContextLogResource.
output_path_suffix = doc-context.log
; disabled: fixed output location, superseded by output_path_suffix above
; output_path = %(data_dir)s/doc-context-debug.log
with_labels = true
; config for static resources
; description:
; Every section represents each resource
; (from keyword_assignment_tool.resource.resources module) to load by ResourceManager.
; Compulsory properties for each resource:
; - name
; - type - conceptual type of resource (one from set of available types defined
; in keyword_assignment_tool.config.resource_types module)
; - resource_class (class specified in resource package)
; Note that if implementation of certain resource will require additional
; properties, then such must be provided by declaring them in certain section
; Note about paths:
; by default, every path in this file should either name a file in the
; 'keyword_assignment_tool.data' module, be an absolute path, or use an
; interpolation variable. The path to the data directory can also be passed as a
; parameter to the constructor of KwConfig.
; Keep in mind that only files included in the installation setup.py file will be
; available in the mentioned module directory.
; Static graph resource loaded from a GraphML file.
[dbpedia-graph]
name = dbpedia-graph
type = GRAPH
resource_class = GraphResource
; bare file name; see the "Note about paths" in this file's header comment
path = graph-2018-11-13-categories-broader-narrower-weighted-001-filtered-meaningless.graphml
; the same property name (lod_url) is used as key_prop_name by the derived
; vertex index sections
v_id_prop_name = lod_url
; Static concept-to-category index.
; NOTE(review): the section header (concepts_categories_mapping) differs from
; `name`; other sections reference this resource by its `name` value.
[concepts_categories_mapping]
name = concepts-dbpedia-categories-mapping
type = CONCEPT_VERTEX_ID
resource_class = ZippedTextIndexResource
path = concept_category_index_only_dbpedia_concepts_reduced_v5_at_least_one.txt.bin.zip
; Static vectors resource typed VERTEX_ID_VECTOR; required by
; [v-id-v-weight-mapping] and [v_id_vector_map].
[categories-vectors]
name = categories-vectors
type = VERTEX_ID_VECTOR
resource_class = VectorsResource
path = cats_keyed_vectors_v2.bin.zip
; Static vectors resource typed CONCEPT_VECTOR; listed as optional by
; [document-context].
[concepts-vectors]
name = concepts-vectors
type = CONCEPT_VECTOR
resource_class = VectorsResource
path = concepts_keyed_vectors.bin.zip
; Static concept weights loaded from a delimited text file.
; NOTE(review): the section header (concept-weights) differs from `name`;
; [document-context] references this resource as orth_idf_w_map.
[concept-weights]
name = orth_idf_w_map
type = CONCEPT_WEIGHT
resource_class = IndexValueResource
path = idf-dict2_norm_sorted.tsv
need_normalisation = true
; %(...)s interpolation: `tabulation` is not defined in this section;
; presumably the loader injects it as a tab character - confirm.
delimiter = %(tabulation)s
; Static vertex labels loaded from a delimited text file; required by [results].
[category-label]
name = category-label
type = VERTEX_LABEL
resource_class = IndexResource
path = categories_pl_labels_lowercase_v4.txt
; %(...)s interpolation: `tabulation` is not defined in this section;
; presumably the loader injects it as a tab character - confirm.
delimiter = %(tabulation)s
; Top-level settings: names of the files that hold the resource definitions.
[general]
; disabled: explicit data directory built from `project_dir` via interpolation
; data_dir = %(project_dir)s/data
; file with the static resource definitions
resources_config = resources.ini
; file with the definitions of resources derived at runtime
derived_resources_config = derived_resources.ini
; Selection of the ranking algorithm and its parameters.
[algorithm]
; NOTE(review): presumably <module>.<class> of the implementation - confirm
; against the loader.
algo_class = gt_pprmc.GTPPRMC
; Comma-separated resource types. VERTEX_WEIGHT and WATCHER match the `type` of
; [v-id-v-weight-mapping] and [doc-context-debug-log].
; NOTE(review): no resource section visible here declares type EDGE_WEIGHT -
; confirm it is provided elsewhere (e.g. by the graph itself).
required_rtypes = EDGE_WEIGHT,VERTEX_WEIGHT,WATCHER
iterations = 50
; NOTE(review): 0.1 is low if this is a PageRank-style "follow link"
; probability (commonly ~0.85) - confirm the convention GTPPRMC uses.
damping_factor = 0.1
init_personalisation = 1.0
use_entropy = true
normalize = true
method = normal
; Cypher HTTP endpoint and credentials (presumably a Neo4j server - confirm).
; NOTE(review): the password is stored in plain text and the endpoint is a
; hard-coded IP address; consider supplying both from the environment or an
; untracked override file.
[database]
; used only when concepts_categories_mapping is not specified
endpoint = http://10.108.41.103:8080/db/data/cypher
user = neo4j
password = neodb
; Definitions of resources generated during runtime, based on loaded resources
; defined in resources.ini file
;
; Compulsory properties for each resource:
; - name
; - type - conceptual type of resource (one from set of available types defined
; in keyword_assignment_tool.config.resource_types module)
; - required_resources - list of resources (names) required for initialization of this
; resource: static resources (resources.ini) or other derived resources (this
; file). Dependencies on other derived resources will be resolved by
; ResourceManager; avoid declaring derived resources in a way that causes a
; circular reference (such cases will be detected).
; - resource_class - name of class from resource.resources module used to create
; instance of this resource.
; Vertex index built from dbpedia-graph, keyed by the vertex property lod_url.
; NOTE(review): differs from [v-lod-url-mapping] only in name, type and
; `inverted`; presumably this is the id -> vertex direction - confirm.
[lod-url-v-mapping]
name = lod-url-v-mapping
type = VERTEX_ID_VERTEX
required_resources = dbpedia-graph
resource_class = GraphVertexIndexResource
key_prop_name = lod_url
inverted = true
; Vertex index built from dbpedia-graph, keyed by the vertex property lod_url.
; NOTE(review): differs from [lod-url-v-mapping] only in name, type and
; `inverted`; presumably this is the vertex -> id direction - confirm.
[v-lod-url-mapping]
name = v-lod-url-mapping
type = VERTEX_VERTEX_ID
required_resources = dbpedia-graph
resource_class = GraphVertexIndexResource
key_prop_name = lod_url
inverted = false
; Concept-to-vertex resource derived from two other resources.
[concept-node-mapping]
name = concept-node-mapping
type = CONCEPT_VERTEX
; concepts-dbpedia-categories-mapping is the `name` declared under the
; [concepts_categories_mapping] section
required_resources = lod-url-v-mapping,concepts-dbpedia-categories-mapping
resource_class = TextGraphVertexIndexResource
; Vertex-to-vector index derived from the graph and the category vectors.
; NOTE(review): this section and its `name` use underscores while the other
; resources use hyphens, and it sets `vprop_name` where the other graph index
; sections set `key_prop_name` - confirm that both are intended.
[v_id_vector_map]
name = v_id_vector_map
type = VERTEX_VECTOR
required_resources = dbpedia-graph,categories-vectors
resource_class = GraphVertexVectorIndexResource
vprop_name = lod_url
; ============ late-initialized resources ============
; Input document resource; it depends on no other resource.
[document]
name = document
type = DOCUMENT
; intentionally empty: no dependencies
required_resources =
resource_class = CclDocumentResource
; NOTE(review): presumably defers creation until the input is supplied at run
; time - confirm in ResourceManager.
late_init = true
; Document context built from the document and the concept mappings.
[document-context]
name = document-context
type = DOCUMENT_CONTEXT
required_resources = document,concepts-dbpedia-categories-mapping,concept-node-mapping
; orth_idf_w_map is the `name` declared under the [concept-weights] section.
; NOTE(review): spacing after commas is inconsistent in this list; presumably
; the loader strips whitespace around each entry - confirm.
optional_resources = v-lod-url-mapping, categories-vectors, concepts-vectors, orth_idf_w_map,doc-context-debug-log
resource_class = CclDocumentContextResource
late_init = true
; Vertex weights; VERTEX_WEIGHT is one of the types listed in
; [algorithm] required_rtypes.
[v-id-v-weight-mapping]
name = v-id-v-weight-mapping
type = VERTEX_WEIGHT
required_resources = document-context,lod-url-v-mapping,categories-vectors
resource_class = GraphVertexWeightIndexResource
late_init = true
; NOTE(review): the meaning of batches_no and set_zeros is defined by
; GraphVertexWeightIndexResource, which is not visible here.
batches_no = 8
set_zeros = true
; Ranking produced by the algorithm; it declares no dependencies.
[gtpprmc-ranking]
name = gtpprmc-ranking
type = ALGO_RANKING
; intentionally empty: no dependencies
required_resources =
resource_class = AlgoRankingResource
late_init = true
; NOTE(review): presumably means the resource is created explicitly by the
; caller rather than by ResourceManager - confirm.
manual_init = true
[output-keywords-path]
; The output path is declared as a resource only so that results are not
; created automatically when no path is passed to a run.
name = output-keywords-path
type = OUTPUT
; intentionally empty: no dependencies
required_resources =
resource_class = StringResource
late_init = true
; Final results resource; it depends on the ranking, the mappings, the labels
; and the output path.
[results]
name = results
type = RESULTS
required_resources = document-context,gtpprmc-ranking,doc-context-debug-log,lod-url-v-mapping,v-lod-url-mapping,category-label,output-keywords-path
resource_class = ResultsResource
late_init = true
manual_init = true
as_json = true
; disabled: score threshold
; min_score_threshold = 0.0003
; NOTE(review): presumably the number of top-ranked keywords kept - confirm.
n_best_keywords = 10
; disabled: fixed output location, superseded by output_path_suffix below
; output_ranking = %(data_dir)s/ranking.tsv
; NOTE(review): presumably appended to the value of output-keywords-path -
; confirm in ResultsResource.
output_path_suffix = ranking.tsv
; Debug log of the document context; WATCHER is one of the types listed in
; [algorithm] required_rtypes.
[doc-context-debug-log]
name = doc-context-debug-log
type = WATCHER
required_resources = output-keywords-path
resource_class = DocumentContextLogResource
late_init = true
; NOTE(review): presumably appended to the value of output-keywords-path -
; confirm in DocumentContextLogResource.
output_path_suffix = doc-context.log
; disabled: fixed output location, superseded by output_path_suffix above
; output_path = %(data_dir)s/doc-context-debug.log
with_labels = true
; config for static resources
; description:
; Every section represents each resource
; (from keyword_assignment_tool.resource.resources module) to load by ResourceManager.
; Compulsory properties for each resource:
; - name
; - type - conceptual type of resource (one from set of available types defined
; in keyword_assignment_tool.config.resource_types module)
; - resource_class (class specified in resource package)
; Note that if implementation of certain resource will require additional
; properties, then such must be provided by declaring them in certain section
; Note about paths:
; by default, every path in this file should either name a file in the
; 'keyword_assignment_tool.data' module, be an absolute path, or use an
; interpolation variable. The path to the data directory can also be passed as a
; parameter to the constructor of KwConfig.
; Keep in mind that only files included in the installation setup.py file will be
; available in the mentioned module directory.
; Static graph resource loaded from a GraphML file.
[dbpedia-graph]
name = dbpedia-graph
type = GRAPH
resource_class = GraphResource
; bare file name; see the "Note about paths" in this file's header comment
path = graph-2018-11-13-categories-broader-narrower-weighted-001-filtered-meaningless.graphml
; the same property name (lod_url) is used as key_prop_name by the derived
; vertex index sections
v_id_prop_name = lod_url
; Static concept-to-category index.
; NOTE(review): the section header (concepts_categories_mapping) differs from
; `name`; other sections reference this resource by its `name` value.
[concepts_categories_mapping]
name = concepts-dbpedia-categories-mapping
type = CONCEPT_VERTEX_ID
resource_class = ZippedTextIndexResource
path = concept_category_index_only_dbpedia_concepts_reduced_v4_many.txt.bin.zip
; Static vectors resource typed VERTEX_ID_VECTOR; required by
; [v-id-v-weight-mapping] and [v_id_vector_map].
[categories-vectors]
name = categories-vectors
type = VERTEX_ID_VECTOR
resource_class = VectorsResource
path = cats_keyed_vectors_v2.bin.zip
; Static vectors resource typed CONCEPT_VECTOR; listed as optional by
; [document-context].
[concepts-vectors]
name = concepts-vectors
type = CONCEPT_VECTOR
resource_class = VectorsResource
path = concepts_keyed_vectors.bin.zip
[concept-weights]
name = orth_idf_w_map
type = CONCEPT_WEIGHT
resource_class = IndexValueResource
path = idf-dict2_norm_sorted.tsv
need_normalisation = true
delimiter = %(tabulation)s