# default.cfg
[BASIC]
# the input ontology file; mandatory; it can also be set to a projected ontology
ontology_file = ./case_studies/data/helis_v1.00.origin.owl
# ontology_file = ./cache/projection.ttl
#ontology_file = ./case_studies/pizza/pizza.owl
# ontology_file = ./case_studies/simple/test_ontology.owl
# the output directory for the embedding; if not set, the default $cache_dir/output is used
# embedding_dir = ./case_studies/simple/
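
The settings above and below form a plain INI file, so they can be loaded with Python's standard configparser. The following is a minimal sketch of reading ontology_file and the optional embedding_dir; the fallback logic for embedding_dir is an assumption based on the comments above.

import configparser

config = configparser.ConfigParser()
config.read("default.cfg")

ontology_file = config["BASIC"]["ontology_file"]
# embedding_dir is optional; fall back to the assumed default under the cache directory
embedding_dir = config["BASIC"].get(
    "embedding_dir",
    config["DOCUMENT"].get("cache_dir", "./cache/") + "output"
)
print(ontology_file, embedding_dir)
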
[DOCUMENT]
# cache directory for storing files; if not set, it creates a default: ./cache/
cache_dir = ./cache/
# whether to use the projected ontology
# default: no
ontology_projection = yes
# project only the taxonomy of the ontology, without other relationships; default: no
projection_only_taxonomy = no
# whether to use multiple labels/synonyms for the literal/mixed sentences; default: no
multiple_labels = yes
# avoid OWL constructs such as rdfs:subClassOf in the document; default: no
avoid_owl_constructs = no
# whether to save the document of sentences; default: no
save_document = yes
# reasoner for extracting axioms: hermit, elk, or none; none means no reasoning is used
# axiom_reasoner = hermit
# axiom_reasoner = elk
axiom_reasoner = none
# the seed entities for generating the walks
# default: all the named classes and instances cached in cache/entities.txt
# comment it out if the default Python program should extract all classes and individuals as the seed entities
# pre_entity_file = ./cache/entities.txt
# the annotations and axioms can be pre-calculated and saved in some directory (e.g., the cache directory)
# OWL2Vec will use the pre-calculated files if these options are set; otherwise it extracts them by default
# comment them out if the default Python program should extract the annotations and axioms
# pre_annotation_file = ./cache/annotations.txt
# pre_axiom_file = ./cache/axioms.txt
# walker and walk_depth must be set
# random walk or random walk with Weisfeiler-Lehman (wl) subtree kernel
walker = random
#walker = wl
walk_depth = 3
# whether to use the URI/Literal/Mixture documents (yes or no)
# they can be overwritten by the command line parameters
URI_Doc = yes
Lit_Doc = yes
Mix_Doc = no
# the type for generating the mixture document (all or random)
# works when Mix_Doc is set to yes
# Mix_Type = all
Mix_Type = random
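
The walker settings above control how walks over the (projected) ontology graph are turned into sentences. The snippet below is only an illustrative sketch of a plain random walk of the configured depth over an RDF graph with rdflib, not the project's actual walker; the input file and the example start entity URI are assumptions.

import random
from rdflib import Graph, URIRef

g = Graph()
g.parse("./cache/projection.ttl", format="turtle")

def random_walk(graph, start, depth):
    # one walk [start, p1, o1, p2, o2, ...] of at most `depth` hops
    walk = [start]
    node = start
    for _ in range(depth):
        neighbours = [(p, o) for _, p, o in graph.triples((node, None, None))
                      if isinstance(o, URIRef)]
        if not neighbours:
            break
        p, o = random.choice(neighbours)
        walk.extend([p, o])
        node = o
    return [str(n) for n in walk]

start_entity = URIRef("http://www.fbk.eu/ontologies/virtualcoach#Food")  # assumed example entity
print(random_walk(g, start_entity, depth=3))  # walk_depth = 3
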
[MODEL]
# the directory of the pre-trained word2vec model
# default: without pre-training
# comment it out if no pre-training is needed
# pre_train_model = ~/w2v_model/enwiki_model/word2vec_gensim
# Available from https://tinyurl.com/word2vec-model
# the embedding size
# if a pre-trained model is adopted, the size of that model is used instead
embed_size = 100
# number of iterations in training the word2vec model
# i.e., epochs in gensim 4.x.x
iteration = 10
# for training the word2vec model without pre-training
window = 5
min_count = 1
negative = 25
seed = 42
# number of epochs for fine-tuning the pre-trained model
epoch = 100
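
As a rough guide, the [MODEL] settings map naturally onto gensim 4.x Word2Vec parameters (embed_size to vector_size, iteration to epochs). The sketch below is an assumption about how they might be consumed; the toy `walks` sentence, the output path, and sg=1 (skip-gram) are not taken from this file.

from gensim.models import Word2Vec

# toy sentence standing in for the walk/annotation document
walks = [["http://example.org/A",
          "http://www.w3.org/2000/01/rdf-schema#subClassOf",
          "http://example.org/B"]]

model = Word2Vec(
    sentences=walks,
    vector_size=100,  # embed_size
    window=5,         # window
    min_count=1,      # min_count
    negative=25,      # negative
    seed=42,          # seed
    epochs=10,        # iteration (epochs in gensim 4.x)
    sg=1,             # skip-gram; an assumption, not set in this file
)
model.save("./cache/output/word2vec.model")  # hypothetical output path under embedding_dir

When a pre-trained model is loaded instead, further training would typically go through model.train(walks, total_examples=len(walks), epochs=100), which is where the epoch setting above would plausibly apply.
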