-
Notifications
You must be signed in to change notification settings - Fork 87
/
Copy pathyago.ini
87 lines (78 loc) · 3.03 KB
/
yago.ini
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
# This is an example yago.ini file for triggering full extraction.
# Please keep it up to date when you change YAGO.
# For personal use, please work on a copy of this file instead of editing it.
# Number of threads to run in parallel.
numThreads = 6
# When enabled, skip every extractor whose output files all exist already.
reuse = true
# When enabled, every extractor that is executed also triggers its children,
# even if the children's output files exist already.
rerunDependent = true
# Destination folder for the generated TSV files.
# NOTE(review): FOLDER looks like a placeholder to be replaced with a real
# path in your own copy of this file.
yagoFolder = FOLDER
# When enabled, only show the actions that would be taken, without modifying
# or generating any files.
simulate = false
# NOTE(review): presumably the folder used in place of yagoFolder while
# simulate is enabled -- confirm against the code that reads this key.
yagoSimulationFolder = FOLDER
# Option 1 (commented out below): list the Wikipedia dumps explicitly,
# together with the corresponding languages.
# en should come first.
#languages = en, ro
#wikipedias = /GW/D5data/wikipedia_dumps/en/20140626/enwiki-latest-pages-articles.xml,
# /GW/D5data/wikipedia_dumps/ro/20140314/rowiki-20140314-pages-articles.xml
# Path to the Wikidata dump (also part of option 1, commented out).
#wikidata = /GW/D5data-8/yago/dumps/wikidatawiki/20170522/wikidata-20170522-all-BETA.ttl
# Option 2 (active): specify only the folder for the dumps and the languages,
# and use the script to download the dumps.
dumpsFolder = FOLDER
languages = en, de, fr, nl, it, es, ro, pl, ar, fa
# Extractors to run, given as one comma-separated list that continues over
# the following lines. The order of the entries does not matter.
# The three SPOTLX entries at the end of the list are commented out.
# NOTE(review): the last active entry (fromWikipedia.StructureExtractor) keeps
# a trailing comma -- confirm that the ini parser tolerates this.
extractors = fromOtherSources.PatternHardExtractor,
deduplicators.ClassExtractor,
deduplicators.DateExtractor,
deduplicators.FactExtractor,
deduplicators.LabelExtractor,
deduplicators.LiteralFactExtractor,
deduplicators.MetaFactExtractor,
deduplicators.SchemaExtractor,
deduplicators.SourceExtractor,
fromGeonames.GeoNamesDataImporter,
fromGeonames.GeoNamesEntityMapper,
fromGeonames.GeoNamesClassMapper,
fromOtherSources.HardExtractor,
fromOtherSources.DictionaryExtractor,
fromOtherSources.UWNImporter,
fromOtherSources.WikidataLabelExtractor,
fromOtherSources.WordnetDomainExtractor,
fromOtherSources.WordnetDomainHierarchyExtractor,
fromOtherSources.WordnetExtractor,
fromThemes.AttributeMatcher,
fromThemes.CategoryClassExtractor,
fromThemes.CategoryClassHierarchyExtractor,
fromThemes.CategoryMapper,
fromThemes.CategoryTypeExtractor,
fromThemes.CoherentTypeExtractor,
fromThemes.DBpediaLinker,
fromThemes.GenderNameExtractor,
fromThemes.InfoboxMapper,
fromThemes.InfoboxTermExtractor,
fromThemes.InfoboxTypeExtractor,
fromThemes.PersonNameExtractor,
fromThemes.RelationChecker,
fromThemes.RuleExtractor,
fromThemes.SimpleTypeExtractor,
fromThemes.StatisticsExtractor,
fromThemes.TransitiveTypeExtractor,
fromWikipedia.CategoryExtractor,
fromWikipedia.CategoryHierarchyExtractor,
fromWikipedia.CoordinateExtractor,
fromWikipedia.DisambiguationPageExtractor,
fromWikipedia.FlightExtractor,
fromWikipedia.GenderExtractor,
fromWikipedia.InfoboxExtractor,
fromWikipedia.RedirectExtractor,
fromWikipedia.TemporalInfoboxExtractor,
fromWikipedia.WikiInfoExtractor,
fromWikipedia.ConteXtExtractor,
fromWikipedia.StructureExtractor,
# deduplicators.SPOTLXDeduplicator,
# fromThemes.SPOTLXRuleExtractor,
# fromThemes.SPOTLXDeductiveExtractor,