# config.toml
# One table per component; every filesystem path below is absolute.
# Settings for the Wikipedia dump processor.
[WikipediaProcessor]
# Absolute path to the pages-articles XML dump; the file name identifies it
# as the bgwiki dump dated 2025-01-20.
Path = "/data/WikiSearchData/bgwiki-20250120-pages-articles.xml"
# NOTE(review): presumably the maximum number of pages to process from the
# dump - confirm against the consumer. This key is independent of
# [Crawler].CrawlLimit even though the name is the same.
CrawlLimit = 441386
# Settings for the web crawler.
[Crawler]
# Site the crawler targets.
# NOTE(review): presumably used to keep the crawl on this host - confirm.
Domain = "https://bg.wikipedia.org"
# NOTE(review): presumably the maximum number of pages to fetch; far smaller
# than [WikipediaProcessor].CrawlLimit, which is a separate key - confirm
# that the low value is intentional.
CrawlLimit = 10
# Starting URLs for the crawl; currently a single entry equal to Domain.
SeedURLs = ["https://bg.wikipedia.org"]
# Settings for the on-disk database.
[FileDatabase]
# Absolute path of the database location (the directory is named LMDB).
Path = "/data/WikiSearchData/LMDB"
# NOTE(review): Size is a quoted string, not a TOML integer. The value fits
# in TOML's 64-bit signed integer range, but changing the type here could
# break the reader - confirm what the consumer expects before converting.
# Presumably a size in bytes (about 66.6 GB) - verify the unit.
Size = "66571993000"
# Settings for the USearch index file.
[USearchIndex]
# Absolute path of the index file.
Path = "/data/WikiSearchData/SemanticIndex/index.usearch"
# NOTE(review): presumably the vector dimensionality of the index; same value
# as [FAISSIndex].dimension. The key is lowercase while the other keys in
# this file are PascalCase; TOML keys are case-sensitive, so do not rename it
# without updating the code that reads it.
dimension = 768
# Settings for the FAISS index file.
[FAISSIndex]
# Absolute path of the index file.
Path = "/data/WikiSearchData/SemanticIndex/index.faiss"
# NOTE(review): presumably the vector dimensionality of the index; same value
# as [USearchIndex].dimension. The key is lowercase while the other keys in
# this file are PascalCase; TOML keys are case-sensitive, so do not rename it
# without updating the code that reads it.
dimension = 768
# Dictionary files for the spell checker.
# NOTE(review): the .aff/.dic pairing looks like Hunspell-style affix and
# dictionary files - confirm against the library actually used.
[SpellChecker]
# Affix rules file (bg_BG, UTF-8 per the file name).
AffPath = "/data/WikiSearchData/SpellChecker/bg_BG_utf8.aff"
# Main dictionary file (bg_BG, UTF-8 per the file name).
DicPath = "/data/WikiSearchData/SpellChecker/bg_BG_utf8.dic"
# Additional custom dictionary file.
# NOTE(review): presumably loaded on top of DicPath - confirm.
CustomDicPath = "/data/WikiSearchData/SpellChecker/custom_utf8.dic"
# Data files for autocompletion.
# NOTE(review): the .dawg extension suggests directed acyclic word graph
# files - confirm the format with the code that loads them.
[Autocompletion]
# Absolute path of the word-completion data file.
WordCompletionDAWG = "/data/WikiSearchData/Autocompletion/word-completion.dawg"
# Absolute path of the next-word data file.
NextWordDAWG = "/data/WikiSearchData/Autocompletion/next-word.dawg"
# Settings for the search evaluator.
[Evaluator]
# NOTE(review): presumably NumBatches * QueriesPerBatch = 150 queries per
# evaluation run, keeping ResultsPerQuery results for each - confirm how the
# evaluator combines these three values.
NumBatches = 5
QueriesPerBatch = 30
ResultsPerQuery = 20
# JSON files for per-backend results and metrics, one pair for the inverted
# backend and one for the semantic backend.
# NOTE(review): whether these are outputs written by the evaluator or inputs
# it reads is not visible here - verify.
InvertedResults = "/data/WikiSearchData/Stats/inverted_results.json"
SemanticResults = "/data/WikiSearchData/Stats/semantic_results.json"
InvertedMetrics = "/data/WikiSearchData/Stats/inverted_metrics.json"
SemanticMetrics = "/data/WikiSearchData/Stats/semantic_metrics.json"