access_blob_attrs |
active |
mmap, mmap_preread, mlock |
mmap_preread |
query, ram |
Specifies how index's blob attributes file is accessed |
access_doclists |
active |
file, mmap, mlock |
file |
query, ram |
Specifies how index's doclists file is accessed |
access_hitlists |
active |
file, mmap, mlock |
file |
query, ram |
Specifies how index's hitlists file is accessed |
access_plain_attrs |
active |
mmap, mmap_preread, mlock |
mmap_preread |
query, ram |
Specifies how search server will access index's plain attributes |
agent |
active |
repeatablekey |
null |
cluster |
List of remote agents that are searched every time the enclosing distributed index is searched. |
agent_blackhole |
active |
repeatablekey: host:port:indexlist |
null |
cluster, net |
Lets you fire-and-forget queries to remote agents. That is useful for debugging (or just testing) production clusters |
agent_connect_timeout |
active |
int (milliseconds) |
1000 (1 second) |
cluster, net |
Remote agent connection timeout |
agent_persistent |
active |
repeatablekey: host:port:indexlist |
null |
cluster, net |
Asks to persistently connect to agent (i.e. don't drop connection after query). |
agent_query_timeout |
active |
int (milliseconds) |
3000 (3 seconds) |
cluster, net |
Remote agent query timeout. |
agent_retry_count |
active |
int |
searchd.agent_retry_count |
cluster, net |
How many times Manticore will try to connect and query remote agents in a distributed index before reporting a fatal query error. |
attr_update_reserve |
active |
int + sizeunit |
128k |
disk |
Sets the space to be reserved for blob attribute updates. |
bigram_freq_words |
active |
wordlist |
null |
token, nlp, query |
A list of keywords considered "frequent" when indexing bigrams. |
bigram_index |
active |
none, all, first_freq, both_freq |
null |
token, nlp, query |
Bigram indexing is a feature to accelerate phrase searches. |
blend_chars |
active |
charlist |
null |
token, nlp |
Blended characters list. |
blend_mode |
active |
multiple: trim_none, trim_head, trim_tail, trim_both, trim_all, skip_pure |
trim_none |
token, nlp |
Blended tokens indexing mode. |
charset_table |
active |
complex value |
latin and cyrillic characters |
base, charset, token, nlp |
Accepted characters array, with case folding rules. |
charset_type |
removed |
|
|
|
|
columnar_attrs |
active |
fieldlist |
|
columnar, schema |
Specifies what attributes should be stored in the columnar storage instead of the default row-wise storage. |
dict |
active |
keywords, crc |
keywords |
token, nlp |
The keywords dictionary type. |
docinfo |
removed |
extern, none, inline |
extern |
|
Docinfo storage mode defines how exactly docinfo will be physically stored on disk and RAM. |
docstore_block_size |
active |
int + sizeunit |
16k |
disk |
Size of the block of documents used by document storage. |
docstore_compression |
active |
lz4, lz4hc, none |
lz4 |
disk |
Type of compression used to compress blocks of documents used by document storage. |
docstore_compression_level |
active |
1 - 12 |
9 |
disk |
Compression level in document storage when 'lz4hc' compression is used. |
embedded_limit |
active |
int + sizeunit |
16k |
parse |
File size limit for embedded exceptions, wordforms, or stop words file. |
enable_star |
removed |
|
|
|
|
exceptions |
active |
filepath |
null |
token, nlp, synonym, exception |
Tokenizing exceptions file. |
expand_keywords |
active |
0, 1, exact, star |
0 (do not expand keywords) |
token, nlp, wildcard |
Expands keywords with their exact forms (i.e. the forms of the keywords before applying any morphological modifications) and/or stars when possible. |
global_idf |
active |
filepath |
null |
cluster, nlp |
The path to a file with global (cluster-wide) keyword IDFs. |
ha_strategy |
active |
random, nodeads, noerrors, roundrobin |
random |
cluster |
Agent mirror selection strategy for load balancing. |
hitless_words |
active |
all, filepath |
null (all words are considered not hitless) |
token, nlp |
Hitless words list. |
html_index_attrs |
active |
tagattrlist |
null (do not index markup attributes) |
html, token |
A list of markup attributes to index when stripping HTML. |
html_remove_elements |
active |
taglist |
null (do not strip contents of any elements) |
html, token |
A list of HTML elements for which to strip contents along with the elements themselves. |
html_strip |
active |
0, 1 |
0 (disable stripping) |
html, token |
Whether to strip HTML markup from incoming full-text data. |
ignore_chars |
active |
charlist |
null |
token, charset, nlp |
Ignored characters list. |
index_exact_words |
active |
0, 1 |
0 (do not index) |
token, stem, wildcard, nlp, morphology |
Whether to index the original keywords along with the stemmed/remapped versions. |
index_field_lengths |
active |
0, 1 |
0 (do not index) |
results, query, nlp |
Enables computing and storing of field lengths (both per-document and average per-index values) into the index. |
index_sp |
active |
0, 1 |
0 (do not detect any sentence or paragraph) |
token, html |
Whether to detect and index sentence and paragraph boundaries. |
index_token_filter |
active |
library name:plugin name:optional string of settings |
none |
token, nlp |
Compiled library providing an index-time token filter for the index. |
index_zones |
active |
taglist |
null (do not index zones) |
html, token |
A list of in-field HTML/XML zones to index. |
infix_fields |
active |
fieldlist |
null (index all fields in infix mode) |
token, wildcard, nlp |
The list of full-text fields to limit infix indexing to. |
inplace_docinfo_gap |
removed |
int + sizeunit |
0 |
|
In-place inversion fine-tuning option. Controls preallocated docinfo gap size. |
inplace_enable |
active |
0, 1 |
0 (use separate temporary files) |
disk, plain |
Whether to enable in-place index inversion. |
inplace_hit_gap |
active |
int + sizeunit |
|
disk, plain |
In-place inversion fine-tuning option. Controls preallocated hitlist gap size. |
inplace_reloc_factor |
active |
float, between 0 and 1 |
0.1 |
disk, plain |
Controls relocation buffer size within indexing memory arena. |
inplace_write_factor |
active |
float, between 0 and 1 |
0.1 |
disk, plain |
Controls in-place write buffer size within indexing memory arena. |
killlist_target |
active |
indexlist + killlist mode (kl / id) |
null |
plain |
Sets the index(es) that the kill-list will be applied to. |
local |
active |
repeatablekey |
null |
cluster, distributed |
Local index reference within a distributed index. |
max_substring_len |
deprecated |
int |
0 (do not limit indexed substrings) |
nlp, wildcard, dictcrc |
Maximum substring (either prefix or infix) length to index. |
min_infix_len |
active |
int |
0 (disallow infixes) |
token, wildcard, nlp |
Minimum infix length to index and search. |
min_prefix_len |
active |
int |
0 (disallow prefixes) |
token, wildcard, nlp |
Minimum word prefix length to index and search. |
min_stemming_len |
active |
int |
1 (stem everything) |
token, wildcard, stem, nlp, morphology |
Minimum word length at which to enable stemming. |
min_word_len |
active |
int |
1 (index everything) |
token, nlp |
Minimum indexed word length. |
mirror_retry_count |
active |
int |
5 |
cluster |
The same as agent_retry_count. If both values are provided, mirror_retry_count will be taken. |
mlock |
deprecated |
0, 1 |
0 (do not call mlock()) |
|
Memory locking for cached data. |
morphology |
active |
preprocessorlist |
null (do not apply any preprocessor) |
token, nlp, morphology |
A list of morphology preprocessors to apply. |
morphology_skip_fields |
active |
fieldlist |
null (apply preprocessors to all fields) |
token, nlp, morphology |
A list of fields to skip morphology preprocessing. |
ngram_chars |
active |
charlist |
null |
cjk, nlp |
N-gram characters list. |
ngram_len |
active |
0, 1 |
0 (disable) |
cjk, nlp |
N-gram lengths for N-gram indexing. |
ondisk_attrs |
deprecated |
0, 1, pool |
|
|
Allows for fine-grained control over how attributes are loaded into memory when using indexes with external storage. |
ondisk_dict |
removed |
|
|
|
|
overshort_step |
active |
0, 1 |
1 |
token, nlp |
Position increment on overshort (less than min_word_len) keywords. |
path |
active |
filepath |
required |
base, required, cluster |
Absolute or relative path without extension where to store the index or where to look for it. IMPORTANT: use trailing slash |
phrase_boundary |
active |
charlist |
null |
token, nlp |
Phrase boundary characters list. |
phrase_boundary_step |
active |
int |
|
token, nlp |
Phrase boundary word position increment. |
prefix_fields |
active |
fieldlist |
null (index all fields in prefix mode) |
token, wildcard, nlp |
List of full-text fields to limit prefix indexing to. |
preopen |
active |
0, 1 |
|
startup, query |
Tells searchd that it should pre-open all index files on startup (or rotation) and keep them open while it runs. |
read_buffer_docs |
active |
int + sizeunit; min 8k |
256k |
disk, query |
Per-keyword read buffer size for document lists. |
read_buffer_hits |
active |
int + sizeunit; min 8k |
256k |
disk, query |
Per-keyword read buffer size for hit lists. |
read_unhinted |
active |
int + sizeunit; min 1k |
32k |
disk, query |
Unhinted read size. |
regexp_filter |
active |
repeatablekey: regex |
null |
token |
Regular expressions (regexps) to filter the fields and queries with. |
rlp_context |
removed |
filepath |
null |
|
RLP context configuration file. Mandatory if RLP is used. |
rt_mem_limit |
active |
int + sizeunit |
128m |
ram, query |
RAM chunk size limit. |
source |
active |
repeatablekey: source |
null |
plain |
Specifies document source to get documents from when the current index is indexed. |
stopword_step |
active |
0, 1 |
1 |
token, stopword, nlp |
Position increment on stopwords. |
stopwords |
active |
filepathlist |
null |
token, stopword, nlp |
Stop word files list (space separated). |
stopwords_unstemmed |
active |
0, 1 |
0 (apply stop word filter after stemming) |
token, stopword, nlp |
Whether to apply stop words before or after stemming. |
stored_fields |
active |
fieldlist |
null (no fields stored) |
schema |
Values from the fields will be both indexed and stored. |
stored_only_fields |
active |
fieldlist |
null (no fields stored) |
schema |
A list of fields that will be stored in the index but will not be indexed. |
type |
active |
rt, plain |
plain |
base |
Index type |
wordforms |
active |
repeatablekey: filepath |
null |
token, nlp, wordform |
Word forms dictionary file. |