We can start by looking at the conf file, just to make sure there is nothing odd in the configuration. This is the call to indexer:
sudo -H -u manticore /usr/bin/indexer --config /etc/manticoresearch/manticore_langs.conf myhb_zh
Here is the conf.
#############################################################################
# index definition
#############################################################################
# Base index definition. "index myhb_zh:common" further down inherits every
# setting declared here and overrides or adds only what it needs.
index common
{
type = plain
dict = keywords
wordforms = /var/lib/manticore/wordforms.txt
# Length thresholds: words shorter than 2 characters and infixes shorter
# than 3 characters are not indexed.
# NOTE(review): child indexes inherit both values - confirm they suit every
# language that derives from this block.
min_word_len = 2
min_infix_len = 3
expand_keywords = 1
# Blended characters: '+', '&', '#' (U+0023), '-' and '/' (U+002F).
# '#' and '/' are written as code points rather than literally; '#' would
# otherwise start a comment in this file.
blend_chars = +, &, U+0023, -, U+002F
blend_mode = trim_none, skip_pure
# Strip HTML markup from the indexed text; for the listed elements the
# element contents are removed as well.
html_strip = 1
html_remove_elements = style, script, title, head
preopen = 1
index_exact_words = 1
# Special terms equivalence: Greek letters are rewritten to their spelled-out
# names, and the word "percent" to the '%' sign.
# NOTE(review): filters are listed in a deliberate order - presumably applied
# top to bottom; keep the order when editing.
regexp_filter = (β) => beta
regexp_filter = (α) => alpha
# NOTE(review): the pattern has no word boundaries, so it presumably also
# rewrites "percent" inside longer words (e.g. "percentage"); also verify that
# '%' is an indexable character here (it is not listed in blend_chars).
regexp_filter = (percent) => %
#
# Dosages common form: bring all dosages into common form
# i.e. 150 mg to 150mg etc... with no space between numeric and units parts
#
# Capture groups: \1 leading separator, \2 numeric part (digits with an
# optional '.' or ',' separator), \3 separator between number and unit,
# \4 unit, \5 trailing separator. The replacement omits \3, which is what
# joins the number and the unit. (?i) makes the unit match case-insensitive.
# NOTE(review): both digit runs in \2 are optional, so the numeric part may
# match an empty string - confirm a bare unit surrounded by separators is
# meant to be rewritten too.
regexp_filter = (?i)(\s|\b)+(\pN*[.,]?\pN*)(\s|\b)+(mg\/ml|ml\/amp|mg|ml|ui|g|units|iu|mcg|µg)(\s|\b)+ => \1\2\4\5
}
# Chinese
index myhb_zh:common
{
    # Chinese index. Anything not set in this block comes from "common".
    # NOTE(review): that includes min_word_len = 2 and min_infix_len = 3;
    # confirm they are appropriate for ICU-segmented Chinese text, where
    # tokens may be a single character.

    # Where the data comes from and where the index files are written.
    # The "zh_products" source is expected to be declared elsewhere in the
    # configuration.
    path           = /var/lib/manticore/myhb_zh
    source         = zh_products

    # Option A (active): ICU-based Chinese word segmentation.
    morphology     = icu_chinese
    charset_table  = chinese

    # Built-in Chinese stopword list.
    stopwords      = zh

    # Option B (disabled): character n-gram indexing instead of ICU.
    # Enable these two lines as the alternative to the ICU morphology above.
    #ngram_chars = chinese
    #ngram_len = 1
}
#############################################################################
# indexer settings
#############################################################################
indexer
{
    # --- memory -----------------------------------------------------------
    # Indexing memory limit; accepts bytes, kilobytes (e.g. 16384K) or
    # megabytes (e.g. 256M).
    # Optional. Default 128M, maximum 2047M, recommended 256M to 1024M.
    mem_limit               = 1024M

    # Lemmatizer cache size; speeds up indexing when lemmatization is
    # enabled. Optional, default 256K.
    lemmatizer_cache        = 128M

    # --- file fields ------------------------------------------------------
    # Upper bound of the buffer used when reading file fields.
    max_file_field_buffer   = 128M

    # Reaction to IO errors while reading file fields. Known values:
    # 'ignore_field', 'skip_document', 'fail_index'.
    # Optional, default 'ignore_field'.
    on_file_field_error     = ignore_field
}
# --eof--