? 'icuchain words-icu.xml'
: 'charmap word-phrase-utf.chr';
+$config{ZEBRA_PTOKENIZER_STMT} = $config{ZEBRA_TOKENIZER} eq 'icu' # phrase-tokenizer statement; presumably fills the __ZEBRA_PTOKENIZER_STMT__ placeholder (verify against the rewrite step)
+ ? 'icuchain phrases-icu.xml' # ICU tokenizer selected: point at the phrase ICU chain file
+ : 'charmap word-phrase-utf.chr'; # any other tokenizer value: use the charmap definition
+
my %test_suite_override_dirs = (
KOHA_CONF_DIR => ['etc'],
ZEBRA_CONF_DIR => ['etc', 'zebradb'],
index p
completeness 1
firstinfield 1
-__ZEBRA_TOKENIZER_STMT__
+__ZEBRA_PTOKENIZER_STMT__
# URX (URL) index
# Used if structure=urx (@attr 4=104)
--- /dev/null
+<icu_chain locale=""> <!-- ICU chain referenced as phrases-icu.xml; NOTE(review): locale is empty here, confirm this is accepted and intended -->
+ <transform rule="[:Control:] Any-Remove"/> <!-- drop control characters before tokenizing -->
+ <tokenize rule="l"/> <!-- rule "l": presumably line tokenization, keeping the phrase as one token (confirm in the YAZ ICU chain docs) -->
+ <transform rule="[:Punctuation:] Remove"/> <!-- strip punctuation characters -->
+ <transform rule="NFD"/> <!-- decompose so combining marks become separate code points -->
+ <transform rule="[:Nonspacing Mark:] Remove"/> <!-- remove the nonspacing (combining) marks exposed by NFD -->
+ <transform rule="NFC"/> <!-- recompose what remains -->
+ <display/> <!-- presumably marks where the display form of the term is taken, i.e. before lowercasing (confirm in the YAZ docs) -->
+ <casemap rule="l"/> <!-- rule "l": presumably lowercases the term (confirm in the YAZ docs) -->
+</icu_chain>
'__ZEBRA_LANGUAGE__' => 'en',
'__ZEBRA_TOKENIZER__' => 'chr',
'__ZEBRA_TOKENIZER_STMT__' => 'charmap word-phrase-utf.chr',
+ '__ZEBRA_PTOKENIZER_STMT__' => 'charmap word-phrase-utf.chr',
'__ZEBRA_AUTH_CFG__' => 'zebra-authorities.cfg',
'__ZEBRA_BIB_CFG__' => 'zebra-biblios.cfg',
'__AUTH_RETRIEVAL_CFG__' => 'retrieval-info-auth-grs1.xml',