-## $Id: Makefile.am,v 1.9 2006-06-28 13:26:18 adam Exp $
+## $Id: Makefile.am,v 1.10 2007-12-13 18:10:35 adam Exp $
+## Tab data files: everything listed in tabdata_DATA is installed into
+## tabdatadir, and the same list is reused for EXTRA_DIST so the files
+## are also included in the distribution.
tabdatadir = $(datadir)/$(PACKAGE)$(PACKAGE_SUFFIX)/tab
tabdata_DATA = bib1.att dan1.att danmarc.abs danmarc.mar \
nwi.flt refer.flt scan.chr sgml.flt soif.flt string.chr summary.abs \
summary.tag tagsetg.tag tagsetm.tag urx.chr usmarc.abs usmarc-b.est \
usmarc.flt usmarc.mar usmarc.tag var1.var wais.abs wais-b.est \
- wais-variant.est marc21.abs
+ wais-variant.est marc21.abs words-icu.xml phrases-icu.xml icu.idx
EXTRA_DIST = $(tabdata_DATA)
--- /dev/null
+# ICU indexing for words and phrases. Otherwise similar
+# to default.idx.
+# $Id: icu.idx,v 1.1 2007-12-13 18:10:35 adam Exp $
+
+# Traditional word index
+# Used if completeness is 'incomplete field' (@attr 6=1) and
+# structure is word/phrase/word-list/free-form-text/document-text
+# Terms for this index are processed by the ICU chain in words-icu.xml.
+index w
+completeness 0
+position 1
+alwaysmatches 1
+firstinfield 1
+icuchain words-icu.xml
+# debug 1
+
+# Phrase index
+# Used if completeness is 'complete {sub}field' (@attr 6=2, @attr 6=3)
+# and structure is word/phrase/word-list/free-form-text/document-text
+# Terms for this index are processed by the ICU chain in phrases-icu.xml.
+index p
+completeness 1
+icuchain phrases-icu.xml
+# debug 1
+
+# Sort register
+# Unlike the w and p indexes in this file, this register uses the
+# string.chr character map rather than an ICU chain.
+sort s
+completeness 1
+charmap string.chr
+
+# Staticrank (uncomment to enable)
+#staticrank r
--- /dev/null
+<!-- ICU chain for locale "en" (no id attribute).
+     NOTE(review): presumably this is phrases-icu.xml, the chain named by
+     "index p" in icu.idx; confirm against the file name.
+     Steps as listed: remove control characters, tokenize with rule "s"
+     (sentence boundaries per the YAZ ICU docs; verify), remove
+     punctuation, display step, casemap with rule "l". -->
+<icu_chain locale="en">
+ <transform rule="[:Control:] Any-Remove"/>
+ <tokenize rule="s"/>
+ <transform rule="[:Punctuation:] Remove"/>
+ <display/>
+ <casemap rule="l"/>
+</icu_chain>
--- /dev/null
+<!-- ICU chain "en:word" for locale "en".
+     NOTE(review): presumably this is words-icu.xml, the chain named by
+     "index w" in icu.idx; confirm against the file name.
+     Steps as listed: remove control characters, tokenize with rule "l"
+     (line-break boundaries per the YAZ ICU docs; verify), remove
+     whitespace and punctuation, display step, casemap with rule "l". -->
+<icu_chain id="en:word" locale="en">
+ <transform rule="[:Control:] Any-Remove"/>
+ <tokenize rule="l"/>
+ <transform rule="[[:WhiteSpace:][:Punctuation:]] Remove"/>
+ <display/>
+ <casemap rule="l"/>
+</icu_chain>