Skip to content

Commit 23895a8

Browse files
committed
fix(lucene): add info about diacritics analyzer
close #83
1 parent 0a4689c commit 23895a8

20 files changed

+150
-124
lines changed
Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1 1
<lucene>
2-
<text qname="p"/>
3-
<text qname="placeName"/>
4-
</lucene>
2+
<text qname="p"/>
3+
<text qname="placeName"/>
4+
</lucene>
Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
1 1
<text qname="p">
2-
<inline qname="em"/>
3-
</text>
2+
<inline qname="em"/>
3+
</text>
Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,3 @@
1 1
<p>This is a paragraph
2-
<note>containing an inline note</note>.</p>
2+
<note>containing an inline note</note>.
3+
</p>
Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1 1
<lucene>
2-
<text qname="p"/>
3-
<text qname="note"/>
4-
<ignore qname="note"/>
5-
</lucene>
2+
<text qname="p"/>
3+
<text qname="note"/>
4+
<ignore qname="note"/>
5+
</lucene>
Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,12 @@
1+
<collection xmlns="http://exist-db.org/collection-config/1.0">
2+
<index xmlns:xs="http://www.w3.org/2001/XMLSchema">
3+
<lucene>
4+
<analyzer class="org.exist.indexing.lucene.analyzers.NoDiacriticsStandardAnalyzer" id="nodiacritics"/>
5+
<text qname="letter" analyzer="nodiacritics">
6+
<field name="place" expression="place" analyzer="nodiacritics"/>
7+
<field name="from" expression="from" store="no"/>
8+
<field name="to" expression="to"/>
9+
</text>
10+
</lucene>
11+
</index>
12+
</collection>
Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,12 @@
1+
<collection xmlns="http://exist-db.org/collection-config/1.0">
2+
<index>
3+
<!-- Lucene indexes -->
4+
<lucene diacritics='no'>
5+
<analyzer class='org.apache.lucene.analysis.standard.StandardAnalyzer'/>
6+
<text match="//title[@xml:lang='Sa-Ltn']"/>
7+
<text match="/TEI/text">
8+
<ignore qname="text"/>
9+
</text>
10+
</lucene>
11+
</index>
12+
</collection>
Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,12 @@
1 1
<lucene>
2-
<analyzer class="org.apache.lucene.analysis.standard.StandardAnalyzer"/>
3-
<text qname="section">
4-
<ignore qname="title"/>
5-
<ignore qname="programlisting"/>
6-
<ignore qname="screen"/>
7-
<ignore qname="synopsis"/>
8-
</text>
9-
<text qname="para"/>
10-
<text qname="title" boost="2.0"/>
2+
<analyzer class="org.apache.lucene.analysis.standard.StandardAnalyzer"/>
3+
<text qname="section">
11 4
<ignore qname="title"/>
12-
</lucene>
5+
<ignore qname="programlisting"/>
6+
<ignore qname="screen"/>
7+
<ignore qname="synopsis"/>
8+
</text>
9+
<text qname="para"/>
10+
<text qname="title" boost="2.0"/>
11+
<ignore qname="title"/>
12+
</lucene>
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
1 1
<text qname="@val">
2-
<match-sibling-attr boost="25" qname="att" value="writtenForm"/>
2+
<match-sibling-attr boost="25" qname="att" value="writtenForm"/>
3 3
</text>
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
1 1
<text qname="feat">
2-
<has-attr boost="0" qname="xml:lang"/>
2+
<has-attr boost="0" qname="xml:lang"/>
3 3
</text>
Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
1 1
<lucene>
2-
<analyzer class="org.apache.lucene.analysis.standard.StandardAnalyzer"/>
3-
<analyzer id="ws" class="org.apache.lucene.analysis.core.WhitespaceAnalyzer"/>
4-
<text match="//SPEECH//*"/>
5-
<text qname="TITLE" analyzer="ws"/>
6-
</lucene>
2+
<analyzer class="org.apache.lucene.analysis.standard.StandardAnalyzer"/>
3+
<analyzer id="ws" class="org.apache.lucene.analysis.core.WhitespaceAnalyzer"/>
4+
<text match="//SPEECH//*"/>
5+
<text qname="TITLE" analyzer="ws"/>
6+
</lucene>

0 commit comments

Comments
 (0)