| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 1 | package de.ids_mannheim.korap.index; |
| 2 | |
| 3 | import static org.junit.Assert.*; |
| 4 | |
| 5 | import java.io.IOException; |
| 6 | import java.util.ArrayList; |
| 7 | import java.util.List; |
| 8 | |
| 9 | import org.apache.lucene.index.Term; |
| 10 | import org.apache.lucene.search.spans.SpanQuery; |
| 11 | import org.apache.lucene.search.spans.SpanTermQuery; |
| 12 | import org.junit.Test; |
| 13 | import org.junit.runner.RunWith; |
| 14 | import org.junit.runners.JUnit4; |
| 15 | |
| 16 | import de.ids_mannheim.korap.KorapIndex; |
| 17 | import de.ids_mannheim.korap.KorapResult; |
| 18 | import de.ids_mannheim.korap.query.DistanceConstraint; |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 19 | import de.ids_mannheim.korap.query.SpanDistanceQuery; |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 20 | import de.ids_mannheim.korap.query.SpanElementQuery; |
| 21 | import de.ids_mannheim.korap.query.SpanMultipleDistanceQuery; |
| 22 | import de.ids_mannheim.korap.query.SpanNextQuery; |
| 23 | |
| 24 | @RunWith(JUnit4.class) |
| 25 | public class TestMultipleDistanceIndex { |
| 26 | |
| 27 | private KorapIndex ki; |
| 28 | private KorapResult kr; |
| 29 | |
| 30 | public SpanQuery createQuery(String x, String y, List<DistanceConstraint> |
| 31 | constraints, boolean isOrdered){ |
| 32 | |
| 33 | SpanQuery sx = new SpanTermQuery(new Term("base",x)); |
| 34 | SpanQuery sy = new SpanTermQuery(new Term("base",y)); |
| 35 | |
| 36 | return new SpanMultipleDistanceQuery(sx, sy, constraints, isOrdered, true); |
| 37 | } |
| 38 | |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 39 | public DistanceConstraint createConstraint(String unit, int min, int max, |
| 40 | boolean isOrdered, boolean exclusion){ |
| 41 | |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 42 | if (unit.equals("w")){ |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 43 | return new DistanceConstraint(min, max,isOrdered,exclusion); |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 44 | } |
| 45 | return new DistanceConstraint(new SpanElementQuery("base", unit), |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 46 | min, max, isOrdered, exclusion); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 47 | } |
| 48 | |
| 49 | private FieldDocument createFieldDoc0() { |
| 50 | FieldDocument fd = new FieldDocument(); |
| 51 | fd.addString("ID", "doc-0"); |
| 52 | fd.addTV("base", |
| 53 | "text", |
| 54 | "[(0-1)s:b|_1#0-1|<>:s#0-2$<i>2|<>:p#0-4$<i>4]" + |
| 55 | "[(1-2)s:b|s:c|_2#1-2]" + |
| 56 | "[(2-3)s:c|_3#2-3|<>:s#2-3$<i>4]" + |
| 57 | "[(3-4)s:b|_4#3-4]" + |
| 58 | "[(4-5)s:c|_5#4-5|<>:s#4-6$<i>6|<>:p#4-6$<i>6]" + |
| 59 | "[(5-6)s:e|_6#5-6]"); |
| 60 | return fd; |
| 61 | } |
| 62 | |
| 63 | private FieldDocument createFieldDoc1() { |
| 64 | FieldDocument fd = new FieldDocument(); |
| 65 | fd.addString("ID", "doc-1"); |
| 66 | fd.addTV("base", |
| 67 | "text", |
| 68 | "[(0-1)s:c|_1#0-1|<>:s#0-2$<i>2|<>:p#0-4$<i>4]" + |
| 69 | "[(1-2)s:c|s:e|_2#1-2]" + |
| 70 | "[(2-3)s:e|_3#2-3|<>:s#2-3$<i>4]" + |
| 71 | "[(3-4)s:c|_4#3-4]" + |
| 72 | "[(4-5)s:e|_5#4-5|<>:s#4-6$<i>6|<>:p#4-6$<i>6]" + |
| 73 | "[(5-6)s:c|_6#5-6]"); |
| 74 | return fd; |
| 75 | } |
| 76 | |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 77 | private FieldDocument createFieldDoc2() { |
| 78 | FieldDocument fd = new FieldDocument(); |
| 79 | fd.addString("ID", "doc-2"); |
| 80 | fd.addTV("base", |
| 81 | "text", |
| 82 | "[(0-1)s:b|_1#0-1|<>:s#0-2$<i>2|<>:p#0-4$<i>4]" + |
| 83 | "[(1-2)s:b|s:e|_2#1-2]" + |
| 84 | "[(2-3)s:e|_3#2-3|<>:s#2-3$<i>4]" + |
| 85 | "[(3-4)s:b|s:c|_4#3-4]" + |
| 86 | "[(4-5)s:e|_5#4-5|<>:s#4-6$<i>6|<>:p#4-6$<i>6]" + |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 87 | "[(5-6)s:d|_6#5-6]" + |
| 88 | "[(6-7)s:b|_7#6-7|<>:s#6-7$<i>7|<>:p#6-7$<i>7]" ); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 89 | return fd; |
| 90 | } |
| 91 | |
| 92 | private FieldDocument createFieldDoc3() { |
| 93 | FieldDocument fd = new FieldDocument(); |
| 94 | fd.addString("ID", "doc-0"); |
| 95 | fd.addTV("base", |
| 96 | "text", |
| 97 | "[(0-1)s:b|_1#0-1|<>:s#0-2$<i>2|<>:p#0-4$<i>4]" + |
| 98 | "[(1-2)s:b|s:c|_2#1-2]" + |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 99 | "[(2-3)s:c|_3#2-3|<>:s#2-3$<i>5]" + |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 100 | "[(3-4)s:b|_4#3-4]" + |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 101 | "[(4-5)s:b|_5#4-5]" + |
| 102 | "[(5-6)s:b|_6#5-6]" + // gap |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 103 | "[(6-7)s:c|_7#6-7|<>:s#6-7$<i>7|<>:p#6-7$<i>7]" ); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 104 | return fd; |
| 105 | } |
| 106 | |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 107 | /** Unordered, same sentence |
| 108 | * */ |
| 109 | @Test |
| 110 | public void testCase1() throws IOException { |
| 111 | ki = new KorapIndex(); |
| 112 | ki.addDoc(createFieldDoc0()); |
| 113 | ki.commit(); |
| 114 | |
| 115 | List<DistanceConstraint> constraints = new ArrayList<DistanceConstraint>(); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 116 | constraints.add(createConstraint("w", 0, 2, false, false)); |
| 117 | constraints.add(createConstraint("s", 0, 0, false, false)); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 118 | |
| 119 | SpanQuery mdq; |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 120 | mdq = createQuery("s:b", "s:c", constraints,false); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 121 | kr = ki.search(mdq, (short) 10); |
| Nils Diewald | 0f5a279 | 2014-02-13 17:20:36 +0000 | [diff] [blame] | 122 | // System.out.println(mdq); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 123 | |
| 124 | assertEquals(3, kr.getTotalResults()); |
| 125 | assertEquals(0, kr.getMatch(0).getStartPos()); |
| 126 | assertEquals(2, kr.getMatch(0).getEndPos()); |
| 127 | assertEquals(1, kr.getMatch(1).getStartPos()); |
| 128 | assertEquals(2, kr.getMatch(1).getEndPos()); |
| 129 | assertEquals(2, kr.getMatch(2).getStartPos()); |
| 130 | assertEquals(4, kr.getMatch(2).getEndPos()); |
| 131 | } |
| 132 | |
| 133 | /** Ordered |
| 134 | * Unordered |
| 135 | * Two constraints |
| 136 | * Three constraints |
| 137 | * */ |
| 138 | @Test |
| 139 | public void testCase2() throws IOException { |
| 140 | ki = new KorapIndex(); |
| 141 | ki.addDoc(createFieldDoc0()); |
| 142 | ki.commit(); |
| 143 | |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 144 | // Ordered - two constraints |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 145 | List<DistanceConstraint> constraints = new ArrayList<DistanceConstraint>(); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 146 | constraints.add(createConstraint("w", 0, 2, true, false)); |
| 147 | constraints.add(createConstraint("s", 1, 1, true, false)); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 148 | |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 149 | SpanQuery mdq; |
| 150 | mdq = createQuery("s:b", "s:c", constraints,true); |
| 151 | kr = ki.search(mdq, (short) 10); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 152 | assertEquals(3, kr.getTotalResults()); |
| 153 | assertEquals(0, kr.getMatch(0).getStartPos()); |
| 154 | assertEquals(3, kr.getMatch(0).getEndPos()); |
| 155 | assertEquals(1, kr.getMatch(1).getStartPos()); |
| 156 | assertEquals(3, kr.getMatch(1).getEndPos()); |
| 157 | assertEquals(3, kr.getMatch(2).getStartPos()); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 158 | assertEquals(5, kr.getMatch(2).getEndPos()); |
| 159 | |
| 160 | // Three constraints |
| 161 | constraints.add(createConstraint("p", 0, 0, true, false)); |
| 162 | mdq = createQuery("s:b", "s:c", constraints,true); |
| 163 | kr = ki.search(mdq, (short) 10); |
| 164 | assertEquals(2, kr.getTotalResults()); |
| 165 | |
| 166 | |
| 167 | // Unordered - two constraints |
| 168 | constraints.clear(); |
| 169 | constraints.add(createConstraint("w", 0, 2, false, false)); |
| 170 | constraints.add(createConstraint("s", 1, 1, false, false)); |
| 171 | |
| 172 | mdq = createQuery("s:c", "s:b", constraints,false); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 173 | kr = ki.search(mdq, (short) 10); |
| 174 | assertEquals(4, kr.getTotalResults()); |
| 175 | assertEquals(1, kr.getMatch(2).getStartPos()); |
| 176 | assertEquals(4, kr.getMatch(2).getEndPos()); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 177 | |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 178 | // Three constraints |
| 179 | constraints.add(createConstraint("p", 0, 0, false, false)); |
| 180 | mdq = createQuery("s:b", "s:c", constraints,false); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 181 | kr = ki.search(mdq, (short) 10); |
| Eliza Margaretha | 7788a98 | 2014-08-29 16:10:52 +0000 | [diff] [blame] | 182 | assertEquals(3, kr.getTotalResults()); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 183 | |
| 184 | } |
| 185 | |
| 186 | /** Multiple documents |
| 187 | * Ensure same doc (inner term span) |
| 188 | * */ |
| 189 | @Test |
| 190 | public void testCase3() throws IOException { |
| 191 | ki = new KorapIndex(); |
| 192 | ki.addDoc(createFieldDoc0()); |
| 193 | ki.addDoc(createFieldDoc1()); |
| 194 | ki.addDoc(createFieldDoc2()); |
| 195 | ki.commit(); |
| 196 | |
| 197 | List<DistanceConstraint> constraints = new ArrayList<DistanceConstraint>(); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 198 | constraints.add(createConstraint("w", 1, 2, false, false)); |
| 199 | constraints.add(createConstraint("s", 1, 2, false, false)); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 200 | |
| 201 | SpanQuery mdq; |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 202 | mdq = createQuery("s:b", "s:e", constraints,false); |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 203 | kr = ki.search(mdq, (short) 10); |
| 204 | |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 205 | assertEquals(5, kr.getTotalResults()); |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 206 | assertEquals(3, kr.getMatch(0).getStartPos()); |
| 207 | assertEquals(6, kr.getMatch(0).getEndPos()); |
| 208 | assertEquals(2, kr.getMatch(1).getLocalDocID()); |
| 209 | assertEquals(1, kr.getMatch(2).getStartPos()); |
| 210 | assertEquals(4, kr.getMatch(2).getEndPos()); |
| 211 | assertEquals(3, kr.getMatch(3).getStartPos()); |
| 212 | assertEquals(5, kr.getMatch(3).getEndPos()); |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 213 | assertEquals(4, kr.getMatch(4).getStartPos()); |
| 214 | assertEquals(7, kr.getMatch(4).getEndPos()); |
| 215 | |
| 216 | // System.out.print(kr.getTotalResults()+"\n"); |
| 217 | // for (int i=0; i< kr.getTotalResults(); i++){ |
| 218 | // System.out.println( |
| 219 | // kr.match(i).getLocalDocID()+" "+ |
| 220 | // kr.match(i).startPos + " " + |
| 221 | // kr.match(i).endPos |
| 222 | // ); |
| 223 | // } |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 224 | |
| 225 | } |
| 226 | |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 227 | /** Skip to |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 228 | * */ |
| 229 | @Test |
| 230 | public void testCase4() throws IOException { |
| 231 | ki = new KorapIndex(); |
| 232 | ki.addDoc(createFieldDoc0()); |
| 233 | ki.addDoc(createFieldDoc3()); |
| 234 | ki.addDoc(createFieldDoc1()); |
| 235 | ki.addDoc(createFieldDoc2()); |
| 236 | ki.commit(); |
| 237 | |
| 238 | List<DistanceConstraint> constraints = new ArrayList<DistanceConstraint>(); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 239 | constraints.add(createConstraint("w", 1, 2, false, false)); |
| 240 | constraints.add(createConstraint("s", 1, 2, false, false)); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 241 | |
| 242 | SpanQuery mdq; |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 243 | mdq = createQuery("s:b", "s:c", constraints,false); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 244 | |
| 245 | SpanQuery sq = new SpanNextQuery(mdq, |
| 246 | new SpanTermQuery(new Term("base","s:e"))); |
| 247 | kr = ki.search(sq, (short) 10); |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 248 | |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 249 | assertEquals(2, kr.getTotalResults()); |
| 250 | assertEquals(3, kr.getMatch(0).getStartPos()); |
| 251 | assertEquals(6, kr.getMatch(0).getEndPos()); |
| 252 | assertEquals(3, kr.getMatch(1).getLocalDocID()); |
| 253 | assertEquals(1, kr.getMatch(1).getStartPos()); |
| 254 | assertEquals(5, kr.getMatch(1).getEndPos()); |
| 255 | |
| 256 | } |
| 257 | |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 258 | /** Same tokens: ordered and unordered yield the same results |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 259 | * */ |
| 260 | @Test |
| 261 | public void testCase5() throws IOException { |
| 262 | ki = new KorapIndex(); |
| 263 | ki.addDoc(createFieldDoc0()); |
| 264 | ki.addDoc(createFieldDoc1()); |
| 265 | ki.commit(); |
| 266 | |
| 267 | List<DistanceConstraint> constraints = new ArrayList<DistanceConstraint>(); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 268 | constraints.add(createConstraint("w", 1, 2, false, false)); |
| 269 | constraints.add(createConstraint("s", 1, 2, false, false)); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 270 | |
| 271 | SpanQuery mdq; |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 272 | mdq = createQuery("s:c", "s:c", constraints,false); |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 273 | kr = ki.search(mdq, (short) 10); |
| 274 | |
| 275 | assertEquals(4, kr.getTotalResults()); |
| 276 | assertEquals(1, kr.getMatch(0).getStartPos()); |
| 277 | assertEquals(3, kr.getMatch(0).getEndPos()); |
| 278 | assertEquals(2, kr.getMatch(1).getStartPos()); |
| 279 | assertEquals(5, kr.getMatch(1).getEndPos()); |
| 280 | assertEquals(1, kr.getMatch(2).getLocalDocID()); |
| 281 | assertEquals(1, kr.getMatch(2).getStartPos()); |
| 282 | assertEquals(4, kr.getMatch(2).getEndPos()); |
| 283 | assertEquals(3, kr.getMatch(3).getStartPos()); |
| 284 | assertEquals(6, kr.getMatch(3).getEndPos()); |
| 285 | |
| 286 | } |
| 287 | |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 288 | /** Exclusion |
| 289 | * Gaps |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 290 | * */ |
| 291 | @Test |
| 292 | public void testCase6() throws IOException { |
| 293 | ki = new KorapIndex(); |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 294 | ki.addDoc(createFieldDoc3()); |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 295 | ki.commit(); |
| 296 | |
| 297 | // First constraint - token exclusion |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 298 | SpanQuery sx = new SpanTermQuery(new Term("base","s:b")); |
| 299 | SpanQuery sy = new SpanTermQuery(new Term("base","s:c")); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 300 | |
| 301 | DistanceConstraint dc1 = createConstraint("w", 0, 1, false, true); |
| 302 | SpanDistanceQuery sq = new SpanDistanceQuery(sx, sy, dc1, true); |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 303 | |
| 304 | kr = ki.search(sq, (short) 10); |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 305 | assertEquals(1, kr.getTotalResults()); |
| 306 | // 4-5 |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 307 | |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 308 | // Second constraint - element distance |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 309 | DistanceConstraint dc2 = createConstraint("s", 1, 1, false, false); |
| 310 | sq = new SpanDistanceQuery(sx, sy, dc2, true); |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 311 | kr = ki.search(sq, (short) 10); |
| 312 | // 0-3, 1-3, 1-4, 1-5, 3-7, 4-7 |
| 313 | assertEquals(6, kr.getTotalResults()); |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 314 | |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 315 | |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 316 | List<DistanceConstraint> constraints = new ArrayList<DistanceConstraint>(); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 317 | constraints.add(dc1); |
| 318 | constraints.add(dc2); |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 319 | |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 320 | SpanQuery mdq; |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 321 | mdq = createQuery("s:b", "s:c", constraints,false); |
| Eliza Margaretha | cdb769b | 2014-02-11 17:24:13 +0000 | [diff] [blame] | 322 | kr = ki.search(mdq, (short) 10); |
| 323 | |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 324 | assertEquals(2, kr.getTotalResults()); |
| 325 | assertEquals(1, kr.getMatch(0).getStartPos()); |
| 326 | assertEquals(5, kr.getMatch(0).getEndPos()); |
| 327 | assertEquals(4, kr.getMatch(1).getStartPos()); |
| 328 | assertEquals(7, kr.getMatch(1).getEndPos()); |
| 329 | } |
| Eliza Margaretha | 5f60692 | 2014-02-18 15:33:49 +0000 | [diff] [blame] | 330 | |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 331 | |
| 332 | /** Exclusion, multiple documents |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 333 | * */ |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 334 | @Test |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 335 | public void testCase7() throws IOException { |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 336 | ki = new KorapIndex(); |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 337 | ki.addDoc(createFieldDoc2()); |
| 338 | ki.commit(); |
| 339 | |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 340 | SpanQuery sx = new SpanTermQuery(new Term("base","s:b")); |
| 341 | SpanQuery sy = new SpanTermQuery(new Term("base","s:c")); |
| 342 | // Second constraint |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 343 | SpanDistanceQuery sq = new SpanDistanceQuery(sx,sy, |
| 344 | createConstraint("s", 0, 0, false, true), |
| 345 | true); |
| 346 | kr = ki.search(sq, (short) 10); |
| 347 | assertEquals(3, kr.getTotalResults()); |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 348 | // 0-1, 1-2, 6-7 |
| 349 | |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 350 | // Exclusion within the same sentence |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 351 | List<DistanceConstraint> constraints = new ArrayList<DistanceConstraint>(); |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 352 | constraints.add(createConstraint("w", 0, 2,false,true)); |
| 353 | constraints.add(createConstraint("s", 0, 0,false,true)); |
| 354 | |
| Eliza Margaretha | 0192918 | 2014-02-19 11:48:59 +0000 | [diff] [blame] | 355 | SpanQuery mdq; |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 356 | mdq = createQuery("s:b", "s:c", constraints,false); |
| 357 | kr = ki.search(mdq, (short) 10); |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 358 | assertEquals(2, kr.getTotalResults()); |
| 359 | assertEquals(0, kr.getMatch(0).getStartPos()); |
| 360 | assertEquals(1, kr.getMatch(0).getEndPos()); |
| 361 | assertEquals(6, kr.getMatch(1).getStartPos()); |
| 362 | assertEquals(7, kr.getMatch(1).getEndPos()); |
| 363 | |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 364 | |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 365 | // Third constraint |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 366 | sq = new SpanDistanceQuery(sx, sy, |
| 367 | createConstraint("p", 0, 0, false, true), |
| 368 | true); |
| 369 | kr = ki.search(sq, (short) 10); |
| 370 | assertEquals(1, kr.getTotalResults()); |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 371 | // 6-7 |
| 372 | |
| Eliza Margaretha | d469346 | 2014-03-17 13:16:18 +0000 | [diff] [blame] | 373 | constraints.add(createConstraint("p", 0, 0, false, true)); |
| 374 | mdq = createQuery("s:b", "s:c", constraints,false); |
| Eliza Margaretha | e335beb | 2014-02-27 12:56:14 +0000 | [diff] [blame] | 375 | kr = ki.search(mdq, (short) 10); |
| 376 | |
| 377 | assertEquals(1, kr.getTotalResults()); |
| 378 | assertEquals(6, kr.getMatch(0).getStartPos()); |
| 379 | assertEquals(7, kr.getMatch(0).getEndPos()); |
| 380 | |
| 381 | } |
| Eliza Margaretha | e18d62e | 2014-02-11 11:30:48 +0000 | [diff] [blame] | 382 | } |
| 383 | |