| Eliza Margaretha | 67a8857 | 2014-11-04 14:38:56 +0000 | [diff] [blame] | 1 | package de.ids_mannheim.korap.highlight; |
| 2 | |
| 3 | import static org.junit.Assert.assertEquals; |
| 4 | import static org.junit.Assert.fail; |
| 5 | |
| Akron | 798e6a2 | 2018-06-18 15:29:35 +0200 | [diff] [blame] | 6 | import java.io.*; |
| Akron | 67d2ff0 | 2018-06-19 10:51:16 +0200 | [diff] [blame] | 7 | import static de.ids_mannheim.korap.TestSimple.*; |
| Eliza Margaretha | 67a8857 | 2014-11-04 14:38:56 +0000 | [diff] [blame] | 8 | |
| Eliza Margaretha | b698f82 | 2014-11-12 10:14:21 +0000 | [diff] [blame] | 9 | import org.apache.lucene.search.spans.SpanQuery; |
| Eliza Margaretha | 67a8857 | 2014-11-04 14:38:56 +0000 | [diff] [blame] | 10 | import org.junit.Test; |
| 11 | |
| Nils Diewald | a14ecd6 | 2015-02-26 21:00:20 +0000 | [diff] [blame] | 12 | import de.ids_mannheim.korap.KrillIndex; |
| Nils Diewald | 392bcf3 | 2015-02-26 20:01:17 +0000 | [diff] [blame] | 13 | import de.ids_mannheim.korap.response.Match; |
| Nils Diewald | 0339d46 | 2015-02-26 14:53:56 +0000 | [diff] [blame] | 14 | import de.ids_mannheim.korap.KrillQuery; |
| Nils Diewald | 884dbcf | 2015-02-27 17:02:28 +0000 | [diff] [blame] | 15 | import de.ids_mannheim.korap.response.Result; |
| Nils Diewald | bbd39a5 | 2015-02-23 19:56:57 +0000 | [diff] [blame] | 16 | import de.ids_mannheim.korap.Krill; |
| Eliza Margaretha | 67a8857 | 2014-11-04 14:38:56 +0000 | [diff] [blame] | 17 | import de.ids_mannheim.korap.query.SpanNextQuery; |
| 18 | import de.ids_mannheim.korap.query.wrap.SpanQueryWrapper; |
| 19 | import de.ids_mannheim.korap.util.QueryException; |
| 20 | |
| 21 | |
| 22 | public class TestClass { |
| Nils Diewald | bb33da2 | 2015-03-04 16:24:25 +0000 | [diff] [blame] | 23 | KrillIndex ki; |
| 24 | Result kr; |
| 25 | Krill ks; |
| Eliza Margaretha | 67a8857 | 2014-11-04 14:38:56 +0000 | [diff] [blame] | 26 | |
| Nils Diewald | 11e9186 | 2014-11-12 16:29:18 +0000 | [diff] [blame] | 27 | |
| Nils Diewald | 7d32064 | 2014-11-12 17:39:42 +0000 | [diff] [blame] | 28 | @Test |
| Nils Diewald | bb33da2 | 2015-03-04 16:24:25 +0000 | [diff] [blame] | 29 | public void queryJSONpoly1 () throws QueryException, IOException { |
| Nils Diewald | 7d32064 | 2014-11-12 17:39:42 +0000 | [diff] [blame] | 30 | |
| Akron | 67d2ff0 | 2018-06-19 10:51:16 +0200 | [diff] [blame] | 31 | String jsonPath = getClass().getResource("/queries/poly1.json").getFile(); |
| 32 | String jsonQuery = getJsonString(jsonPath); |
| Akron | 850b46e | 2016-06-08 10:08:55 +0200 | [diff] [blame] | 33 | SpanQueryWrapper sqwi = new KrillQuery("tokens").fromKoral(jsonQuery); |
| Nils Diewald | bb33da2 | 2015-03-04 16:24:25 +0000 | [diff] [blame] | 34 | |
| 35 | SpanNextQuery sq = (SpanNextQuery) sqwi.toQuery(); |
| 36 | //System.out.println(sq.toString()); |
| 37 | |
| 38 | ki = new KrillIndex(); |
| 39 | ki.addDoc(getClass().getResourceAsStream("/wiki/JJJ-00785.json.gz"), |
| 40 | true); |
| 41 | ki.addDoc(getClass().getResourceAsStream("/wiki/DDD-01402.json.gz"), |
| 42 | true); |
| 43 | ki.commit(); |
| 44 | kr = ki.search(sq, (short) 10); |
| 45 | |
| 46 | assertEquals(61, kr.getMatch(0).getStartPos()); |
| 47 | assertEquals(64, kr.getMatch(0).getEndPos()); |
| 48 | assertEquals( |
| Akron | f05fde6 | 2016-08-03 23:46:17 +0200 | [diff] [blame] | 49 | "... Bruckner (Wien) und Mathis Lussy (Paris). [[{1:Inspiriert} " |
| 50 | + "{2:durch die}]] additiven Modelle arabischer Rhythmik (er half ...", |
| Nils Diewald | bb33da2 | 2015-03-04 16:24:25 +0000 | [diff] [blame] | 51 | kr.getMatch(0).getSnippetBrackets()); |
| 52 | |
| 53 | assertEquals(31, kr.getMatch(1).getStartPos()); |
| 54 | assertEquals(34, kr.getMatch(1).getEndPos()); |
| 55 | assertEquals( |
| Akron | f05fde6 | 2016-08-03 23:46:17 +0200 | [diff] [blame] | 56 | "... des Sendens wird ein unhörbarer Unterton [[{1:mitgesendet}, " |
| 57 | + "{2:auf den}]] das angesprochene Funkgerät reagiert. Die Abkürzung ...", |
| Nils Diewald | bb33da2 | 2015-03-04 16:24:25 +0000 | [diff] [blame] | 58 | kr.getMatch(1).getSnippetBrackets()); |
| 59 | } |
| 60 | |
| 61 | |
| 62 | @Test |
| 63 | public void queryJSONpoly4 () throws QueryException, IOException { |
| 64 | |
| Akron | 67d2ff0 | 2018-06-19 10:51:16 +0200 | [diff] [blame] | 65 | String jsonPath = getClass().getResource("/queries/poly4.json").getFile(); |
| 66 | String jsonQuery = getJsonString(jsonPath); |
| Akron | 850b46e | 2016-06-08 10:08:55 +0200 | [diff] [blame] | 67 | SpanQueryWrapper sqwi = new KrillQuery("tokens").fromKoral(jsonQuery); |
| Nils Diewald | bb33da2 | 2015-03-04 16:24:25 +0000 | [diff] [blame] | 68 | SpanQuery sq = sqwi.toQuery(); |
| 69 | |
| 70 | // System.out.println(sq.toString()); |
| 71 | |
| 72 | |
| 73 | ki = new KrillIndex(); |
| 74 | ki.addDoc(getClass().getResourceAsStream("/wiki/SSS-09803.json.gz"), |
| 75 | true); |
| 76 | |
| 77 | ki.commit(); |
| 78 | kr = ki.search(sq, (short) 10); |
| 79 | |
| 80 | /* |
| 81 | for (Match km : kr.getMatches()){ |
| 82 | System.out.println(km.getStartPos() +","+km.getEndPos()+" " |
| 83 | +km.getSnippetBrackets() |
| 84 | ); |
| 85 | } |
| 86 | */ |
| margaretha | 4cfc89e | 2016-04-25 18:01:14 +0200 | [diff] [blame] | 87 | assertEquals((long) 5315, kr.getTotalResults()); |
| Nils Diewald | bb33da2 | 2015-03-04 16:24:25 +0000 | [diff] [blame] | 88 | assertEquals(3, kr.getMatch(0).getStartPos()); |
| 89 | assertEquals(5, kr.getMatch(0).getEndPos()); |
| 90 | |
| 91 | //fail("Tests have to be updated"); |
| 92 | } |
| Eliza Margaretha | 67a8857 | 2014-11-04 14:38:56 +0000 | [diff] [blame] | 93 | } |