| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 1 | package de.ids_mannheim.korap.utils; |
| 2 | |
| margaretha | 2558a7c | 2019-02-18 16:48:54 +0100 | [diff] [blame] | 3 | import java.util.HashMap; |
| margaretha | b786411 | 2017-06-29 16:36:13 +0200 | [diff] [blame] | 4 | import java.util.List; |
| margaretha | 2558a7c | 2019-02-18 16:48:54 +0100 | [diff] [blame] | 5 | import java.util.Map; |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 6 | |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 7 | import com.fasterxml.jackson.databind.JsonNode; |
| 8 | import com.fasterxml.jackson.databind.node.ArrayNode; |
| 9 | import com.fasterxml.jackson.databind.node.ObjectNode; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 10 | |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 11 | import de.ids_mannheim.korap.exceptions.KustvaktException; |
| margaretha | b786411 | 2017-06-29 16:36:13 +0200 | [diff] [blame] | 12 | import de.ids_mannheim.korap.exceptions.StatusCodes; |
| 13 | import de.ids_mannheim.korap.query.serialize.CollectionQueryProcessor; |
| 14 | import de.ids_mannheim.korap.response.Notifications; |
| margaretha | b786411 | 2017-06-29 16:36:13 +0200 | [diff] [blame] | 15 | import edu.emory.mathcs.backport.java.util.Arrays; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 16 | |
| 17 | /** |
| 18 | * convenience builder class for collection query |
| 19 | * |
| margaretha | b786411 | 2017-06-29 16:36:13 +0200 | [diff] [blame] | 20 | * @author hanl, margaretha |
| 21 | * @date 29/06/2017 |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 22 | */ |
| 23 | public class KoralCollectionQueryBuilder { |
| 24 | |
| 25 | public enum EQ { |
| 26 | EQUAL, UNEQUAL |
| 27 | } |
| 28 | |
| 29 | private boolean verbose; |
| 30 | private JsonNode base; |
| 31 | private StringBuilder builder; |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 32 | private String mergeOperator; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 33 | |
| Michael Hanl | 33829ec | 2016-05-28 17:03:38 +0200 | [diff] [blame] | 34 | public KoralCollectionQueryBuilder () { |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 35 | this(false); |
| 36 | } |
| 37 | |
| 38 | |
| Michael Hanl | 33829ec | 2016-05-28 17:03:38 +0200 | [diff] [blame] | 39 | public KoralCollectionQueryBuilder (boolean verbose) { |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 40 | this.verbose = verbose; |
| 41 | this.builder = new StringBuilder(); |
| 42 | this.base = null; |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 43 | this.mergeOperator = null; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 44 | } |
| 45 | |
| 46 | |
| 47 | /** |
| 48 | * raw method for field - value pair adding. Supports all |
| 49 | * operators (leq, geq, contains, etc.) |
| 50 | * |
| 51 | * @param field |
| 52 | * @param op |
| 53 | * @param value |
| 54 | * @return |
| 55 | */ |
| Michael Hanl | 9a24216 | 2016-06-03 11:18:06 +0200 | [diff] [blame] | 56 | public KoralCollectionQueryBuilder with (String field, String op, |
| Michael Hanl | 33829ec | 2016-05-28 17:03:38 +0200 | [diff] [blame] | 57 | String value) { |
| Michael Hanl | 9a24216 | 2016-06-03 11:18:06 +0200 | [diff] [blame] | 58 | //String end = this.builder.substring(this.builder.length() - 4, |
| 59 | // this.builder.length() - 1); |
| 60 | //if (this.builder.length() != 0 |
| 61 | // && (!end.contains("&") | !end.contains("|"))) |
| 62 | // throw new RuntimeException("no join operator given!"); |
| 63 | this.with(field + op + value); |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 64 | return this; |
| 65 | } |
| 66 | |
| 67 | |
| 68 | /** |
| 69 | * element can be a more complex sub query like |
| 70 | * (textClass=freizeit & Attributes.CORPUS_SIGLE=WPD) |
| 71 | * |
| 72 | * @param query |
| 73 | * will be enclosed by parenthesis in order to make sub |
| 74 | * query |
| 75 | * element |
| 76 | * @return |
| 77 | */ |
| Michael Hanl | 33829ec | 2016-05-28 17:03:38 +0200 | [diff] [blame] | 78 | public KoralCollectionQueryBuilder with (String query) { |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 79 | if (!query.startsWith("(") && !query.endsWith(")")) |
| 80 | query = "(" + query + ")"; |
| 81 | this.builder.append(query); |
| 82 | return this; |
| 83 | } |
| 84 | |
| 85 | |
| 86 | |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 87 | public KoralCollectionQueryBuilder and () { |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 88 | if (this.builder.length() != 0) this.builder.append(" & "); |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 89 | if (this.base != null && this.mergeOperator == null) |
| 90 | this.mergeOperator = "AND"; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 91 | return this; |
| 92 | } |
| 93 | |
| 94 | |
| 95 | public KoralCollectionQueryBuilder or () { |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 96 | if (this.builder.length() != 0) this.builder.append(" | "); |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 97 | if (this.base != null && this.mergeOperator == null) |
| 98 | this.mergeOperator = "OR"; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 99 | return this; |
| 100 | } |
| 101 | |
| 102 | |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 103 | public JsonNode rebaseCollection () throws KustvaktException { |
| 104 | if (this.builder.length() == 0 && this.base == null) return null; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 105 | |
| 106 | JsonNode request = null; |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 107 | if (this.builder.length() != 0) { |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 108 | CollectionQueryProcessor tree = |
| 109 | new CollectionQueryProcessor(this.verbose); |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 110 | tree.process(this.builder.toString()); |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 111 | if (tree.getErrors().size() > 0) { |
| margaretha | 2558a7c | 2019-02-18 16:48:54 +0100 | [diff] [blame] | 112 | // legacy support |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 113 | for (List<Object> e : tree.getErrors()) { |
| margaretha | 2558a7c | 2019-02-18 16:48:54 +0100 | [diff] [blame] | 114 | if (e.get(1) instanceof String[]) { |
| 115 | Notifications notif = new Notifications(); |
| 116 | int code = (int) e.get(0); |
| margaretha | b786411 | 2017-06-29 16:36:13 +0200 | [diff] [blame] | 117 | notif.addError(code, (String[]) e.get(1)); |
| margaretha | 2558a7c | 2019-02-18 16:48:54 +0100 | [diff] [blame] | 118 | String notificationStr = notif.toJsonString(); |
| 119 | throw new KustvaktException(StatusCodes.SERIALIZATION_FAILED, |
| 120 | notificationStr, true); |
| 121 | } |
| 122 | else{ |
| 123 | break; |
| margaretha | b786411 | 2017-06-29 16:36:13 +0200 | [diff] [blame] | 124 | } |
| 125 | } |
| margaretha | 2558a7c | 2019-02-18 16:48:54 +0100 | [diff] [blame] | 126 | // -- end of legacy support |
| 127 | |
| 128 | Map<String, Object> map = new HashMap<>(); |
| 129 | map.put("errors", tree.getErrors()); |
| 130 | String errors = JsonUtils.toJSON(map); |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 131 | throw new KustvaktException(StatusCodes.SERIALIZATION_FAILED, |
| margaretha | 2558a7c | 2019-02-18 16:48:54 +0100 | [diff] [blame] | 132 | errors, true); |
| margaretha | b786411 | 2017-06-29 16:36:13 +0200 | [diff] [blame] | 133 | } |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 134 | request = JsonUtils.valueToTree(tree.getRequestMap()); |
| 135 | } |
| 136 | |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 137 | if (this.base != null) { |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 138 | // check that collection non empty |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 139 | JsonNode tmp = this.base.deepCopy(); |
| Michael Hanl | 9a24216 | 2016-06-03 11:18:06 +0200 | [diff] [blame] | 140 | if (request != null) |
| 141 | request = mergeWith(request); |
| Michael Hanl | 33829ec | 2016-05-28 17:03:38 +0200 | [diff] [blame] | 142 | else |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 143 | request = tmp; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 144 | } |
| 145 | return request; |
| 146 | } |
| 147 | |
| Michael Hanl | 33829ec | 2016-05-28 17:03:38 +0200 | [diff] [blame] | 148 | |
| 149 | public JsonNode mergeWith (JsonNode node) { |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 150 | if (this.base != null) { |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 151 | if (node != null) { |
| 152 | JsonNode tobase = node.at("/collection"); |
| 153 | JsonNode base = this.base.deepCopy(); |
| Michael Hanl | cb2d3f9 | 2016-06-02 17:34:06 +0200 | [diff] [blame] | 154 | JsonNode result = base.at("/collection"); |
| 155 | |
| 156 | if (result.isMissingNode() && !tobase.isMissingNode()) |
| 157 | result = tobase; |
| 158 | else if (result.isMissingNode() && tobase.isMissingNode()) |
| 159 | return base; |
| 160 | else { |
| 161 | result = JsonBuilder.buildDocGroup( |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 162 | this.mergeOperator != null |
| 163 | ? this.mergeOperator.toLowerCase() : "and", |
| 164 | result, tobase); |
| Michael Hanl | cb2d3f9 | 2016-06-02 17:34:06 +0200 | [diff] [blame] | 165 | } |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 166 | ((ObjectNode) base).put("collection", result); |
| 167 | return base; |
| 168 | } |
| Michael Hanl | cb2d3f9 | 2016-06-02 17:34:06 +0200 | [diff] [blame] | 169 | return this.base; |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 170 | } |
| Michael Hanl | cb2d3f9 | 2016-06-02 17:34:06 +0200 | [diff] [blame] | 171 | throw new RuntimeException("no query found to merge with!"); |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 172 | } |
| 173 | |
| 174 | |
| 175 | /** |
| 176 | * sets base query. All consequent queries are added to the first |
| 177 | * koral:docGroup within the collection base query |
| 178 | * If no group in base query, consequent queries are skipped. |
| 179 | * |
| 180 | * @param query |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 181 | * @throws KustvaktException |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 182 | */ |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 183 | public KoralCollectionQueryBuilder setBaseQuery (String query) throws KustvaktException { |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 184 | this.base = JsonUtils.readTree(query); |
| 185 | return this; |
| 186 | } |
| Michael Hanl | 33829ec | 2016-05-28 17:03:38 +0200 | [diff] [blame] | 187 | |
| 188 | |
| Michael Hanl | cedf721 | 2016-05-28 10:43:09 +0200 | [diff] [blame] | 189 | public KoralCollectionQueryBuilder setBaseQuery (JsonNode query) { |
| 190 | this.base = query; |
| 191 | return this; |
| 192 | } |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 193 | |
| 194 | |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 195 | public String toJSON () throws KustvaktException { |
| Michael Hanl | 9a24216 | 2016-06-03 11:18:06 +0200 | [diff] [blame] | 196 | return JsonUtils.toJSON(rebaseCollection()); |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 197 | } |
| 198 | |
| 199 | |
| 200 | @Override |
| 201 | public String toString () { |
| 202 | return this.builder.toString(); |
| 203 | } |
| 204 | |
| 205 | |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 206 | private static class JsonBuilder { |
| 207 | |
| 208 | public static ObjectNode buildDoc (String key, String value) { |
| 209 | ObjectNode node = JsonUtils.createObjectNode(); |
| 210 | node.put("@type", "koral:doc"); |
| 211 | // eq.equals(EQ.EQUAL) ? "match:eq" : "match:ne" |
| 212 | node.put("match", "match:eq"); |
| 213 | node.put("key", key); |
| 214 | node.put("value", value); |
| 215 | return node; |
| 216 | } |
| 217 | |
| 218 | |
| margaretha | 894a7d7 | 2017-11-08 19:24:20 +0100 | [diff] [blame] | 219 | public static ObjectNode buildDocGroup (String op, |
| 220 | JsonNode ... groups) { |
| Michael Hanl | 173ba4b | 2016-05-24 20:25:05 +0200 | [diff] [blame] | 221 | ObjectNode node = JsonUtils.createObjectNode(); |
| 222 | node.put("@type", "koral:docGroup"); |
| 223 | node.put("operation", "operation:" + op); |
| 224 | ArrayNode ops = JsonUtils.createArrayNode(); |
| 225 | ops.addAll(Arrays.asList(groups)); |
| 226 | node.put("operands", ops); |
| 227 | return node; |
| 228 | } |
| 229 | |
| 230 | } |
| 231 | |
| 232 | } |