blob: a823f9d911038033d4b11e646ed99d08f4c22af6 [file] [log] [blame]
Joachim Bingeldc03c002014-04-17 13:40:40 +00001package de.ids_mannheim.korap.query.serialize;
2
3import java.lang.reflect.Method;
4import java.util.ArrayList;
Joachim Bingel7ee07862014-04-28 15:22:41 +00005import java.util.Arrays;
Joachim Bingel019ba5c2014-04-28 14:59:04 +00006import java.util.HashMap;
Joachim Bingeldc03c002014-04-17 13:40:40 +00007import java.util.LinkedHashMap;
8import java.util.LinkedList;
9import java.util.List;
10import java.util.Map;
Joachim Bingelfb9d5fd2014-06-25 09:32:43 +000011import java.util.NoSuchElementException;
Joachim Bingeldc03c002014-04-17 13:40:40 +000012
13import org.antlr.v4.runtime.ANTLRInputStream;
14import org.antlr.v4.runtime.BailErrorStrategy;
15import org.antlr.v4.runtime.CharStream;
16import org.antlr.v4.runtime.CommonTokenStream;
17import org.antlr.v4.runtime.Lexer;
Joachim Bingeldc03c002014-04-17 13:40:40 +000018import org.antlr.v4.runtime.ParserRuleContext;
Joachim Bingeldc03c002014-04-17 13:40:40 +000019import org.antlr.v4.runtime.tree.ParseTree;
Joachim Bingel75038792014-05-19 15:12:23 +000020import org.slf4j.LoggerFactory;
Joachim Bingelc63f7812014-07-30 09:12:25 +000021import org.slf4j.Logger;
Joachim Bingeldc03c002014-04-17 13:40:40 +000022
Joachim Bingel6003b852014-12-18 14:20:55 +000023import de.ids_mannheim.korap.query.parse.annis.AqlLexer;
24import de.ids_mannheim.korap.query.parse.annis.AqlParser;
Joachim Bingel3fa584b2014-12-17 13:35:43 +000025import de.ids_mannheim.korap.query.serialize.util.Antlr4DescriptiveErrorListener;
Joachim Bingel0e54d222015-01-12 13:22:16 +000026import de.ids_mannheim.korap.query.serialize.util.CqlfObjectGenerator;
Joachim Bingeldc03c002014-04-17 13:40:40 +000027
28/**
Joachim Bingelc8a28e42014-04-24 15:06:42 +000029 * Map representation of ANNIS QL syntax tree as returned by ANTLR
Joachim Bingeldc03c002014-04-17 13:40:40 +000030 * @author joachim
31 *
32 */
Joachim Bingel1faf8a52015-01-09 13:17:34 +000033public class AnnisQueryProcessor extends Antlr4AbstractQueryProcessor {
34 private static Logger log = LoggerFactory.getLogger(AnnisQueryProcessor.class);
Joachim Bingeldc03c002014-04-17 13:40:40 +000035 /**
Joachim Bingeldc03c002014-04-17 13:40:40 +000036 * Flag that indicates whether token fields or meta fields are currently being processed
37 */
38 boolean inMeta = false;
39 /**
Joachim Bingel949e3a82014-06-16 13:20:43 +000040 * Keeps track of operands that are to be integrated into yet uncreated objects.
41 */
42 LinkedList<LinkedHashMap<String,Object>> operandStack = new LinkedList<LinkedHashMap<String,Object>>();
43 /**
Joachim Bingelc8a28e42014-04-24 15:06:42 +000044 * Keeps track of explicitly (by #-var definition) or implicitly (number as reference) introduced entities (for later reference by #-operator)
45 */
Joachim Bingelab1aff42014-12-16 16:38:00 +000046 Map<String, LinkedHashMap<String,Object>> nodeVariables = new LinkedHashMap<String, LinkedHashMap<String,Object>>();
Joachim Bingelc8a28e42014-04-24 15:06:42 +000047 /**
48 * Counter for variable definitions.
49 */
50 Integer variableCounter = 1;
51 /**
Joachim Bingeldc03c002014-04-17 13:40:40 +000052 * Marks the currently active token in order to know where to add flags (might already have been taken away from token stack).
53 */
54 LinkedHashMap<String,Object> curToken = new LinkedHashMap<String,Object>();
Joachim Bingel75038792014-05-19 15:12:23 +000055 /**
56 * Keeps track of operands lists that are to be serialised in an inverted
57 * order (e.g. the IN() operator) compared to their AST representation.
58 */
59 private LinkedList<ArrayList<Object>> invertedOperandsLists = new LinkedList<ArrayList<Object>>();
Joachim Bingel77ac5cb2014-04-22 14:03:28 +000060 /**
Joachim Bingelfc428812014-06-18 14:50:14 +000061 * Keeps track of operation:class numbers.
62 */
63 int classCounter = 0;
64 /**
Joachim Bingel9c3ddb92014-06-23 13:49:58 +000065 * Keeps track of numers of relations processed (important when dealing with multiple predications).
66 */
67 int relationCounter = 0;
68 /**
Joachim Bingel019ba5c2014-04-28 14:59:04 +000069 * Keeps track of references to nodes that are operands of groups (e.g. tree relations). Those nodes appear on the top level of the parse tree
70 * but are to be integrated into the AqlTree at a later point (namely as operands of the respective group). Therefore, store references to these
71 * nodes here and exclude the operands from being written into the query map individually.
72 */
Joachim Bingel1846c8c2014-07-08 14:13:31 +000073 private List<ParseTree> globalLingTermNodes = new ArrayList<ParseTree>();
Joachim Bingel9c3ddb92014-06-23 13:49:58 +000074 private int totalRelationCount;
Joachim Bingel1846c8c2014-07-08 14:13:31 +000075 /**
76 * Keeps a record of reference-class-mapping, i.e. which 'class' has been assigned to which #n reference. This is important when introducing korap:reference
77 * spans to refer back to previously established classes for entities.
78 */
Joachim Bingelb001d192014-06-25 11:34:36 +000079 private LinkedHashMap<String, Integer> refClassMapping = new LinkedHashMap<String, Integer>();
Joachim Bingel9c3ddb92014-06-23 13:49:58 +000080 private LinkedHashMap<String, Integer> nodeReferencesTotal = new LinkedHashMap<String, Integer>();
81 private LinkedHashMap<String, Integer> nodeReferencesProcessed = new LinkedHashMap<String, Integer>();
Joachim Bingel1846c8c2014-07-08 14:13:31 +000082
/**
 * Creates a processor for an ANNIS QL query and processes the query right away.
 * The processor registers itself with {@link CqlfObjectGenerator} before processing.
 *
 * @param query The ANNIS QL query string to be parsed and serialised
 */
public AnnisQueryProcessor(String query) {
    CqlfObjectGenerator.setQueryProcessor(this);
    process(query);
    // Diagnostic output goes through the logger instead of stdout so that
    // library users can control it via their logging configuration.
    log.debug(">>> {} <<<", requestMap.get("query"));
}
93
Joachim Bingeldc03c002014-04-17 13:40:40 +000094 @Override
Joachim Bingel3d5b69b2015-01-14 10:46:44 +000095 public void process(String query) {
Joachim Bingeldc03c002014-04-17 13:40:40 +000096 ParseTree tree = parseAnnisQuery(query);
Joachim Bingelc8a28e42014-04-24 15:06:42 +000097 if (this.parser != null) {
98 super.parser = this.parser;
99 } else {
100 throw new NullPointerException("Parser has not been instantiated!");
101 }
Joachim Bingel84395b22014-12-18 10:46:18 +0000102 log.info("Processing Annis query: "+query);
Joachim Bingele3fe3672014-12-17 18:35:58 +0000103 if (tree != null) {
104 log.debug("ANTLR parse tree: "+tree.toStringTree(parser));
105 processNode(tree);
Joachim Bingelab1aff42014-12-16 16:38:00 +0000106 }
Joachim Bingeldc03c002014-04-17 13:40:40 +0000107 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000108
Joachim Bingeldc03c002014-04-17 13:40:40 +0000109 private void processNode(ParseTree node) {
110 // Top-down processing
111 if (visited.contains(node)) return;
112 else visited.add(node);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000113
Joachim Bingeldc03c002014-04-17 13:40:40 +0000114 String nodeCat = getNodeCat(node);
115 openNodeCats.push(nodeCat);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000116
Joachim Bingel77ac5cb2014-04-22 14:03:28 +0000117 stackedObjects = 0;
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000118
Joachim Bingel77ac5cb2014-04-22 14:03:28 +0000119 if (verbose) {
120 System.err.println(" "+objectStack);
121 System.out.println(openNodeCats);
122 }
Joachim Bingeldc03c002014-04-17 13:40:40 +0000123
124 /*
125 ****************************************************************
126 ****************************************************************
127 * Processing individual node categories *
128 ****************************************************************
129 ****************************************************************
130 */
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000131 if (nodeCat.equals("exprTop")) {
Joachim Bingel84395b22014-12-18 10:46:18 +0000132 processExprTop(node);
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000133 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000134
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000135 if (nodeCat.equals("andTopExpr")) {
Joachim Bingel84395b22014-12-18 10:46:18 +0000136 processAndTopExpr(node);
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000137 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000138
Joachim Bingelc89952e2014-06-06 12:08:42 +0000139 if (nodeCat.equals("unary_linguistic_term")) {
Joachim Bingel84395b22014-12-18 10:46:18 +0000140 processUnary_linguistic_term(node);
Joachim Bingelc89952e2014-06-06 12:08:42 +0000141 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000142
Joachim Bingelc89952e2014-06-06 12:08:42 +0000143 if (nodeCat.equals("n_ary_linguistic_term")) {
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000144 processN_ary_linguistic_term(node);
Joachim Bingeldc03c002014-04-17 13:40:40 +0000145 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000146
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000147 if (nodeCat.equals("variableExpr")) {
Joachim Bingelab1aff42014-12-16 16:38:00 +0000148 processVariableExpr(node);
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000149 }
Joachim Bingeldc03c002014-04-17 13:40:40 +0000150
Joachim Bingel77ac5cb2014-04-22 14:03:28 +0000151 objectsToPop.push(stackedObjects);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000152
Joachim Bingeldc03c002014-04-17 13:40:40 +0000153 /*
154 ****************************************************************
155 ****************************************************************
156 * recursion until 'request' node (root of tree) is processed *
157 ****************************************************************
158 ****************************************************************
159 */
160 for (int i=0; i<node.getChildCount(); i++) {
161 ParseTree child = node.getChild(i);
162 processNode(child);
163 }
Joachim Bingel019ba5c2014-04-28 14:59:04 +0000164
Joachim Bingel77ac5cb2014-04-22 14:03:28 +0000165 /*
166 **************************************************************
167 * Stuff that happens after processing the children of a node *
168 **************************************************************
169 */
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000170 if (!objectsToPop.isEmpty()) {
171 for (int i=0; i<objectsToPop.pop(); i++) {
172 objectStack.pop();
173 }
Joachim Bingeldc03c002014-04-17 13:40:40 +0000174 }
Joachim Bingeldc03c002014-04-17 13:40:40 +0000175 openNodeCats.pop();
Joachim Bingeldc03c002014-04-17 13:40:40 +0000176 }
177
Joachim Bingel84395b22014-12-18 10:46:18 +0000178 private void processAndTopExpr(ParseTree node) {
179 // Before processing any child expr node, check if it has one or more "*ary_linguistic_term" nodes.
180 // Those nodes may use references to earlier established operand nodes.
181 // Those operand nodes are not to be included into the query map individually but
182 // naturally as operands of the relations/groups introduced by the
183 // *node. For that purpose, this section mines all used references
184 // and stores them in a list for later reference.
185 for (ParseTree exprNode : getChildrenWithCat(node,"expr")) {
186 // Pre-process any 'variableExpr' such that the variableReferences map can be filled
187 List<ParseTree> definitionNodes = new ArrayList<ParseTree>();
188 definitionNodes.addAll(getChildrenWithCat(exprNode, "variableExpr"));
189 for (ParseTree definitionNode : definitionNodes) {
190 processNode(definitionNode);
191 }
192 // Then, mine all relations between nodes
193 List<ParseTree> lingTermNodes = new ArrayList<ParseTree>();
194 lingTermNodes.addAll(getChildrenWithCat(exprNode, "n_ary_linguistic_term"));
195 globalLingTermNodes.addAll(lingTermNodes);
196 totalRelationCount = globalLingTermNodes.size();
197 // Traverse refOrNode nodes under *ary_linguistic_term nodes and extract references
198 for (ParseTree lingTermNode : lingTermNodes) {
199 for (ParseTree refOrNode : getChildrenWithCat(lingTermNode, "refOrNode")) {
200 String refOrNodeString = refOrNode.getChild(0).toStringTree(parser);
201 if (refOrNodeString.startsWith("#")) {
202 String ref = refOrNode.getChild(0).toStringTree(parser).substring(1);
203 if (nodeReferencesTotal.containsKey(ref)) {
204 nodeReferencesTotal.put(ref, nodeReferencesTotal.get(ref)+1);
205 } else {
206 nodeReferencesTotal.put(ref, 1);
207 nodeReferencesProcessed.put(ref, 0);
208 }
209 }
210 }
211 }
212 }
213 System.err.println(nodeVariables);
214 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000215
Joachim Bingel84395b22014-12-18 10:46:18 +0000216 private void processUnary_linguistic_term(ParseTree node) {
217 LinkedHashMap<String, Object> unaryOperator = parseUnaryOperator(node);
218 String reference = node.getChild(0).toStringTree(parser).substring(1);
219 LinkedHashMap<String, Object> object = nodeVariables.get(reference);
220 object.putAll(unaryOperator);
221 }
222
223 private void processExprTop(ParseTree node) {
224 List<ParseTree> andTopExprs = getChildrenWithCat(node, "andTopExpr");
225 if (andTopExprs.size() > 1) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000226 LinkedHashMap<String, Object> topOr = CqlfObjectGenerator.makeGroup("or");
Joachim Bingel84395b22014-12-18 10:46:18 +0000227 requestMap.put("query", topOr);
228 objectStack.push(topOr);
229 }
230 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000231
Joachim Bingelab1aff42014-12-16 16:38:00 +0000232 private LinkedHashMap<String, Object> processVariableExpr(ParseTree node) {
233 // simplex word or complex assignment (like qname = textSpec)?
234 String firstChildNodeCat = getNodeCat(node.getChild(0));
235 LinkedHashMap<String, Object> object = null;
236 if (firstChildNodeCat.equals("node")) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000237 object = CqlfObjectGenerator.makeSpan();
Joachim Bingelab1aff42014-12-16 16:38:00 +0000238 } else if (firstChildNodeCat.equals("tok")) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000239 object = CqlfObjectGenerator.makeToken();
Joachim Bingelab1aff42014-12-16 16:38:00 +0000240 if (node.getChildCount() > 1) { // empty tokens do not wrap a term
Joachim Bingel0e54d222015-01-12 13:22:16 +0000241 LinkedHashMap<String, Object> term = CqlfObjectGenerator.makeTerm();
Joachim Bingelab1aff42014-12-16 16:38:00 +0000242 term.put("layer", "orth");
243 object.put("wrap", term);
244 }
245 } else if (firstChildNodeCat.equals("qName")) { // only (foundry/)?layer specified
246 // may be token or span, depending on indicated layer! (e.g. cnx/cat=NP vs mate/pos=NN)
247 // TODO generalize the list below -> look up layers associated with tokens rather than spans somewhere
248 HashMap<String, Object> qNameParse = parseQNameNode(node.getChild(0));
249 if (Arrays.asList(new String[]{"p", "lemma", "m", "orth"}).contains(qNameParse.get("layer"))) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000250 object = CqlfObjectGenerator.makeToken();
251 LinkedHashMap<String, Object> term = CqlfObjectGenerator.makeTerm();
Joachim Bingelab1aff42014-12-16 16:38:00 +0000252 object.put("wrap", term);
253 term.putAll(qNameParse);
254 } else {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000255 object = CqlfObjectGenerator.makeSpan();
Joachim Bingelab1aff42014-12-16 16:38:00 +0000256 object.putAll(qNameParse);
257 }
258 } else if (firstChildNodeCat.equals("textSpec")) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000259 object = CqlfObjectGenerator.makeToken();
260 LinkedHashMap<String, Object> term = CqlfObjectGenerator.makeTerm();
Joachim Bingelab1aff42014-12-16 16:38:00 +0000261 object.put("wrap", term);
262 term.put("layer", "orth");
263 term.putAll(parseTextSpec(node.getChild(0)));
264 }
265
266 if (node.getChildCount() == 3) { // (foundry/)?layer=key specification
267 if (object.get("@type").equals("korap:token")) {
Joachim Bingel84395b22014-12-18 10:46:18 +0000268 @SuppressWarnings("unchecked")
Joachim Bingelab1aff42014-12-16 16:38:00 +0000269 HashMap<String, Object> term = (HashMap<String, Object>) object.get("wrap");
270 term.putAll(parseTextSpec(node.getChild(2)));
271 term.put("match", parseMatchOperator(getFirstChildWithCat(node, "eqOperator")));
272 } else {
273 object.putAll(parseTextSpec(node.getChild(2)));
274 object.put("match", parseMatchOperator(getFirstChildWithCat(node, "eqOperator")));
275 }
276 }
277
278 if (object != null) {
279// if (! operandOnlyNodeRefs.contains(variableCounter.toString())) {
280// putIntoSuperObject(object);
281// }
282 if (! getNodeCat(node.getParent().getParent()).equals("n_ary_linguistic_term")) {
283 putIntoSuperObject(object);
284 }
285 ParseTree parentsFirstChild = node.getParent().getChild(0);
286 if (getNodeCat(parentsFirstChild).endsWith("#")) {
287 nodeVariables.put(getNodeCat(parentsFirstChild).replaceAll("#", ""), object);
288 }
289 nodeVariables.put(variableCounter.toString(), object);
290 variableCounter++;
291 }
292 return object;
293 }
294
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000295 /**
296 * Processes an operand node, creating a map for the operand containing all its information
Joachim Bingelab1aff42014-12-16 16:38:00 +0000297 * given in the node definition (referenced via '#'). If this node has been referred to and used earlier,
298 * a reference is created in its place.
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000299 * The operand will be wrapped in a class group if necessary.
Joachim Bingelab1aff42014-12-16 16:38:00 +0000300 * @param operandNode
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000301 * @return A map object with the appropriate CQLF representation of the operand
302 */
Joachim Bingelab1aff42014-12-16 16:38:00 +0000303 private LinkedHashMap<String, Object> retrieveOperand(ParseTree operandNode) {
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000304 LinkedHashMap<String, Object> operand = null;
Joachim Bingelab1aff42014-12-16 16:38:00 +0000305 if (!getNodeCat(operandNode.getChild(0)).equals("variableExpr")) {
306 String ref = operandNode.getChild(0).toStringTree(parser).substring(1);
307 operand = nodeVariables.get(ref);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000308 if (nodeReferencesTotal.get(ref) > 1) {
309 if (nodeReferencesProcessed.get(ref)==0) {
310 refClassMapping.put(ref, classCounter);
Joachim Bingel0e54d222015-01-12 13:22:16 +0000311 operand = CqlfObjectGenerator.wrapInClass(operand, classCounter++);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000312 } else if (nodeReferencesProcessed.get(ref)>0 && nodeReferencesTotal.get(ref)>1) {
313 try {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000314 operand = CqlfObjectGenerator.wrapInReference(operandStack.pop(), refClassMapping.get(ref));
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000315 } catch (NoSuchElementException e) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000316 operand = CqlfObjectGenerator.makeReference(refClassMapping.get(ref));
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000317 }
318 }
Joachim Bingelab1aff42014-12-16 16:38:00 +0000319 nodeReferencesProcessed.put(ref, nodeReferencesProcessed.get(ref)+1);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000320 }
Joachim Bingelab1aff42014-12-16 16:38:00 +0000321 } else {
322 operand = processVariableExpr(operandNode.getChild(0));
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000323 }
324 return operand;
Joachim Bingel9c3ddb92014-06-23 13:49:58 +0000325 }
326
327 @SuppressWarnings("unchecked")
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000328 private void processN_ary_linguistic_term(ParseTree node) {
329 relationCounter++;
330 // get operator and determine type of group (sequence/treeRelation/relation/...)
331 // It's possible in Annis QL to concatenate operators, so there may be several operators under one n_ary_linguistic_term node.
332 // Counter 'i' will iteratively point to all operator nodes (odd-numbered) under this node.
333 for (int i=1; i<node.getChildCount(); i = i+2) {
334 ParseTree operandTree1 = node.getChild(i-1);
335 ParseTree operandTree2 = node.getChild(i+1);
336 String reltype = getNodeCat(node.getChild(i).getChild(0));
337
338 LinkedHashMap<String,Object> group = null;
339 ArrayList<Object> operands = null;
340 // Retrieve operands.
341 LinkedHashMap<String, Object> operand1 = retrieveOperand(operandTree1);
342 LinkedHashMap<String, Object> operand2 = retrieveOperand(operandTree2);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000343 // 'Proper' n_ary_linguistic_operators receive a considerably different serialisation than 'commonparent' and 'commonancestor'.
344 // For the latter cases, a dummy span is introduced and declared as a span class that has a dominance relation towards
345 // the two operands, one after the other, thus resulting in two nested relations! A Poliqarp+ equivalent for A $ B would be
346 // contains(focus(1:contains({1:<>},A)), B).
347 // This is modeled here...
348 if (reltype.equals("commonparent") || reltype.equals("commonancestor")) {
349 // make an (outer) group and an inner group containing the dummy node or previous relations
Joachim Bingel0e54d222015-01-12 13:22:16 +0000350 group = CqlfObjectGenerator.makeGroup("relation");
351 LinkedHashMap<String,Object> innerGroup = CqlfObjectGenerator.makeGroup("relation");
352 LinkedHashMap<String,Object> relation = CqlfObjectGenerator.makeRelation();
353 LinkedHashMap<String,Object> term = CqlfObjectGenerator.makeTerm();
Joachim Bingel62892412014-08-06 15:18:59 +0000354 term.put("layer", "c");
355 relation.put("wrap", term);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000356 // commonancestor is an indirect commonparent relation
Joachim Bingel0e54d222015-01-12 13:22:16 +0000357 if (reltype.equals("commonancestor")) relation.put("boundary", CqlfObjectGenerator.makeBoundary(1, null));
Joachim Bingel62892412014-08-06 15:18:59 +0000358 group.put("relation", relation);
359 innerGroup.put("relation", relation);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000360 // Get operands list before possible re-assignment of 'group' (see following 'if')
361 ArrayList<Object> outerOperands = (ArrayList<Object>) group.get("operands");
362 ArrayList<Object> innerOperands = (ArrayList<Object>) innerGroup.get("operands");
363 // for lowest level, add the underspecified node as first operand and wrap it in a class group
364 if (i == 1) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000365 innerOperands.add(CqlfObjectGenerator.wrapInClass(CqlfObjectGenerator.makeSpan(), classCounter));
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000366 // add the first operand and wrap the whole group in a focusing reference
367 innerOperands.add(operand1);
Joachim Bingel0e54d222015-01-12 13:22:16 +0000368 innerGroup = CqlfObjectGenerator.wrapInReference(innerGroup, classCounter);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000369 outerOperands.add(innerGroup);
370 } else {
371 outerOperands.add(operandStack.pop());
372 }
373 // Lookahead: if next operator is not commonparent or commonancestor, wrap in class for accessibility
374 if (i < node.getChildCount()-2 && !getNodeCat(node.getChild(i+2).getChild(0)).startsWith("common")) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000375 operand2 = CqlfObjectGenerator.wrapInClass(operand2, ++classCounter);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000376 }
377 outerOperands.add(operand2);
378
379 // Wrap in another reference object in case other relations are following
380 if (i < node.getChildCount()-2) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000381 group = CqlfObjectGenerator.wrapInReference(group, classCounter);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000382 }
Joachim Bingel62892412014-08-06 15:18:59 +0000383 // All other n-ary linguistic relations have special 'relation' attributes defined in CQLF and can be
384 // handled more easily...
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000385 } else {
386 LinkedHashMap<String, Object> operatorGroup = parseOperatorNode(node.getChild(i).getChild(0));
387 String groupType;
388 try {
389 groupType = (String) operatorGroup.get("groupType");
390 } catch (ClassCastException | NullPointerException n) {
391 groupType = "relation";
392 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000393 if (groupType.equals("relation") || groupType.equals("treeRelation")) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000394 group = CqlfObjectGenerator.makeGroup(groupType);
Joachim Bingel62892412014-08-06 15:18:59 +0000395 LinkedHashMap<String, Object> relation = new LinkedHashMap<String, Object>();
396 putAllButGroupType(relation, operatorGroup);
Joachim Bingel62892412014-08-06 15:18:59 +0000397 group.put("relation", relation);
Joachim Bingele6d73b12014-09-30 15:34:59 +0000398 } else if (groupType.equals("sequence")) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000399 group = CqlfObjectGenerator.makeGroup(groupType);
Joachim Bingele6d73b12014-09-30 15:34:59 +0000400 putAllButGroupType(group, operatorGroup);
401 } else if (groupType.equals("position")) {
402 group = new LinkedHashMap<String,Object>();
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000403 putAllButGroupType(group, operatorGroup);
404 }
Joachim Bingele6d73b12014-09-30 15:34:59 +0000405
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000406 // Get operands list before possible re-assignment of 'group' (see following 'if')
407 operands = (ArrayList<Object>) group.get("operands");
Joachim Bingel755ada92014-12-16 13:55:37 +0000408
409 ParseTree leftChildSpec = getFirstChildWithCat(node.getChild(i).getChild(0), "@l");
410 ParseTree rightChildSpec = getFirstChildWithCat(node.getChild(i).getChild(0), "@r");
Joachim Bingelab1aff42014-12-16 16:38:00 +0000411 if (leftChildSpec != null || rightChildSpec != null) {
Joachim Bingel755ada92014-12-16 13:55:37 +0000412 String frame = (leftChildSpec!=null) ? "frames:startswith" : "frames:endswith";
Joachim Bingel0e54d222015-01-12 13:22:16 +0000413 LinkedHashMap<String,Object> positionGroup = CqlfObjectGenerator.makePosition(new String[]{frame}, null);
414 operand2 = CqlfObjectGenerator.wrapInClass(operand2, ++classCounter);
Joachim Bingel755ada92014-12-16 13:55:37 +0000415 ((ArrayList<Object>) positionGroup.get("operands")).add(group);
Joachim Bingel0e54d222015-01-12 13:22:16 +0000416 ((ArrayList<Object>) positionGroup.get("operands")).add(CqlfObjectGenerator.makeReference(classCounter,true));
Joachim Bingel755ada92014-12-16 13:55:37 +0000417 group = positionGroup;
418 }
419
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000420 // Wrap in reference object in case other relations are following
421 if (i < node.getChildCount()-2) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000422 group = CqlfObjectGenerator.wrapInReference(group, classCounter);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000423 }
424
425 // Inject operands.
426 // -> Case distinction:
427 if (node.getChildCount()==3) {
428 // Things are easy when there's just one operator (thus 3 children incl. operands)...
429 if (operand1 != null) operands.add(operand1);
430 if (operand2 != null) operands.add(operand2);
431 } else {
Joachim Bingel66472b82014-12-04 16:00:05 +0000432 // ... but things get a little more complicated here. The AST is of this form: (operand1 operator1 operand2 operator2 operand3 operator3 ...)
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000433 // but we'll have to serialize it in a nested, binary way: (((operand1 operator1 operand2) operator2 operand3) operator3 ...)
434 // the following code will do just that:
435 if (i == 1) {
436 // for the first operator, include both operands
437 if (operand1 != null) operands.add(operand1);
Joachim Bingel0e54d222015-01-12 13:22:16 +0000438 if (operand2 != null) operands.add(CqlfObjectGenerator.wrapInClass(operand2, classCounter++));
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000439 // Don't put this into the super object directly but store on operandStack
440 // (because this group will have to be an operand of a subsequent operator)
441 operandStack.push(group);
442 // for all subsequent operators, only take the 2nd operand (first was already added by previous operator)
443 } else if (i < node.getChildCount()-2) {
444 // for all intermediate operators, include other previous groups and 2nd operand. Store this on the operandStack, too.
Joachim Bingel0e54d222015-01-12 13:22:16 +0000445 if (operand2 != null) operands.add(CqlfObjectGenerator.wrapInClass(operand2, classCounter++));
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000446 operands.add(0, operandStack.pop());
447 operandStack.push(group);
448 } else if (i == node.getChildCount()-2) {
449 // This is the last operator. Include 2nd operand only
450 if (operand2 != null) operands.add(operand2);
451 }
452 }
453 }
454 // Final step: decide what to do with the 'group' object, depending on whether all relations have been processed
455 if (i == node.getChildCount()-2 && relationCounter == totalRelationCount) {
456 putIntoSuperObject(group);
457 if (!operandStack.isEmpty()) {
458 operands.add(0, operandStack.pop());
459 }
460 objectStack.push(group);
461 stackedObjects++;
462 } else {
463 operandStack.push(group);
464 }
465 }
Joachim Bingel9c3ddb92014-06-23 13:49:58 +0000466 }
467
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000468
469
Joachim Bingelca4944e2014-06-13 13:55:10 +0000470 /**
471 * Parses a unary_linguistic_operator node. Possible operators are: root, arity, tokenarity.
472 * Operators are embedded into a korap:term, in turn wrapped by an 'attr' property in a korap:span.
473 * @param node The unary_linguistic_operator node
474 * @return A map containing the attr key, to be inserted into korap:span
475 */
476 private LinkedHashMap<String, Object> parseUnaryOperator(ParseTree node) {
477 LinkedHashMap<String, Object> attr = new LinkedHashMap<String, Object>();
Joachim Bingel0e54d222015-01-12 13:22:16 +0000478 LinkedHashMap<String, Object> term = CqlfObjectGenerator.makeTerm();
Joachim Bingelca4944e2014-06-13 13:55:10 +0000479 String op = node.getChild(1).toStringTree(parser).substring(1);
480 if (op.equals("arity") || op.equals("tokenarity")) {
481 LinkedHashMap<String, Object> boundary = boundaryFromRangeSpec(node.getChild(3), false);
482 term.put(op, boundary);
483 } else {
484 term.put(op, true);
485 }
Joachim Bingelca4944e2014-06-13 13:55:10 +0000486 attr.put("attr", term);
487 return attr;
488 }
489
Joachim Bingel66472b82014-12-04 16:00:05 +0000490 @SuppressWarnings("unchecked")
Joachim Bingeleee549e2014-04-29 11:15:37 +0000491 private LinkedHashMap<String, Object> parseOperatorNode(ParseTree operatorNode) {
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000492 LinkedHashMap<String, Object> relation = null;
Joachim Bingeleee549e2014-04-29 11:15:37 +0000493 String operator = getNodeCat(operatorNode);
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000494 // DOMINANCE
Joachim Bingeleee549e2014-04-29 11:15:37 +0000495 if (operator.equals("dominance")) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000496 relation = CqlfObjectGenerator.makeRelation();
Joachim Bingel13421ef2014-05-07 16:22:58 +0000497 relation.put("groupType", "relation");
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000498 ParseTree qName = getFirstChildWithCat(operatorNode, "qName");
Joachim Bingel66472b82014-12-04 16:00:05 +0000499 ParseTree edgeSpecNode = getFirstChildWithCat(operatorNode, "edgeSpec");
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000500 ParseTree star = getFirstChildWithCat(operatorNode, "*");
501 ParseTree rangeSpec = getFirstChildWithCat(operatorNode, "rangeSpec");
Joachim Bingel0e54d222015-01-12 13:22:16 +0000502 LinkedHashMap<String,Object> term = CqlfObjectGenerator.makeTerm();
Joachim Bingel62892412014-08-06 15:18:59 +0000503 term.put("layer", "c");
Joachim Bingel62892412014-08-06 15:18:59 +0000504 if (qName != null) term = parseQNameNode(qName);
Joachim Bingel66472b82014-12-04 16:00:05 +0000505 if (edgeSpecNode != null) {
506 LinkedHashMap<String,Object> edgeSpec = parseEdgeSpec(edgeSpecNode);
507 String edgeSpecType = (String) edgeSpec.get("@type");
508 if (edgeSpecType.equals("korap:termGroup")) {
509 ((ArrayList<Object>) edgeSpec.get("operands")).add(term);
510 term = edgeSpec;
511 } else {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000512 term = CqlfObjectGenerator.makeTermGroup("and");
Joachim Bingel66472b82014-12-04 16:00:05 +0000513 ArrayList<Object> termGroupOperands = (ArrayList<Object>) term.get("operands");
514 termGroupOperands.add(edgeSpec);
Joachim Bingel0e54d222015-01-12 13:22:16 +0000515 LinkedHashMap<String,Object> constTerm = CqlfObjectGenerator.makeTerm();
Joachim Bingel66472b82014-12-04 16:00:05 +0000516 constTerm.put("layer", "c");
517 termGroupOperands.add(constTerm);
518 }
519 }
Joachim Bingel0e54d222015-01-12 13:22:16 +0000520 if (star != null) relation.put("boundary", CqlfObjectGenerator.makeBoundary(0, null));
Joachim Bingel86195a52014-07-08 14:29:48 +0000521 if (rangeSpec != null) relation.put("boundary", boundaryFromRangeSpec(rangeSpec));
Joachim Bingel62892412014-08-06 15:18:59 +0000522 relation.put("wrap", term);
Joachim Bingeleee549e2014-04-29 11:15:37 +0000523 }
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000524 else if (operator.equals("pointing")) {
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000525 // String reltype = operatorNode.getChild(1).toStringTree(parser);
Joachim Bingel0e54d222015-01-12 13:22:16 +0000526 relation = CqlfObjectGenerator.makeRelation();
Joachim Bingel13421ef2014-05-07 16:22:58 +0000527 relation.put("groupType", "relation");
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000528 ParseTree qName = getFirstChildWithCat(operatorNode, "qName");
529 ParseTree edgeSpec = getFirstChildWithCat(operatorNode, "edgeSpec");
530 ParseTree star = getFirstChildWithCat(operatorNode, "*");
531 ParseTree rangeSpec = getFirstChildWithCat(operatorNode, "rangeSpec");
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000532 // if (qName != null) relation.putAll(parseQNameNode(qName));
Joachim Bingel0e54d222015-01-12 13:22:16 +0000533 LinkedHashMap<String,Object> term = CqlfObjectGenerator.makeTerm();
Joachim Bingel62892412014-08-06 15:18:59 +0000534 if (qName != null) term.putAll(parseQNameNode(qName));
535 if (edgeSpec != null) term.putAll(parseEdgeSpec(edgeSpec));
Joachim Bingel0e54d222015-01-12 13:22:16 +0000536 if (star != null) relation.put("boundary", CqlfObjectGenerator.makeBoundary(0, null));
Joachim Bingel86195a52014-07-08 14:29:48 +0000537 if (rangeSpec != null) relation.put("boundary", boundaryFromRangeSpec(rangeSpec));
Joachim Bingel62892412014-08-06 15:18:59 +0000538 relation.put("wrap", term);
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000539 }
540 else if (operator.equals("precedence")) {
Joachim Bingel13421ef2014-05-07 16:22:58 +0000541 relation = new LinkedHashMap<String, Object>();
542 relation.put("groupType", "sequence");
543 ParseTree rangeSpec = getFirstChildWithCat(operatorNode, "rangeSpec");
544 ParseTree star = getFirstChildWithCat(operatorNode, "*");
545 ArrayList<Object> distances = new ArrayList<Object>();
546 if (star != null) {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000547 distances.add(CqlfObjectGenerator.makeDistance("w", 0, null));
Joachim Bingel13421ef2014-05-07 16:22:58 +0000548 relation.put("distances", distances);
549 }
550 if (rangeSpec != null) {
551 distances.add(parseDistance(rangeSpec));
552 relation.put("distances", distances);
553 }
554 relation.put("inOrder", true);
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000555 }
556 else if (operator.equals("spanrelation")) {
Joachim Bingele6d73b12014-09-30 15:34:59 +0000557// relation = makeGroup("position");
558// relation.put("groupType", "position");
Joachim Bingel75038792014-05-19 15:12:23 +0000559 String reltype = operatorNode.getChild(0).toStringTree(parser);
Joachim Bingele6d73b12014-09-30 15:34:59 +0000560 String[] frames = new String[]{};
Joachim Bingel75038792014-05-19 15:12:23 +0000561 switch (reltype) {
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000562 case "_=_":
Joachim Bingel6b491c22014-10-21 08:35:18 +0000563 frames = new String[]{"frames:matches"};
Joachim Bingele6d73b12014-09-30 15:34:59 +0000564 break;
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000565 case "_l_":
Joachim Bingel6b491c22014-10-21 08:35:18 +0000566 frames = new String[]{"frames:startswith"};
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000567 break;
568 case "_r_":
Joachim Bingel6b491c22014-10-21 08:35:18 +0000569 frames = new String[]{"frames:endswith"};
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000570 break;
571 case "_i_":
Joachim Bingel6b491c22014-10-21 08:35:18 +0000572 frames = new String[]{"frames:contains"};break;
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000573 case "_o_":
Joachim Bingel6b491c22014-10-21 08:35:18 +0000574 frames = new String[]{"frames:overlapsLeft", "frames:overlapsRight"};
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000575 break;
576 case "_ol_":
Joachim Bingel6b491c22014-10-21 08:35:18 +0000577 frames = new String[]{"frames:overlapsLeft"};
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000578 break;
579 case "_or_":
Joachim Bingel6b491c22014-10-21 08:35:18 +0000580 frames = new String[]{"frames:overlapsRight"};
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000581 break;
Joachim Bingel75038792014-05-19 15:12:23 +0000582 }
Joachim Bingele6d73b12014-09-30 15:34:59 +0000583// relation.put("frames", frames);
584// relation.put("sharedClasses", sharedClasses);
Joachim Bingel0e54d222015-01-12 13:22:16 +0000585 relation = CqlfObjectGenerator.makePosition(frames, new String[]{});
Joachim Bingele6d73b12014-09-30 15:34:59 +0000586 relation.put("groupType", "position");
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000587 }
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000588 else if (operator.equals("identity")) {
Joachim Bingel66472b82014-12-04 16:00:05 +0000589 //TODO since ANNIS v. 3.1.6
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000590 }
591 else if (operator.equals("equalvalue")) {
Joachim Bingel66472b82014-12-04 16:00:05 +0000592 //TODO since ANNIS v. 3.1.6
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000593 }
594 else if (operator.equals("notequalvalue")) {
Joachim Bingel66472b82014-12-04 16:00:05 +0000595 //TODO since ANNIS v. 3.1.6
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000596 }
597 return relation;
598 }
599
Joachim Bingelceb79062014-09-22 11:50:37 +0000600 @SuppressWarnings("unchecked")
Joachim Bingel62892412014-08-06 15:18:59 +0000601 private LinkedHashMap<String,Object> parseEdgeSpec(ParseTree edgeSpec) {
602 List<ParseTree> annos = getChildrenWithCat(edgeSpec, "edgeAnno");
603 if (annos.size() == 1) return parseEdgeAnno(annos.get(0));
604 else {
Joachim Bingel0e54d222015-01-12 13:22:16 +0000605 LinkedHashMap<String,Object> termGroup = CqlfObjectGenerator.makeTermGroup("and");
Joachim Bingel62892412014-08-06 15:18:59 +0000606 ArrayList<Object> operands = (ArrayList<Object>) termGroup.get("operands");
607 for (ParseTree anno : annos) {
608 operands.add(parseEdgeAnno(anno));
609 }
610 return termGroup;
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000611 }
Joachim Bingeleee549e2014-04-29 11:15:37 +0000612 }
613
Joachim Bingel66472b82014-12-04 16:00:05 +0000614 private LinkedHashMap<String, Object> parseEdgeAnno(ParseTree edgeAnnoSpec) {
Joachim Bingeleee549e2014-04-29 11:15:37 +0000615 LinkedHashMap<String, Object> edgeAnno = new LinkedHashMap<String, Object>();
Joachim Bingela07b8e72014-05-09 15:06:07 +0000616 edgeAnno.put("@type", "korap:term");
Joachim Bingel66472b82014-12-04 16:00:05 +0000617 ParseTree textSpecNode = getFirstChildWithCat(edgeAnnoSpec, "textSpec");
618 ParseTree layerNode = getFirstChildWithCat(edgeAnnoSpec, "layer");
619 ParseTree foundryNode = getFirstChildWithCat(edgeAnnoSpec, "foundry");
620 ParseTree matchOperatorNode = getFirstChildWithCat(edgeAnnoSpec, "eqOperator");
Joachim Bingel639df9c2014-05-12 15:27:00 +0000621 if (foundryNode!=null) edgeAnno.put("foundry", foundryNode.getChild(0).toStringTree(parser));
622 if (layerNode!=null) edgeAnno.put("layer", layerNode.getChild(0).toStringTree(parser));
Joachim Bingeleee549e2014-04-29 11:15:37 +0000623 edgeAnno.putAll(parseTextSpec(textSpecNode));
624 edgeAnno.put("match", parseMatchOperator(matchOperatorNode));
625 return edgeAnno;
626 }
627
Joachim Bingela07b8e72014-05-09 15:06:07 +0000628 private LinkedHashMap<String, Object> boundaryFromRangeSpec(ParseTree rangeSpec) {
Joachim Bingelca4944e2014-06-13 13:55:10 +0000629 return boundaryFromRangeSpec(rangeSpec, true);
630 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000631
Joachim Bingelca4944e2014-06-13 13:55:10 +0000632 private LinkedHashMap<String, Object> boundaryFromRangeSpec(ParseTree rangeSpec, boolean expandToMax) {
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000633 Integer min = Integer.parseInt(rangeSpec.getChild(0).toStringTree(parser));
Joachim Bingelca4944e2014-06-13 13:55:10 +0000634 Integer max = min;
Joachim Bingel687e4d42014-07-30 09:34:18 +0000635 if (expandToMax) max = null;
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000636 if (rangeSpec.getChildCount()==3)
637 max = Integer.parseInt(rangeSpec.getChild(2).toStringTree(parser));
Joachim Bingel0e54d222015-01-12 13:22:16 +0000638 return CqlfObjectGenerator.makeBoundary(min, max);
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000639 }
Joachim Bingela07b8e72014-05-09 15:06:07 +0000640
Joachim Bingel13421ef2014-05-07 16:22:58 +0000641 private LinkedHashMap<String, Object> parseDistance(ParseTree rangeSpec) {
642 Integer min = Integer.parseInt(rangeSpec.getChild(0).toStringTree(parser));
Joachim Bingel687e4d42014-07-30 09:34:18 +0000643 Integer max = null;
Joachim Bingel13421ef2014-05-07 16:22:58 +0000644 if (rangeSpec.getChildCount()==3)
645 max = Integer.parseInt(rangeSpec.getChild(2).toStringTree(parser));
Joachim Bingel0e54d222015-01-12 13:22:16 +0000646 return CqlfObjectGenerator.makeDistance("w", min, max);
Joachim Bingel13421ef2014-05-07 16:22:58 +0000647 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000648
Joachim Bingeleee549e2014-04-29 11:15:37 +0000649 private LinkedHashMap<String, Object> parseTextSpec(ParseTree node) {
650 LinkedHashMap<String, Object> term = new LinkedHashMap<String, Object>();
Joachim Bingel019ba5c2014-04-28 14:59:04 +0000651 if (hasChild(node, "regex")) {
652 term.put("type", "type:regex");
653 term.put("key", node.getChild(0).getChild(0).toStringTree(parser).replaceAll("/", ""));
654 } else {
655 term.put("key", node.getChild(1).toStringTree(parser));
656 }
657 term.put("match", "match:eq");
658 return term;
659 }
660
Joachim Bingeldc03c002014-04-17 13:40:40 +0000661 /**
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000662 * Parses the match operator (= or !=)
Joachim Bingeldc03c002014-04-17 13:40:40 +0000663 * @param node
664 * @return
665 */
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000666 private String parseMatchOperator(ParseTree node) {
Joachim Bingel66472b82014-12-04 16:00:05 +0000667 if (node.getChildCount()>0) {
668 return node.getChild(0).toStringTree(parser).equals("=") ? "match:eq" : "match:ne";
669 }
670 return null;
Joachim Bingeldc03c002014-04-17 13:40:40 +0000671 }
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000672
673 private LinkedHashMap<String, Object> parseQNameNode(ParseTree node) {
674 LinkedHashMap<String, Object> fields = new LinkedHashMap<String, Object>();
Joachim Bingeld4ae5fd2014-04-29 15:00:16 +0000675 ParseTree layerNode = getFirstChildWithCat(node, "layer");
676 ParseTree foundryNode = getFirstChildWithCat(node, "foundry");
677 if (foundryNode != null) fields.put("foundry", foundryNode.getChild(0).toStringTree(parser));
Joachim Bingel66472b82014-12-04 16:00:05 +0000678 String layer = layerNode.getChild(0).toStringTree(parser);
679 if (layer.equals("pos")) layer = "p";
680 if (layer.equals("cat")) layer = "c";
681 fields.put("layer", layer);
Joachim Bingelc8a28e42014-04-24 15:06:42 +0000682 return fields;
683 }
684
Joachim Bingel77ac5cb2014-04-22 14:03:28 +0000685 private void putIntoSuperObject(LinkedHashMap<String, Object> object) {
686 putIntoSuperObject(object, 0);
687 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000688
Joachim Bingel77ac5cb2014-04-22 14:03:28 +0000689 @SuppressWarnings({ "unchecked" })
690 private void putIntoSuperObject(LinkedHashMap<String, Object> object, int objStackPosition) {
Joachim Bingel9c3ddb92014-06-23 13:49:58 +0000691 if (objectStack.size()>objStackPosition) {
Joachim Bingel77ac5cb2014-04-22 14:03:28 +0000692 ArrayList<Object> topObjectOperands = (ArrayList<Object>) objectStack.get(objStackPosition).get("operands");
Joachim Bingel75038792014-05-19 15:12:23 +0000693 if (!invertedOperandsLists.contains(topObjectOperands)) {
694 topObjectOperands.add(object);
695 } else {
696 topObjectOperands.add(0, object);
697 }
Joachim Bingel77ac5cb2014-04-22 14:03:28 +0000698 } else {
699 requestMap.put("query", object);
700 }
701 }
Joachim Bingel9c3ddb92014-06-23 13:49:58 +0000702
Joachim Bingel13421ef2014-05-07 16:22:58 +0000703 private void putAllButGroupType(Map<String, Object> container, Map<String, Object> input) {
704 for (String key : input.keySet()) {
705 if (!key.equals("groupType")) {
706 container.put(key, input.get(key));
707 }
708 }
709 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000710
Joachim Bingel3d5b69b2015-01-14 10:46:44 +0000711 private ParserRuleContext parseAnnisQuery (String query) {
Joachim Bingel3fa584b2014-12-17 13:35:43 +0000712 Lexer lexer = new AqlLexer((CharStream)null);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000713 ParserRuleContext tree = null;
Joachim Bingel3fa584b2014-12-17 13:35:43 +0000714 Antlr4DescriptiveErrorListener errorListener = new Antlr4DescriptiveErrorListener(query);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000715 // Like p. 111
716 try {
Joachim Bingeldc03c002014-04-17 13:40:40 +0000717
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000718 // Tokenize input data
Joachim Bingel3fa584b2014-12-17 13:35:43 +0000719 ANTLRInputStream input = new ANTLRInputStream(query);
720 lexer.setInputStream(input);
721 CommonTokenStream tokens = new CommonTokenStream(lexer);
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000722 parser = new AqlParser(tokens);
Joachim Bingeldc03c002014-04-17 13:40:40 +0000723
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000724 // Don't throw out erroneous stuff
725 parser.setErrorHandler(new BailErrorStrategy());
Joachim Bingel3fa584b2014-12-17 13:35:43 +0000726 lexer.removeErrorListeners();
727 lexer.addErrorListener(errorListener);
728 parser.removeErrorListeners();
729 parser.addErrorListener(errorListener);
Joachim Bingeldc03c002014-04-17 13:40:40 +0000730
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000731 // Get starting rule from parser
732 Method startRule = AqlParser.class.getMethod("start");
733 tree = (ParserRuleContext) startRule.invoke(parser, (Object[])null);
734 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000735 // Some things went wrong ...
736 catch (Exception e) {
Joachim Bingele3fe3672014-12-17 18:35:58 +0000737 log.error("Could not parse query. Please make sure it is well-formed.");
738 log.error(errorListener.generateFullErrorMsg().toString());
739 addError(errorListener.generateFullErrorMsg());
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000740 }
Joachim Bingel1846c8c2014-07-08 14:13:31 +0000741 return tree;
742 }
Joachim Bingel761d1c12014-12-17 14:02:40 +0000743}