// blob: ba0e8c20ff76e78aaabcb86f8c446ff39629385e [file] [log] [blame]
/*
var menuContent = [
  ['cnx/c', 'cnx', 'c'],
  ['mate/c', 'mate', 'c'],
  ['base/c', 'base', 'c'],
  ['xip/c', 'xip', 'c'],
  ['tt/c', 'tt', 'c']
];
*/

/*
 * Named-entity tags, used as the value list for the "corenlp/ne*=" keys
 * of the annotation menu object built further down in this file.
 *
 * Each entry is a triple of strings: [tag, tag followed by one space,
 * human-readable description].
 * NOTE(review): the second element is presumably the text inserted into
 * the query when the entry is chosen - confirm against the menu consumer.
 */
var namedEntities = [
  ["I-LOC", "I-LOC ", "Location"],
  ["I-MISC", "I-MISC ", "Miscellaneous"],
  ["I-ORG", "I-ORG ", "Organization"],
  ["I-PER", "I-PER ", "Person"]
];

/*
 * STTS part-of-speech tags. This list is shared by several "<foundry>/p="
 * keys of the annotation menu object built further down in this file and
 * is the base for mateSttsArray and sgbrSttsArray.
 *
 * Each entry is a triple of strings: [tag, tag followed by one space,
 * human-readable description].
 * NOTE(review): the second element is presumably the text inserted into
 * the query when the entry is chosen - confirm against the menu consumer.
 *
 * References:
 */
// http://www.ids-mannheim.de/cosmas2/projekt/referenz/stts/morph.html
// http://nachhalt.sfb632.uni-potsdam.de/owl-docu/stts.html
var sttsArray = [
  // Punctuation tags are not listed: "$.", "$(", "$,"
  ["ADJA", "ADJA ", "Attributive Adjective"],
  ["ADJD", "ADJD ", "Predicative Adjective"],
  ["ADV", "ADV ", "Adverb"],
  ["APPO", "APPO ", "Postposition"],
  ["APPR", "APPR ", "Preposition"],
  ["APPRART", "APPRART ", "Preposition with Determiner"],
  ["APZR", "APZR ", "Right Circumposition"],
  ["ART", "ART ", "Determiner"],
  ["CARD", "CARD ", "Cardinal Number"],
  ["FM", "FM ", "Foreign Material"],
  ["ITJ", "ITJ ", "Interjection"],
  ["KOKOM", "KOKOM ", "Comparison Particle"],
  ["KON", "KON ", "Coordinating Conjunction"],
  ["KOUI", "KOUI ", "Subordinating Conjunction with 'zu'"],
  ["KOUS", "KOUS ", "Subordinating Conjunction with Sentence"],
  ["NE", "NE ", "Named Entity"],
  ["NN", "NN ", "Normal Nomina"],
  ["PAV", "PAV ", "Pronominal Adverb"],
  ["PDAT", "PDAT ", "Attributive Demonstrative Pronoun"],
  ["PDS", "PDS ", "Substitutive Demonstrative Pronoun"],
  ["PIAT", "PIAT ", "Attributive Indefinite Pronoun without Determiner"],
  ["PIDAT", "PIDAT ", "Attributive Indefinite Pronoun with Determiner"],
  ["PIS", "PIS ", "Substitutive Indefinite Pronoun"],
  ["PPER", "PPER ", "Personal Pronoun"],
  ["PPOSAT", "PPOSAT ", "Attributive Possessive Pronoun"],
  ["PPOSS", "PPOSS ", "Substitutive Possessive Pronoun"],
  ["PRELAT", "PRELAT ", "Attributive Relative Pronoun"],
  ["PRELS", "PRELS ", "Substitutive Relative Pronoun"],
  ["PRF", "PRF ", "Reflexive Pronoun"],
  ["PROAV", "PROAV ", "Pronominal Adverb"],
  ["PTKA", "PTKA ", "Particle with Adjective"],
  ["PTKANT", "PTKANT ", "Answering Particle"],
  ["PTKNEG", "PTKNEG ", "Negation Particle"],
  ["PTKVZ", "PTKVZ ", "Separated Verbal Particle"],
  ["PTKZU", "PTKZU ", "'zu' Particle"],
  ["PWAT", "PWAT ", "Attributive Interrogative Pronoun"],
  ["PWAV", "PWAV ", "Adverbial Interrogative Pronoun"],
  ["PWS", "PWS ", "Substitutive Interrogative Pronoun"],
  ["TRUNC", "TRUNC ", "Truncated"],
  ["VAFIN", "VAFIN ", "Auxiliary Finite Verb"],
  ["VAIMP", "VAIMP ", "Auxiliary Finite Imperative Verb"],
  ["VAINF", "VAINF ", "Auxiliary Infinite Verb"],
  ["VAPP", "VAPP ", "Auxiliary Perfect Participle"],
  ["VMFIN", "VMFIN ", "Modal Finite Verb"],
  ["VMINF", "VMINF ", "Modal Infinite Verb"],
  ["VMPP", "VMPP ", "Modal Perfect Participle"],
  ["VVFIN", "VVFIN ", "Finite Verb"],
  ["VVIMP", "VVIMP ", "Finite Imperative Verb"],
  ["VVINF", "VVINF ", "Infinite Verb"],
  ["VVIZU", "VVIZU ", "Infinite Verb with 'zu'"],
  ["VVPP", "VVPP ", "Perfect Participle"],
  ["XY", "XY ", "Non-Word"]
];

/*
 * NEGRA constituency node labels. Used as the value list for the
 * "corenlp/c=" key of the annotation menu object built further down in
 * this file; that code also derives one "corenlp/c=<label>-" key per
 * entry from the first element.
 *
 * Each entry is a triple of strings: [label, label, description].
 * Unlike the STTS list, the second element has no trailing space.
 *
 * References:
 */
// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/negra-corpus.html
// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/knoten.html
var negraNodes = [
  ["AA", "AA", "superlative phrase with 'am'"],
  ["AP", "AP", "adjective phrase"],
  ["AVP", "AVP", "adverbial phrase"],
  ["CAP", "CAP", "coordinated adjective phrase"],
  ["CAVP", "CAVP", "coordinated adverbial phrase"],
  ["CAC", "CAC", "coordinated adposition"],
  ["CCP", "CCP", "coordinated complementiser"],
  ["CH", "CH", "chunk"],
  ["CNP", "CNP", "coordinated noun phrase"],
  ["CO", "CO", "coordination"],
  ["CPP", "CPP", "coordinated adpositional phrase"],
  ["CS", "CS", "coordinated sentence"],
  ["CVP", "CVP", "coordinated verb phrase (non-finite)"],
  ["CVZ", "CVZ", "coordinated zu-marked infinitive"],
  ["DL", "DL", "discourse level constituent"],
  ["ISU", "ISU", "idiosyncratic unit"],
  ["MPN", "MPN", "multi-word proper noun"],
  ["MTA", "MTA", "multi-token adjective"],
  ["NM", "NM", "multi-token number"],
  ["NP", "NP", "noun phrase"],
  ["PP", "PP", "adpositional phrase"],
  ["QL", "QL", "quasi-language"],
  ["ROOT", "ROOT", "root node"],
  ["S", "S", "sentence"],
  ["VP", "VP", "verb phrase (non-finite)"],
  ["VZ", "VZ", "zu-marked infinitive"]
];

/*
 * NEGRA edge (grammatical function) labels. The annotation menu object
 * built further down in this file assigns this list to every
 * "corenlp/c=<node label>-" key.
 *
 * Each entry is a triple of strings: [label, label, description].
 *
 * Reference:
 */
// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/kanten.html
var negraEdges = [
  ["AC", "AC", "adpositional case marker"],
  ["ADC", "ADC", "adjective component"],
  ["AMS", "AMS", "measure argument of adj"],
  ["APP", "APP", "apposition"],
  ["AVC", "AVC", "adverbial phrase component"],
  ["CC", "CC", "comparative complement"],
  ["CD", "CD", "coordinating conjunction"],
  ["CJ", "CJ", "conjunct"],
  ["CM", "CM", "comparative conjunction"],
  ["CP", "CP", "complementizer"],
  ["DA", "DA", "dative"],
  ["DH", "DH", "discourse-level head"],
  ["DM", "DM", "discourse marker"],
  ["GL", "GL", "prenominal genitive"],
  ["GR", "GR", "postnominal genitive"],
  ["HD", "HD", "head"],
  ["JU", "JU", "junctor"],
  ["MC", "MC", "comitative"],
  ["MI", "MI", "instrumental"],
  ["ML", "ML", "locative"],
  ["MNR", "MNR", "postnominal modifier"],
  ["MO", "MO", "modifier"],
  ["MR", "MR", "rhetorical modifier"],
  ["MW", "MW", "way (directional modifier)"],
  ["NG", "NG", "negation"],
  ["NK", "NK", "noun kernel modifier"],
  ["NMC", "NMC", "numerical component"],
  ["OA", "OA", "accusative object"],
  ["OA2", "OA2", "second accusative object"],
  ["OC", "OC", "clausal object"],
  ["OG", "OG", "genitive object"],
  ["PD", "PD", "predicate"],
  ["PG", "PG", "pseudo-genitive"],
  ["PH", "PH", "placeholder"],
  ["PM", "PM", "morphological particle"],
  ["PNC", "PNC", "proper noun component"],
  ["RC", "RC", "relative clause"],
  ["RE", "RE", "repeated element"],
  ["RS", "RS", "reported speech"],
  ["SB", "SB", "subject"],
  ["SBP", "SBP", "passivised subject (PP)"],
  ["SP", "SP", "subject or predicate"],
  ["SVP", "SVP", "separable verb prefix"],
  ["UC", "UC", "(idiosyncratic) unit component"],
  ["VO", "VO", "vocative"]
];

/*
 * STTS tag list for the "mate/p=" key: a new array holding every entry
 * of sttsArray followed by the additional root tag. concat() returns a
 * fresh array, so sttsArray itself is not modified (the entry triples
 * are shared by reference, as they were with slice(0)).
 */
var mateSttsArray = sttsArray.concat([
  ["<root-POS>", "<root-POS>", "Root Part of Speech"]
]);

/*
 * STTS tag list for the "sgbr/p=" key (Schreibgebrauch): a new array
 * holding every entry of sttsArray plus the Schreibgebrauch-specific
 * tags below, sorted by tag. concat() returns a fresh array, so
 * sttsArray itself is neither extended nor reordered.
 */
var sgbrSttsArray = sttsArray.concat([
  // Specific information for Schreibgebrauch
  ["NNE", "NNE", "Normal Nomina with Named Entity"],
  ["ADVART", "ADVART", "Adverb with Article"],
  ["EMOASC", "EMOASC", "ASCII emoticon"],
  ["EMOIMG", "EMOIMG", "Graphic emoticon"],
  ["ERRTOK", "ERRTOK", "Tokenisation Error"],
  ["HST", "HST", "Hashtag"],
  ["KOUSPPER", "KOUSPPER", "Subordinating Conjunction (with Sentence) with Personal Pronoun"],
  ["ONO", "ONO", "Onomatopoeia"],
  ["PPERPPER", "PPERPPER", "Personal Pronoun with Personal Pronoun"],
  ["URL", "URL", "Uniform Resource Locator"],
  ["VAPPER", "VAPPER", "Finite Auxiliary Verb with Personal Pronoun"],
  ["VMPPER", "VMPPER", "Finite Modal Verb with Personal Pronoun"],
  ["VVPPER", "VVPPER", "Finite Full Verb with Personal Pronoun"],
  ["AW", "AW", "Interaction Word"],
  ["ADR", "ADR", "Addressing Term"],
  ["AWIND", "AWIND", "Punctuation Indicating Addressing Term"],
  ["ERRAW", "ERRAW", "Part of Erroneously Separated Compound"]
  /*
    As KorAP currently doesn't support these tags, they could also be omitted
    ["_KOMMA", "_KOMMA", "Comma"],
    ["_SONST", "_SONST", "Intrasentential Punctuation Mark"],
    ["_ENDE", "_ENDE", "Punctuation Mark at the end of the Sentence"]
  */
]);

// Sort by tag (first element of each entry), in place
sgbrSttsArray.sort(function (a, b) {
  return a[0].localeCompare(b[0]);
});

/*
 * AMD module returning the annotation menu table.
 *
 * The returned object maps a key string to a list of entries. Each entry
 * is an array [label, text] or [label, text, description]. Keys chain:
 * the key of a sub-list is the parent key followed by the entry's text
 * (e.g. "-" lists "corenlp/", "corenlp/" lists "c=", and the tags for
 * that layer live under "corenlp/c="). "-" is the top-level list.
 *
 * In addition to the literal keys, one "corenlp/c=<node label>-" key is
 * generated per NEGRA node label, each pointing to the shared negraEdges
 * list.
 *
 * Lists defined outside this function (namedEntities, sttsArray,
 * negraNodes, negraEdges, mateSttsArray, sgbrSttsArray) are referenced,
 * not copied, so several keys share the same array instance.
 */
define(function () {
  var obj = {
    // NOTE(review): "dereko/s=" is offered here but this object defines
    // no "dereko/s=" list - confirm whether that is intended.
    "-" : [
      ["Base Annotation", "base/s=", "Structure"],
      // ["Connexor", "cnx/", "Constituency, Lemma, Morphology, Part-of-Speech, Syntax"],
      ["CoreNLP", "corenlp/", "Constituency, Named Entities, Part-of-Speech"],
      ["DeReKo", "dereko/s=", "Structure"],
      // ["Mate", "mate/", "Lemma, Morphology, Part-of-Speech"],
      ["Malt", "malt/", "Dependency"],
      ["OpenNLP", "opennlp/", "Part-of-Speech"],
      // ["Schreibgebrauch", "sgbr/", "Lemma, Lemma Variants, Part-of-Speech"],
      ["TreeTagger", "tt/", "Lemma, Part-of-Speech"],
      // ["Xerox Parser", "xip/", "Constituency, Lemma, Part-of-Speech"]
      ["MarMoT", "marmot/", "Morphology, Part-of-Speech"]
    ],
    "base/s=" : [
      ["s", "s", "Sentence"],
      ["p", "p", "Paragraph"],
      ["t", "t", "Text"]
    ],
    "corenlp/" : [
      ["Constituency", "c="],
      ["Named Entity", "ne=", "Combined"],
      ["Named Entity", "ne_dewac_175m_600=", "ne_dewac_175m_600"],
      ["Named Entity", "ne_hgc_175m_600=", "ne_hgc_175m_600"],
      ["Part-of-Speech", "p="]
    ],
    "corenlp/ne=" : namedEntities,
    "corenlp/ne_dewac_175m_600=" : namedEntities,
    "corenlp/ne_hgc_175m_600=" : namedEntities,
    "corenlp/p=" : sttsArray,
    "corenlp/c=" : negraNodes,
    "cnx/" : [
      ["Constituency", "c="],
      ["Lemma", "l="],
      ["Morphology", "m="],
      ["Part-of-Speech", "p="],
      ["Syntax", "syn="]
    ],
    "cnx/c=" : [
      ["np", "np ", "Nominal Phrase"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/morph.html
    "cnx/m=" : [
      ["Abbr", "Abbr ", "Nouns: Abbreviation"],
      ["CMP", "CMP ", "Adjective: Comparative"],
      ["IMP", "IMP ", "Mood: Imperative"],
      ["IND", "IND ", "Mood: Indicative"],
      ["INF", "INF ", "Infinitive"],
      ["ORD", "ORD ", "Numeral: Ordinal"],
      ["PAST", "PAST ", "Tense: past"],
      ["PCP", "PCP ", "Participle"],
      ["PERF", "PERF ", "Perfective Participle"],
      ["PL", "PL ", "Nouns: Plural"],
      ["PRES", "PRES ", "Tense: present"],
      ["PROG", "PROG ", "Progressive Participle"],
      ["Prop", "Prop ", "Nouns: Proper Noun"],
      ["SUB", "SUB ", "Mood: Subjunctive"],
      ["SUP", "SUP ", "Adjective: Superlative"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/morph.html
    "cnx/p=" : [
      ["A", "A ", "Adjective"],
      ["ADV", "ADV ", "Adverb"],
      ["CC", "CC ", "Coordination Marker"],
      ["CS", "CS ", "Clause Marker"],
      ["DET", "DET ", "Determiner"],
      ["INTERJ", "INTERJ ", "Interjection"],
      ["N", "N ", "Noun"],
      ["NUM", "NUM ", "Numeral"],
      ["PREP", "PREP ", "Preposition"],
      ["PRON", "PRON ", "Pro-Nominal"],
      ["V", "V ", "Verb"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/syntax.html
    "cnx/syn=" : [
      ["@ADVL", "@ADVL ", "Adverbial Head"],
      ["@AUX", "@AUX ", "Auxiliary Verb"],
      // The comma after this entry is required: without it the following
      // array literal is parsed as an index into this one.
      ["@CC", "@CC ", "Coordination"],
      ["@MAIN", "@MAIN ", "Main Verb"],
      ["@NH", "@NH ", "Nominal Head"],
      ["@POSTMOD", "@POSTMOD ", "Postmodifier"],
      ["@PREMARK", "@PREMARK ", "Preposed Marker"],
      ["@PREMOD", "@PREMOD ", "Premodifier"]
    ],
    "opennlp/" : [
      ["Part-of-Speech", "p="]
    ],
    "opennlp/p=" : sttsArray,
    "sgbr/" : [
      ["Lemma", "l="],
      ["Lemma Variants", "lv="],
      ["Part-of-Speech", "p="]
    ],
    "sgbr/p=" : sgbrSttsArray,
    "xip/" : [
      ["Constituency", "c="],
      // Inactive: ["Dependency", "d="],
      ["Lemma", "l="],
      ["Part-of-Speech", "p="]
    ],
    // "xip/c=" : [],
    // Inactive: "xip/d=" : [],
    // "xip/p=" : [],
    "tt/" : [
      ["Lemma", "l="],
      ["Part-of-Speech", "p="]
    ],
    "tt/p=" : sttsArray,
    "marmot/" : [
      ["Morphology", "m="],
      ["Part-of-Speech", "p="]
    ],
    "marmot/p=" : sttsArray,
    "malt/" : [
      ["Dependency", "d="]
    ],
    "mate/" : [
      // Inactive: "d" : ["d=", "Dependency"],
      ["Lemma", "l="],
      ["Morphology", "m="],
      ["Part-of-Speech", "p="]
    ],
    // Inactive: mate/d=
    "mate/p=" : mateSttsArray,
    "mate/m=" : [
      ["Case", "case:"],
      ["Degree", "degree:"],
      ["Gender", "gender:"],
      ["Mood", "mood:"],
      ["Number", "number:"],
      ["Person", "person:"],
      ["Tense", "tense:"],
      ["No type", "<no-type> "]
    ],
    "marmot/m=" : [
      ["Case", "case:"],
      ["Degree", "degree:"],
      ["Gender", "gender:"],
      ["Mood", "mood:"],
      ["Number", "number:"],
      ["Person", "person:"],
      ["Tense", "tense:"],
      ["No type", "<no-type> "]
    ],
    "mate/m=case:" : [
      ["acc", "acc ", "Accusative"],
      ["dat", "dat ", "Dative"],
      ["gen", "gen ", "Genitive"],
      ["nom", "nom ", "Nominative"],
      ["*", "* ", "Undefined"]
    ],
    "marmot/m=case:" : [
      ["acc", "acc ", "Accusative"],
      ["dat", "dat ", "Dative"],
      ["gen", "gen ", "Genitive"],
      ["nom", "nom ", "Nominative"],
      ["*", "* ", "Undefined"]
    ],
    "mate/m=degree:" : [
      ["comp", "comp ", "Comparative"],
      ["pos", "pos ", "Positive"],
      ["sup", "sup ", "Superlative"]
    ],
    "marmot/m=degree:" : [
      ["comp", "comp ", "Comparative"],
      ["pos", "pos ", "Positive"],
      ["sup", "sup ", "Superlative"]
    ],
    "mate/m=gender:" : [
      ["fem", "fem ", "Femininum"],
      ["masc", "masc ", "Masculinum"],
      ["neut", "neut ", "Neuter"],
      ["*", "* ", "Undefined"]
    ],
    "marmot/m=gender:" : [
      ["fem", "fem ", "Femininum"],
      ["masc", "masc ", "Masculinum"],
      ["neut", "neut ", "Neuter"],
      ["*", "* ", "Undefined"]
    ],
    "mate/m=mood:" : [
      ["imp", "imp ", "Imperative"],
      ["ind", "ind ", "Indicative"],
      ["subj", "subj ", "Subjunctive"]
    ],
    "marmot/m=mood:" : [
      ["imp", "imp ", "Imperative"],
      ["ind", "ind ", "Indicative"],
      ["subj", "subj ", "Subjunctive"]
    ],
    "mate/m=number:" : [
      ["pl", "pl ", "Plural"],
      ["sg", "sg ", "Singular"],
      ["*", "* ", "Undefined"]
    ],
    // Key must end in ":" to match the "number:" entry of "marmot/m="
    "marmot/m=number:" : [
      ["pl", "pl ", "Plural"],
      ["sg", "sg ", "Singular"],
      ["*", "* ", "Undefined"]
    ],
    "mate/m=person:" : [
      ["1", "1 ", "First Person"],
      ["2", "2 ", "Second Person"],
      ["3", "3 ", "Third Person"]
    ],
    "marmot/m=person:" : [
      ["1", "1 ", "First Person"],
      ["2", "2 ", "Second Person"],
      ["3", "3 ", "Third Person"]
    ],
    "mate/m=tense:" : [
      ["past", "past ", "Past"],
      ["pres", "pres ", "Present"]
    ],
    "marmot/m=tense:" : [
      ["past", "past ", "Past"],
      ["pres", "pres ", "Present"]
    ],
    "malt/d=" : [
      // The comma after this entry is required: without it the following
      // array literal is parsed as an index into this one.
      ["-PUNCT-", "-PUNCT- "],
      ["-UNKNOWN-", "-UNKNOWN- "],
      ["ADV", "ADV "],
      ["APP", "APP "],
      ["ATTR", "ATTR "],
      ["AUX", "AUX "],
      ["AVZ", "AVZ "],
      ["CJ", "CJ "],
      ["DET", "DET "],
      ["EXPL", "EXPL "],
      ["GMOD", "GMOD "],
      ["GRAD", "GRAD "],
      ["KOM", "KOM "],
      ["KON", "KON "],
      ["KONJ", "KONJ "],
      ["NEB", "NEB "],
      ["OBJA", "OBJA "],
      ["OBJC", "OBJC "],
      ["OBJD", "OBJD "],
      ["OBJG", "OBJG "],
      ["OBJI", "OBJI "],
      ["OBJP", "OBJP "],
      ["PAR", "PAR "],
      ["PART", "PART "],
      ["PN", "PN "],
      ["PP", "PP "],
      ["PRED", "PRED "],
      ["REL", "REL "],
      ["ROOT", "ROOT "],
      ["S", "S "],
      ["SUBJ", "SUBJ "],
      ["SUBJC", "SUBJC "],
      ["ZEIT", "ZEIT "],
      ["gmod-app", "gmod-app "],
      ["koord", "koord "]
    ]
  };

  // Every constituency node label can be followed by "-" and an edge
  // label. forEach visits only real array elements, unlike for...in,
  // which would also visit enumerable properties added to
  // Array.prototype.
  negraNodes.forEach(function (node) {
    obj["corenlp/c=" + node[0] + "-"] = negraEdges;
  });

  return obj;
});