blob: fcfe9a2ead16ca2d9fa50a7745ed14651b13ac9b [file] [log] [blame]
/*
var menuContent = [
  ['cnx/c', 'cnx', 'c'],
  ['mate/c', 'mate', 'c'],
  ['base/c', 'base', 'c'],
  ['xip/c', 'xip', 'c'],
  ['tt/c', 'tt', 'c']
];
*/

// Named-entity tags, referenced by the "corenlp/ne...=" keys of the map
// built in the define() call of this file.
// Every entry is a triple of
// [tag, tag followed by a single space, English description].
// NOTE(review): presumably [menu label, text to insert, description] for the
// hint menu - confirm against the consumer of this module.
var namedEntities = [
  ["I-LOC", "I-LOC ", "Location"],
  ["I-MISC", "I-MISC ", "Miscellaneous"],
  ["I-ORG", "I-ORG ", "Organization"],
  ["I-PER", "I-PER ", "Person"]
];

// http://www.ids-mannheim.de/cosmas2/projekt/referenz/stts/morph.html
// http://nachhalt.sfb632.uni-potsdam.de/owl-docu/stts.html
//
// Part-of-speech tags of the STTS tag set (see the references above).
// Every entry is a triple of
// [tag, tag followed by a single space, English description].
// The list is shared by several "<foundry>/p=" keys further down and is the
// base for mateSttsArray and sgbrSttsArray, which work on copies of it.
var sttsArray = [
  // "$.", "$(", "$,"
  ["ADJA", "ADJA ", "Attributive Adjective"],
  ["ADJD", "ADJD ", "Predicative Adjective"],
  ["ADV", "ADV ", "Adverb"],
  ["APPO", "APPO ", "Postposition"],
  ["APPR", "APPR ", "Preposition"],
  ["APPRART", "APPRART ", "Preposition with Determiner"],
  ["APZR", "APZR ", "Right Circumposition"],
  ["ART", "ART ", "Determiner"],
  ["CARD", "CARD ", "Cardinal Number"],
  ["FM", "FM ", "Foreign Material"],
  ["ITJ", "ITJ ", "Interjection"],
  ["KOKOM", "KOKOM ", "Comparison Particle"],
  ["KON", "KON ", "Coordinating Conjunction"],
  ["KOUI", "KOUI ", "Subordinating Conjunction with 'zu'"],
  ["KOUS", "KOUS ", "Subordinating Conjunction with Sentence"],
  ["NE", "NE ", "Named Entity"],
  ["NN", "NN ", "Normal Nomina"],
  ["PAV", "PAV ", "Pronominal Adverb"],
  ["PDAT", "PDAT ", "Attributive Demonstrative Pronoun"],
  ["PDS", "PDS ", "Substitutive Demonstrative Pronoun"],
  ["PIAT", "PIAT ", "Attributive Indefinite Pronoun without Determiner"],
  ["PIDAT", "PIDAT ", "Attributive Indefinite Pronoun with Determiner"],
  ["PIS", "PIS ", "Substitutive Indefinite Pronoun"],
  ["PPER", "PPER ", "Personal Pronoun"],
  ["PPOSAT", "PPOSAT ", "Attributive Possessive Pronoun"],
  ["PPOSS", "PPOSS ", "Substitutive Possessive Pronoun"],
  ["PRELAT", "PRELAT ", "Attributive Relative Pronoun"],
  ["PRELS", "PRELS ", "Substitutive Relative Pronoun"],
  ["PRF", "PRF ", "Reflexive Pronoun"],
  ["PROAV", "PROAV ", "Pronominal Adverb"],
  ["PTKA", "PTKA ", "Particle with Adjective"],
  ["PTKANT", "PTKANT ", "Answering Particle"],
  ["PTKNEG", "PTKNEG ", "Negation Particle"],
  ["PTKVZ", "PTKVZ ", "Separated Verbal Particle"],
  ["PTKZU", "PTKZU ", "'zu' Particle"],
  ["PWAT", "PWAT ", "Attributive Interrogative Pronoun"],
  ["PWAV", "PWAV ", "Adverbial Interrogative Pronoun"],
  ["PWS", "PWS ", "Substitutive Interrogative Pronoun"],
  ["TRUNC", "TRUNC ", "Truncated"],
  ["VAFIN", "VAFIN ", "Auxiliary Finite Verb"],
  ["VAIMP", "VAIMP ", "Auxiliary Finite Imperative Verb"],
  ["VAINF", "VAINF ", "Auxiliary Infinite Verb"],
  ["VAPP", "VAPP ", "Auxiliary Perfect Participle"],
  ["VMFIN", "VMFIN ", "Modal Finite Verb"],
  ["VMINF", "VMINF ", "Modal Infinite Verb"],
  ["VMPP", "VMPP ", "Modal Perfect Participle"],
  ["VVFIN", "VVFIN ", "Finite Verb"],
  ["VVIMP", "VVIMP ", "Finite Imperative Verb"],
  ["VVINF", "VVINF ", "Infinite Verb"],
  ["VVIZU", "VVIZU ", "Infinite Verb with 'zu'"],
  ["VVPP", "VVPP ", "Perfect Participle"],
  ["XY", "XY ", "Non-Word"]
];


// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/negra-corpus.html
// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/knoten.html
//
// Node (phrase category) labels of the NEGRA annotation scheme (see the
// references above). Every entry is a triple of
// [label, label, English description]; unlike the part-of-speech lists,
// the second element carries no trailing space.
var negraNodes = [
  ["AA", "AA", "superlative phrase with 'am'"],
  ["AP", "AP", "adjective phrase"],
  ["AVP", "AVP", "adverbial phrase"],
  ["CAP", "CAP", "coordinated adjective phrase"],
  ["CAVP", "CAVP", "coordinated adverbial phrase"],
  ["CAC", "CAC", "coordinated adposition"],
  ["CCP", "CCP", "coordinated complementiser"],
  ["CH", "CH", "chunk"],
  ["CNP", "CNP", "coordinated noun phrase"],
  ["CO", "CO", "coordination"],
  ["CPP", "CPP", "coordinated adpositional phrase"],
  ["CS", "CS", "coordinated sentence"],
  ["CVP", "CVP", "coordinated verb phrase (non-finite)"],
  ["CVZ", "CVZ", "coordinated zu-marked infinitive"],
  ["DL", "DL", "discourse level constituent"],
  ["ISU", "ISU", "idiosyncratic unit"],
  ["MPN", "MPN", "multi-word proper noun"],
  ["MTA", "MTA", "multi-token adjective"],
  ["NM", "NM", "multi-token number"],
  ["NP", "NP", "noun phrase"],
  ["PP", "PP", "adpositional phrase"],
  ["QL", "QL", "quasi-language"],
  ["ROOT", "ROOT", "root node"],
  ["S", "S", "sentence"],
  ["VP", "VP", "verb phrase (non-finite)"],
  ["VZ", "VZ", "zu-marked infinitive"]
];

// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/kanten.html
//
// Edge (grammatical function) labels of the NEGRA annotation scheme (see the
// reference above). Every entry is a triple of
// [label, label, English description].
// The define() call of this file offers this list after every
// "corenlp/c=<node>-" prefix.
var negraEdges = [
  ["AC", "AC", "adpositional case marker"],
  ["ADC", "ADC", "adjective component"],
  ["AMS", "AMS", "measure argument of adj"],
  ["APP", "APP", "apposition"],
  ["AVC", "AVC", "adverbial phrase component"],
  ["CC", "CC", "comparative complement"],
  ["CD", "CD", "coordinating conjunction"],
  ["CJ", "CJ", "conjunct"],
  ["CM", "CM", "comparative conjunction"],
  ["CP", "CP", "complementizer"],
  ["DA", "DA", "dative"],
  ["DH", "DH", "discourse-level head"],
  ["DM", "DM", "discourse marker"],
  ["GL", "GL", "prenominal genitive"],
  ["GR", "GR", "postnominal genitive"],
  ["HD", "HD", "head"],
  ["JU", "JU", "junctor"],
  ["MC", "MC", "comitative"],
  ["MI", "MI", "instrumental"],
  ["ML", "ML", "locative"],
  ["MNR", "MNR", "postnominal modifier"],
  ["MO", "MO", "modifier"],
  ["MR", "MR", "rhetorical modifier"],
  ["MW", "MW", "way (directional modifier)"],
  ["NG", "NG", "negation"],
  ["NK", "NK", "noun kernel modifier"],
  ["NMC", "NMC", "numerical component"],
  ["OA", "OA", "accusative object"],
  ["OA2", "OA2", "second accusative object"],
  ["OC", "OC", "clausal object"],
  ["OG", "OG", "genitive object"],
  ["PD", "PD", "predicate"],
  ["PG", "PG", "pseudo-genitive"],
  ["PH", "PH", "placeholder"],
  ["PM", "PM", "morphological particle"],
  ["PNC", "PNC", "proper noun component"],
  ["RC", "RC", "relative clause"],
  ["RE", "RE", "repeated element"],
  ["RS", "RS", "reported speech"],
  ["SB", "SB", "subject"],
  ["SBP", "SBP", "passivised subject (PP)"],
  ["SP", "SP", "subject or predicate"],
  ["SVP", "SVP", "separable verb prefix"],
  ["UC", "UC", "(idiosyncratic) unit component"],
  ["VO", "VO", "vocative"]
];

// Part-of-speech list used for the "mate/p=" key: the shared STTS list plus
// one additional root tag. slice(0) makes a shallow copy first, so the push
// below does not add the extra entry to sttsArray itself.
var mateSttsArray = sttsArray.slice(0);
mateSttsArray.push(
  ["<root-POS>", "<root-POS>", "Root Part of Speech"]
);

// Part-of-speech list used for the "sgbr/p=" key. It starts as a shallow
// copy of the shared STTS list, so the additions and the in-place sort below
// leave sttsArray itself untouched.
var sgbrSttsArray = sttsArray.slice(0);

// Push specific information for Schreibgebrauch
sgbrSttsArray.push(
  ["NNE", "NNE", "Normal Nomina with Named Entity"],
  ["ADVART", "ADVART", "Adverb with Article"],
  ["EMOASC", "EMOASC", "ASCII emoticon"],
  ["EMOIMG", "EMOIMG", "Graphic emoticon"],
  ["ERRTOK", "ERRTOK", "Tokenisation Error"],
  ["HST", "HST", "Hashtag"],
  ["KOUSPPER", "KOUSPPER", "Subordinating Conjunction (with Sentence) with Personal Pronoun"],
  ["ONO", "ONO", "Onomatopoeia"],
  ["PPERPPER", "PPERPPER", "Personal Pronoun with Personal Pronoun"],
  ["URL", "URL", "Uniform Resource Locator"],
  ["VAPPER", "VAPPER", "Finite Auxiliary Verb with Personal Pronoun"],
  ["VMPPER", "VMPPER", "Finite Modal Verb with Personal Pronoun"],
  ["VVPPER", "VVPPER", "Finite Full Verb with Personal Pronoun"],
  ["AW", "AW", "Interaction Word"],
  ["ADR", "ADR", "Addressing Term"],
  ["AWIND", "AWIND", "Punctuation Indicating Addressing Term"],
  ["ERRAW", "ERRAW", "Part of Erroneously Separated Compound"]
  /*
    As KorAP currently doesn't support these tags, they could also be omitted
    ["_KOMMA", "_KOMMA", "Comma"],
    ["_SONST", "_SONST", "Intrasentential Punctuation Mark"],
    ["_ENDE", "_ENDE", "Punctuation Mark at the end of the Sentence"]
  */
);

// Sort by tag, so the pushed entries are merged into the STTS entries
// instead of trailing them
sgbrSttsArray.sort(function (a, b) { return a[0].localeCompare(b[0]); });

/**
 * AMD module returning the annotation lookup table.
 *
 * The table maps a prefix string to a list of entries. Each entry is an
 * array of [label, text, description], where the description is optional.
 * Appending an entry's text to the prefix it is listed under yields the
 * prefix of the follow-up list, if there is one: "-" lists "corenlp/",
 * "corenlp/" lists "ne=", and "corenlp/ne=" lists the named-entity tags.
 * Texts that end in a space have no follow-up list.
 *
 * NOTE(review): presumably consumed by the hint menu, which offers the
 * labels and inserts the texts into the query - confirm against the caller.
 *
 * Relies on the file-level lists namedEntities, sttsArray, mateSttsArray,
 * sgbrSttsArray, negraNodes and negraEdges.
 *
 * @returns {Object} the lookup table described above
 */
define(function () {

  // "mate/" and "marmot/" offer the same morphological features and values.
  // Each list exists once and is referenced from both foundries, the same
  // way sttsArray is shared between the "<foundry>/p=" keys.
  var morphFeatures = [
    ["Case", "case:"],
    ["Degree", "degree:"],
    ["Gender", "gender:"],
    ["Mood", "mood:"],
    ["Number", "number:"],
    ["Person", "person:"],
    ["Tense", "tense:"],
    ["No type", "<no-type> "]
  ];
  var morphCase = [
    ["acc", "acc ", "Accusative"],
    ["dat", "dat ", "Dative"],
    ["gen", "gen ", "Genitive"],
    ["nom", "nom ", "Nominative"],
    ["*", "* ", "Undefined"]
  ];
  var morphDegree = [
    ["comp", "comp ", "Comparative"],
    ["pos", "pos ", "Positive"],
    ["sup", "sup ", "Superlative"]
  ];
  var morphGender = [
    ["fem", "fem ", "Femininum"],
    ["masc", "masc ", "Masculinum"],
    ["neut", "neut ", "Neuter"],
    ["*", "* ", "Undefined"]
  ];
  var morphMood = [
    ["imp", "imp ", "Imperative"],
    ["ind", "ind ", "Indicative"],
    ["subj", "subj ", "Subjunctive"]
  ];
  var morphNumber = [
    ["pl", "pl ", "Plural"],
    ["sg", "sg ", "Singular"],
    ["*", "* ", "Undefined"]
  ];
  var morphPerson = [
    ["1", "1 ", "First Person"],
    ["2", "2 ", "Second Person"],
    ["3", "3 ", "Third Person"]
  ];
  var morphTense = [
    ["past", "past ", "Past"],
    ["pres", "pres ", "Present"]
  ];

  var obj = {
    // Top level: the available foundries
    "-" : [
      ["Base Annotation", "base/s=", "Structure"],
      // ["Connexor", "cnx/", "Constituency, Lemma, Morphology, Part-of-Speech, Syntax"],
      ["CoreNLP", "corenlp/", "Constituency, Named Entities, Part-of-Speech"],
      ["DeReKo", "dereko/s=", "Structure"],
      ["DRuKoLa", "drukola/", "Lemma, Morphology, Part-of-Speech"],
      // ["Mate", "mate/", "Lemma, Morphology, Part-of-Speech"],
      ["Malt", "malt/", "Dependency"],
      ["OpenNLP", "opennlp/", "Part-of-Speech"],
      // ["Schreibgebrauch", "sgbr/", "Lemma, Lemma Variants, Part-of-Speech"],
      ["TreeTagger", "tt/", "Lemma, Part-of-Speech"],
      // ["Xerox Parser", "xip/", "Constituency, Lemma, Part-of-Speech"]
      ["MarMoT", "marmot/", "Morphology, Part-of-Speech"]
    ],
    "base/s=" : [
      ["s", "s", "Sentence"],
      ["p", "p", "Paragraph"],
      ["t", "t", "Text"]
    ],
    "corenlp/" : [
      ["Constituency", "c="],
      ["Named Entity", "ne=", "Combined"],
      ["Named Entity", "ne_dewac_175m_600=", "ne_dewac_175m_600"],
      ["Named Entity", "ne_hgc_175m_600=", "ne_hgc_175m_600"],
      ["Part-of-Speech", "p="]
    ],
    "corenlp/ne=" : namedEntities,
    "corenlp/ne_dewac_175m_600=" : namedEntities,
    "corenlp/ne_hgc_175m_600=" : namedEntities,
    "corenlp/p=" : sttsArray,
    "corenlp/c=" : negraNodes,
    "cnx/" : [
      ["Constituency", "c="],
      ["Lemma", "l="],
      ["Morphology", "m="],
      ["Part-of-Speech", "p="],
      ["Syntax", "syn="]
    ],
    "cnx/c=" : [
      ["np", "np ", "Nominal Phrase"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/morph.html
    "cnx/m=" : [
      ["Abbr", "Abbr ", "Nouns: Abbreviation"],
      ["CMP", "CMP ", "Adjective: Comparative"],
      ["IMP", "IMP ", "Mood: Imperative"],
      ["IND", "IND ", "Mood: Indicative"],
      ["INF", "INF ", "Infinitive"],
      ["ORD", "ORD ", "Numeral: Ordinal"],
      ["PAST", "PAST ", "Tense: past"],
      ["PCP", "PCP ", "Participle"],
      ["PERF", "PERF ", "Perfective Participle"],
      ["PL", "PL ", "Nouns: Plural"],
      ["PRES", "PRES ", "Tense: present"],
      ["PROG", "PROG ", "Progressive Participle"],
      ["Prop", "Prop ", "Nouns: Proper Noun"],
      ["SUB", "SUB ", "Mood: Subjunctive"],
      ["SUP", "SUP ", "Adjective: Superlative"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/morph.html
    "cnx/p=" : [
      ["A", "A ", "Adjective"],
      ["ADV", "ADV ", "Adverb"],
      ["CC", "CC ", "Coordination Marker"],
      ["CS", "CS ", "Clause Marker"],
      ["DET", "DET ", "Determiner"],
      ["INTERJ", "INTERJ ", "Interjection"],
      ["N", "N ", "Noun"],
      ["NUM", "NUM ", "Numeral"],
      ["PREP", "PREP ", "Preposition"],
      ["PRON", "PRON ", "Pro-Nominal"],
      ["V", "V ", "Verb"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/syntax.html
    "cnx/syn=" : [
      ["@ADVL", "@ADVL ", "Adverbial Head"],
      ["@AUX", "@AUX ", "Auxiliary Verb"],
      ["@CC", "@CC ", "Coordination"],
      ["@MAIN", "@MAIN ", "Main Verb"],
      ["@NH", "@NH ", "Nominal Head"],
      ["@POSTMOD", "@POSTMOD ", "Postmodifier"],
      ["@PREMARK", "@PREMARK ", "Preposed Marker"],
      ["@PREMOD", "@PREMOD ", "Premodifier"]
    ],
    "drukola/" : [
      ["Lemma", "l="],
      ["Morphology", "m="],
      ["Part-of-Speech", "p="]
    ],
    "opennlp/" : [
      ["Part-of-Speech", "p="]
    ],
    "opennlp/p=" : sttsArray,
    "sgbr/" : [
      ["Lemma", "l="],
      ["Lemma Variants", "lv="],
      ["Part-of-Speech", "p="]
    ],
    "sgbr/p=" : sgbrSttsArray,
    "xip/" : [
      ["Constituency", "c="],
      // Inactive: ["Dependency", "d="],
      ["Lemma", "l="],
      ["Part-of-Speech", "p="]
    ],
    // "xip/c=" : [],
    // Inactive: "xip/d=" : [],
    // "xip/p=" : [],
    "tt/" : [
      ["Lemma", "l="],
      ["Part-of-Speech", "p="]
    ],
    "tt/p=" : sttsArray,
    "marmot/" : [
      ["Morphology", "m="],
      ["Part-of-Speech", "p="]
    ],
    "marmot/p=" : sttsArray,
    "malt/" : [
      ["Dependency", "d="]
    ],
    "mate/" : [
      // Inactive: "d" : ["d=", "Dependency"],
      ["Lemma", "l="],
      ["Morphology", "m="],
      ["Part-of-Speech", "p="]
    ],
    // Inactive: mate/d=
    "mate/p=" : mateSttsArray,
    "mate/m=" : morphFeatures,
    "marmot/m=" : morphFeatures,
    "mate/m=case:" : morphCase,
    "marmot/m=case:" : morphCase,
    "mate/m=degree:" : morphDegree,
    "marmot/m=degree:" : morphDegree,
    "mate/m=gender:" : morphGender,
    "marmot/m=gender:" : morphGender,
    "mate/m=mood:" : morphMood,
    "marmot/m=mood:" : morphMood,
    "mate/m=number:" : morphNumber,
    // The key needs the trailing colon: it is reached by appending the
    // "number:" text of the feature list to "marmot/m="
    "marmot/m=number:" : morphNumber,
    "mate/m=person:" : morphPerson,
    "marmot/m=person:" : morphPerson,
    "mate/m=tense:" : morphTense,
    "marmot/m=tense:" : morphTense,
    "malt/d=" : [
      ["-PUNCT-", "-PUNCT- "],
      ["-UNKNOWN-", "-UNKNOWN- "],
      ["ADV", "ADV "],
      ["APP", "APP "],
      ["ATTR", "ATTR "],
      ["AUX", "AUX "],
      ["AVZ", "AVZ "],
      ["CJ", "CJ "],
      ["DET", "DET "],
      ["EXPL", "EXPL "],
      ["GMOD", "GMOD "],
      ["GRAD", "GRAD "],
      ["KOM", "KOM "],
      ["KON", "KON "],
      ["KONJ", "KONJ "],
      ["NEB", "NEB "],
      ["OBJA", "OBJA "],
      ["OBJC", "OBJC "],
      ["OBJD", "OBJD "],
      ["OBJG", "OBJG "],
      ["OBJI", "OBJI "],
      ["OBJP", "OBJP "],
      ["PAR", "PAR "],
      ["PART", "PART "],
      ["PN", "PN "],
      ["PP", "PP "],
      ["PRED", "PRED "],
      ["REL", "REL "],
      ["ROOT", "ROOT "],
      ["S", "S "],
      ["SUBJ", "SUBJ "],
      ["SUBJC", "SUBJC "],
      ["ZEIT", "ZEIT "],
      ["gmod-app", "gmod-app "],
      ["koord", "koord "]
    ]
  };

  // After every constituency node ("corenlp/c=NP-", ...) offer the edge
  // labels. forEach visits the array elements only, whereas for...in would
  // also visit any enumerable property added to Array.prototype.
  negraNodes.forEach(function (node) {
    obj["corenlp/c=" + node[0] + '-'] = negraEdges;
  });

  return obj;
});