blob: 822d658d3ee584f64463552c946c6ff6a8cf8bdd [file] [log] [blame]
/*
var menuContent = [
  ['cnx/c', 'cnx', 'c'],
  ['mate/c', 'mate', 'c'],
  ['base/c', 'base', 'c'],
  ['xip/c', 'xip', 'c'],
  ['tt/c', 'tt', 'c']
];
*/
Nils Diewald023c6712015-05-21 20:12:30 +000010
// Named-entity tags. Every entry has the form
// [tag, tag followed by a single space, description],
// where the tag is "I-" plus the short class name given below.
var namedEntities = [
  ["LOC", "Location"],
  ["MISC", "Miscellaneous"],
  ["ORG", "Organization"],
  ["PER", "Person"]
].map(function (pair) {
  var tag = "I-" + pair[0];
  return [tag, tag + " ", pair[1]];
});
17
// STTS part-of-speech tags. References:
// http://www.ids-mannheim.de/cosmas2/projekt/referenz/stts/morph.html
// http://nachhalt.sfb632.uni-potsdam.de/owl-docu/stts.html
//
// Every entry has the form [tag, tag followed by a single space, description].
// The punctuation tags "$.", "$(" and "$," are not part of the list.
var sttsArray = [
  ["ADJA", "ADJA ", "Attributive Adjective"],
  ["ADJD", "ADJD ", "Predicative Adjective"],
  ["ADV", "ADV ", "Adverb"],
  ["APPO", "APPO ", "Postposition"],
  ["APPR", "APPR ", "Preposition"],
  ["APPRART", "APPRART ", "Preposition with Determiner"],
  ["APZR", "APZR ", "Right Circumposition"],
  ["ART", "ART ", "Determiner"],
  ["CARD", "CARD ", "Cardinal Number"],
  ["FM", "FM ", "Foreign Material"],
  ["ITJ", "ITJ ", "Interjection"],
  ["KOKOM", "KOKOM ", "Comparison Particle"],
  ["KON", "KON ", "Coordinating Conjunction"],
  ["KOUI", "KOUI ", "Subordinating Conjunction with 'zu'"],
  ["KOUS", "KOUS ", "Subordinating Conjunction with Sentence"],
  ["NE", "NE ", "Named Entity"],
  ["NN", "NN ", "Normal Nomina"],
  ["PAV", "PAV ", "Pronominal Adverb"],
  ["PDAT", "PDAT ", "Attributive Demonstrative Pronoun"],
  ["PDS", "PDS ", "Substitutive Demonstrative Pronoun"],
  ["PIAT", "PIAT ", "Attributive Indefinite Pronoun without Determiner"],
  ["PIDAT", "PIDAT ", "Attributive Indefinite Pronoun with Determiner"],
  ["PIS", "PIS ", "Substitutive Indefinite Pronoun"],
  ["PPER", "PPER ", "Personal Pronoun"],
  ["PPOSAT", "PPOSAT ", "Attributive Possessive Pronoun"],
  ["PPOSS", "PPOSS ", "Substitutive Possessive Pronoun"],
  ["PRELAT", "PRELAT ", "Attributive Relative Pronoun"],
  ["PRELS", "PRELS ", "Substitutive Relative Pronoun"],
  ["PRF", "PRF ", "Reflexive Pronoun"],
  ["PROAV", "PROAV ", "Pronominal Adverb"],
  ["PTKA", "PTKA ", "Particle with Adjective"],
  ["PTKANT", "PTKANT ", "Answering Particle"],
  ["PTKNEG", "PTKNEG ", "Negation Particle"],
  ["PTKVZ", "PTKVZ ", "Separated Verbal Particle"],
  ["PTKZU", "PTKZU ", "'zu' Particle"],
  ["PWAT", "PWAT ", "Attributive Interrogative Pronoun"],
  ["PWAV", "PWAV ", "Adverbial Interrogative Pronoun"],
  ["PWS", "PWS ", "Substitutive Interrogative Pronoun"],
  ["TRUNC", "TRUNC ", "Truncated"],
  ["VAFIN", "VAFIN ", "Auxiliary Finite Verb"],
  ["VAIMP", "VAIMP ", "Auxiliary Finite Imperative Verb"],
  ["VAINF", "VAINF ", "Auxiliary Infinite Verb"],
  ["VAPP", "VAPP ", "Auxiliary Perfect Participle"],
  ["VMFIN", "VMFIN ", "Modal Finite Verb"],
  ["VMINF", "VMINF ", "Modal Infinite Verb"],
  ["VMPP", "VMPP ", "Modal Perfect Participle"],
  ["VVFIN", "VVFIN ", "Finite Verb"],
  ["VVIMP", "VVIMP ", "Finite Imperative Verb"],
  ["VVINF", "VVINF ", "Infinite Verb"],
  ["VVIZU", "VVIZU ", "Infinite Verb with 'zu'"],
  ["VVPP", "VVPP ", "Perfect Participle"],
  ["XY", "XY ", "Non-Word"]
];
75
Akroncff9bac2016-01-25 21:39:38 +010076
// NEGRA node (phrase category) labels. References:
// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/negra-corpus.html
// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/knoten.html
//
// Every entry has the form [label, label, description]; unlike the
// part-of-speech lists, the second element has no trailing space.
var negraNodes = [
  ["AA", "AA", "superlative phrase with 'am'"],
  ["AP", "AP", "adjective phrase"],
  ["AVP", "AVP", "adverbial phrase"],
  ["CAP", "CAP", "coordinated adjective phrase"],
  ["CAVP", "CAVP", "coordinated adverbial phrase"],
  ["CAC", "CAC", "coordinated adposition"],
  ["CCP", "CCP", "coordinated complementiser"],
  ["CH", "CH", "chunk"],
  ["CNP", "CNP", "coordinated noun phrase"],
  ["CO", "CO", "coordination"],
  ["CPP", "CPP", "coordinated adpositional phrase"],
  ["CS", "CS", "coordinated sentence"],
  ["CVP", "CVP", "coordinated verb phrase (non-finite)"],
  ["CVZ", "CVZ", "coordinated zu-marked infinitive"],
  ["DL", "DL", "discourse level constituent"],
  ["ISU", "ISU", "idiosyncratic unit"],
  ["MPN", "MPN", "multi-word proper noun"],
  ["MTA", "MTA", "multi-token adjective"],
  ["NM", "NM", "multi-token number"],
  ["NP", "NP", "noun phrase"],
  ["PP", "PP", "adpositional phrase"],
  ["QL", "QL", "quasi-language"],
  ["ROOT", "ROOT", "root node"],
  ["S", "S", "sentence"],
  ["VP", "VP", "verb phrase (non-finite)"],
  ["VZ", "VZ", "zu-marked infinitive"]
];
107
// NEGRA edge (grammatical function) labels. Reference:
// http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/kanten.html
//
// Every entry has the form [label, label, description].
var negraEdges = [
  ["AC", "AC", "adpositional case marker"],
  ["ADC", "ADC", "adjective component"],
  ["AMS", "AMS", "measure argument of adj"],
  ["APP", "APP", "apposition"],
  ["AVC", "AVC", "adverbial phrase component"],
  ["CC", "CC", "comparative complement"],
  ["CD", "CD", "coordinating conjunction"],
  ["CJ", "CJ", "conjunct"],
  ["CM", "CM", "comparative conjunction"],
  ["CP", "CP", "complementizer"],
  ["DA", "DA", "dative"],
  ["DH", "DH", "discourse-level head"],
  ["DM", "DM", "discourse marker"],
  ["GL", "GL", "prenominal genitive"],
  ["GR", "GR", "postnominal genitive"],
  ["HD", "HD", "head"],
  ["JU", "JU", "junctor"],
  ["MC", "MC", "comitative"],
  ["MI", "MI", "instrumental"],
  ["ML", "ML", "locative"],
  ["MNR", "MNR", "postnominal modifier"],
  ["MO", "MO", "modifier"],
  ["MR", "MR", "rhetorical modifier"],
  ["MW", "MW", "way (directional modifier)"],
  ["NG", "NG", "negation"],
  ["NK", "NK", "noun kernel modifier"],
  ["NMC", "NMC", "numerical component"],
  ["OA", "OA", "accusative object"],
  ["OA2", "OA2", "second accusative object"],
  ["OC", "OC", "clausal object"],
  ["OG", "OG", "genitive object"],
  ["PD", "PD", "predicate"],
  ["PG", "PG", "pseudo-genitive"],
  ["PH", "PH", "placeholder"],
  ["PM", "PM", "morphological particle"],
  ["PNC", "PNC", "proper noun component"],
  ["RC", "RC", "relative clause"],
  ["RE", "RE", "repeated element"],
  ["RS", "RS", "reported speech"],
  ["SB", "SB", "subject"],
  ["SBP", "SBP", "passivised subject (PP)"],
  ["SP", "SP", "subject or predicate"],
  ["SVP", "SVP", "separable verb prefix"],
  ["UC", "UC", "(idiosyncratic) unit component"],
  ["VO", "VO", "vocative"]
];
156
// Tag list for Mate: a new array holding every sttsArray entry followed by
// the additional root tag. sttsArray itself is not modified.
var mateSttsArray = sttsArray.concat([
  ["<root-POS>", "<root-POS>", "Root Part of Speech"]
]);
161
// Tag list for Schreibgebrauch: starts as a shallow copy of sttsArray (so the
// shared list is left untouched), is extended with the tags below and is
// finally sorted by tag.
var sgbrSttsArray = sttsArray.slice(0);

// Push specific information for Schreibgebrauch
// NOTE(review): unlike the entries copied from sttsArray, the second element
// of these entries has no trailing space - confirm that this is intended.
sgbrSttsArray.push(
  ["NNE", "NNE", "Normal Nomina with Named Entity"],
  ["ADVART", "ADVART", "Adverb with Article"],
  ["EMOASC", "EMOASC", "ASCII emoticon"],
  ["EMOIMG", "EMOIMG", "Graphic emoticon"],
  ["ERRTOK", "ERRTOK", "Tokenisation Error"],
  ["HST", "HST", "Hashtag"],
  ["KOUSPPER", "KOUSPPER", "Subordinating Conjunction (with Sentence) with Personal Pronoun"],
  ["ONO", "ONO", "Onomatopoeia"],
  ["PPERPPER", "PPERPPER", "Personal Pronoun with Personal Pronoun"],
  ["URL", "URL", "Uniform Resource Locator"],
  ["VAPPER", "VAPPER", "Finite Auxiliary Verb with Personal Pronoun"],
  ["VMPPER", "VMPPER", "Finite Modal Verb with Personal Pronoun"],
  ["VVPPER", "VVPPER", "Finite Full Verb with Personal Pronoun"],
  ["AW", "AW", "Interaction Word"],
  ["ADR", "ADR", "Addressing Term"],
  ["AWIND", "AWIND", "Punctuation Indicating Addressing Term"],
  ["ERRAW", "ERRAW", "Part of Erroneously Separated Compound"]
  /*
    As KorAP currently doesn't support these tags, they could also be omitted
    ["_KOMMA", "_KOMMA", "Comma"],
    ["_SONST", "_SONST", "Intrasentential Punctuation Mark"],
    ["_ENDE", "_ENDE", "Punctuation Mark at the end of the Sentence"]
  */
);

// Sort by tag
sgbrSttsArray.sort(function (a, b) {
  return a[0].localeCompare(b[0]);
});
Akroncff9bac2016-01-25 21:39:38 +0100193
/**
 * AMD module that returns a lookup object of annotation lists.
 *
 * Each key is a prefix string ("-" for the top level, otherwise e.g.
 * "corenlp/", "corenlp/p=" or "mate/m=case:"). Each value is an array of
 * entries; an entry is an array of two or three strings. The second string
 * of an entry, appended to the key it is listed under, forms the key of the
 * next level where one exists (e.g. "corenlp/" + "p=" -> "corenlp/p=").
 * NOTE(review): the entries look like [label, text to insert, description] -
 * confirm against the code that consumes this module.
 *
 * Several keys share one array instance (e.g. sttsArray is used for
 * "corenlp/p=", "opennlp/p=" and "tt/p="), so consumers must not mutate
 * the returned lists.
 *
 * @returns {Object} the lookup object described above
 */
define(function () {
  var obj = {
    "-": [
      ["Base Annotation", "base/s=", "Structure"],
      ["Connexor", "cnx/", "Constituency, Lemma, Morphology, Part-of-Speech, Syntax"],
      ["CoreNLP", "corenlp/", "Constituency, Named Entities, Part-of-Speech"],
      ["DeReKo", "dereko/s=", "Structure"],
      ["Mate", "mate/", "Lemma, Morphology, Part-of-Speech"],
      ["OpenNLP", "opennlp/", "Part-of-Speech"],
      ["Schreibgebrauch", "sgbr/", "Lemma, Lemma Variants, Part-of-Speech"],
      ["TreeTagger", "tt/", "Lemma, Part-of-Speech"],
      ["Xerox Parser", "xip/", "Constituency, Lemma, Part-of-Speech"]
    ],
    "base/s=": [
      ["s", "s", "Sentence"],
      ["p", "p", "Paragraph"],
      ["t", "t", "Text"]
    ],
    "corenlp/": [
      ["Constituency", "c="],
      ["Named Entity", "ne=", "Combined"],
      ["Named Entity", "ne_dewac_175m_600=", "ne_dewac_175m_600"],
      ["Named Entity", "ne_hgc_175m_600=", "ne_hgc_175m_600"],
      ["Part-of-Speech", "p="]
    ],
    "corenlp/ne=": namedEntities,
    "corenlp/ne_dewac_175m_600=": namedEntities,
    "corenlp/ne_hgc_175m_600=": namedEntities,
    "corenlp/p=": sttsArray,
    "corenlp/c=": negraNodes,
    "cnx/": [
      ["Constituency", "c="],
      ["Lemma", "l="],
      ["Morphology", "m="],
      ["Part-of-Speech", "p="],
      ["Syntax", "syn="]
    ],
    "cnx/c=": [
      ["np", "np ", "Nominal Phrase"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/morph.html
    "cnx/m=": [
      ["Abbr", "Abbr ", "Nouns: Abbreviation"],
      ["CMP", "CMP ", "Adjective: Comparative"],
      ["IMP", "IMP ", "Mood: Imperative"],
      ["IND", "IND ", "Mood: Indicative"],
      ["INF", "INF ", "Infinitive"],
      ["ORD", "ORD ", "Numeral: Ordinal"],
      ["PAST", "PAST ", "Tense: past"],
      ["PCP", "PCP ", "Participle"],
      ["PERF", "PERF ", "Perfective Participle"],
      ["PL", "PL ", "Nouns: Plural"],
      ["PRES", "PRES ", "Tense: present"],
      ["PROG", "PROG ", "Progressive Participle"],
      ["Prop", "Prop ", "Nouns: Proper Noun"],
      ["SUB", "SUB ", "Mood: Subjunctive"],
      ["SUP", "SUP ", "Adjective: Superlative"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/morph.html
    "cnx/p=": [
      ["A", "A ", "Adjective"],
      ["ADV", "ADV ", "Adverb"],
      ["CC", "CC ", "Coordination Marker"],
      ["CS", "CS ", "Clause Marker"],
      ["DET", "DET ", "Determiner"],
      ["INTERJ", "INTERJ ", "Interjection"],
      ["N", "N ", "Noun"],
      ["NUM", "NUM ", "Numeral"],
      ["PREP", "PREP ", "Preposition"],
      ["PRON", "PRON ", "Pro-Nominal"],
      ["V", "V ", "Verb"]
    ],
    // http://www.ids-mannheim.de/cosmas2/projekt/referenz/connexor/syntax.html
    "cnx/syn=": [
      ["@ADVL", "@ADVL ", "Adverbial Head"],
      ["@AUX", "@AUX ", "Auxiliary Verb"],
      // The comma after this entry is required: without it the next array
      // literal is parsed as a property access on this one.
      ["@CC", "@CC ", "Coordination"],
      ["@MAIN", "@MAIN ", "Main Verb"],
      ["@NH", "@NH ", "Nominal Head"],
      ["@POSTMOD", "@POSTMOD ", "Postmodifier"],
      ["@PREMARK", "@PREMARK ", "Preposed Marker"],
      ["@PREMOD", "@PREMOD ", "Premodifier"]
    ],
    "opennlp/": [
      ["Part-of-Speech", "p="]
    ],
    "opennlp/p=": sttsArray,
    "sgbr/": [
      ["Lemma", "l="],
      ["Lemma Variants", "lv="],
      ["Part-of-Speech", "p="]
    ],
    "sgbr/p=": sgbrSttsArray,
    "xip/": [
      ["Constituency", "c="],
      // Inactive: ["Dependency", "d="],
      ["Lemma", "l="],
      ["Part-of-Speech", "p="]
    ],
    // "xip/c=" : [],
    // Inactive: "xip/d=" : [],
    // "xip/p=" : [],
    "tt/": [
      ["Lemma", "l="],
      ["Part-of-Speech", "p="]
    ],
    "tt/p=": sttsArray,
    "mate/": [
      // Inactive: "d" : ["d=", "Dependency"],
      ["Lemma", "l="],
      ["Morphology", "m="],
      ["Part-of-Speech", "p="]
    ],
    // Inactive: mate/d=
    "mate/p=": mateSttsArray,
    "mate/m=": [
      ["Case", "case:"],
      ["Degree", "degree:"],
      ["Gender", "gender:"],
      ["Mood", "mood:"],
      ["Number", "number:"],
      ["Person", "person:"],
      ["Tense", "tense:"],
      ["No type", "<no-type> "]
    ],
    "mate/m=case:": [
      ["acc", "acc ", "Accusative"],
      ["dat", "dat ", "Dative"],
      ["gen", "gen ", "Genitive"],
      ["nom", "nom ", "Nominative"],
      ["*", "* ", "Undefined"]
    ],
    "mate/m=degree:": [
      ["comp", "comp ", "Comparative"],
      ["pos", "pos ", "Positive"],
      ["sup", "sup ", "Superlative"]
    ],
    "mate/m=gender:": [
      ["fem", "fem ", "Femininum"],
      ["masc", "masc ", "Masculinum"],
      ["neut", "neut ", "Neuter"],
      ["*", "* ", "Undefined"]
    ],
    "mate/m=mood:": [
      ["imp", "imp ", "Imperative"],
      ["ind", "ind ", "Indicative"],
      ["subj", "subj ", "Subjunctive"]
    ],
    "mate/m=number:": [
      ["pl", "pl ", "Plural"],
      ["sg", "sg ", "Singular"],
      ["*", "* ", "Undefined"]
    ],
    "mate/m=person:": [
      ["1", "1 ", "First Person"],
      ["2", "2 ", "Second Person"],
      ["3", "3 ", "Third Person"]
    ],
    "mate/m=tense:": [
      ["past", "past ", "Past"],
      ["pres", "pres ", "Present"]
    ]
  };

  // For every node label register the edge labels under the key
  // "corenlp/c=<label>-". An index loop is used instead of for...in so that
  // only the array elements are visited, never other enumerable properties.
  for (var i = 0; i < negraNodes.length; i++) {
    obj["corenlp/c=" + negraNodes[i][0] + "-"] = negraEdges;
  }

  return obj;
});