blob: 31d3bc46e2ad26bfb6a37da3fd1c5d741fec43c5 [file] [log] [blame]
banspc3cdcb92022-03-09 03:25:32 +01001<!-- IDS-XCES v1.0 -->
2<!-- -->
3<!-- $Id: ids.xcesdoc.dtd 44 2009-02-20 11:01:28Z kupietz $ -->
4<!-- -->
5<!-- based on: -->
6<!-- -->
7<!-- Corpus Encoding Standard -->
8<!-- -->
9<!-- CES -->
10<!-- -->
11<!-- Encoding conventions for level 1 -->
12<!-- -->
13<!-- -->
14<!-- -->
15<!--
16
17 -->
18<!-- -->
19<!-- ENTITY DECLARATIONS -->
20<!-- -->
21
22
23
24
25<!-- Global attributes -->
26
<!-- a.global: attribute definitions spliced into the ATTLISTs of this DTD.
     Declares id (ID), n (CDATA), xml:lang (CDATA) and lang (IDREF);
     all four are optional (#IMPLIED). -->
27<!ENTITY % a.global '
28 id ID #IMPLIED
29 n CDATA #IMPLIED
30 xml:lang CDATA #IMPLIED
31 lang IDREF #IMPLIED' >
32
<!-- a.text: everything in a.global plus the optional CDATA attributes
     rend and wsd. Referenced by the ATTLISTs of back, body, div and the
     elements declared after them in this file. -->
33<!ENTITY % a.text '%a.global;
34 rend CDATA #IMPLIED
35 wsd CDATA #IMPLIED' >
36
37
38<!-- Elements that can appear between paragraphs -->
39
<!-- m.inter: a bare alternation fragment (no enclosing parentheses) naming
     bibl, quote, list, poem, note, caption, figure and table. It is spliced
     into the content models of par.seq, div, figure and caption. -->
40<!ENTITY % m.inter ' bibl | quote | list |
41 poem | note | caption | figure | table ' >
42
43
44<!-- Sub-paragraph elements -->
45
<!-- x.token: extension hook, empty by default. It is spliced directly in
     front of an element name in m.token and base.seq, so any non-empty
     replacement text has to end with a "|" separator. -->
46<!ENTITY % x.token '' >
47
<!-- m.token: token-level element names. The literal ends with a trailing
     "|" because m.phrase continues the alternation immediately after
     %m.token; the fragment is therefore not usable on its own. -->
48<!ENTITY % m.token '%x.token; abbr | date | num |
49 dateRange | numRange | timeRange |
50 measure | name | term | time | w |' >
51
<!-- m.phrase: m.token plus the remaining phrase-level element names.
     NOTE(review): xref is listed here but no ELEMENT declaration for it is
     visible in this file; presumably it comes from one of the included
     entity files. Confirm. -->
52<!ENTITY % m.phrase '%m.token; corr | distinct | foreign |
53 gap | hi | list | mentioned | orig | q |
54 ref | reg | s | stage | title | table | xref' >
55
56
<!-- base.seq: restricted mixed-content fragment: character data plus
     x.token, num, numRange, abbr and hi. -->
57<!ENTITY % base.seq '#PCDATA | %x.token; num | numRange | abbr | hi' >
58
<!-- phrase.seq: full mixed-content fragment: character data plus every
     name in m.phrase. Both *.seq fragments start with #PCDATA, so they must
     be the first item of the content models that use them. -->
59<!ENTITY % phrase.seq '#PCDATA | %m.phrase;' >
60
61
62
<!-- par.seq: a complete, parenthesised and repeatable group (zero or more
     of p, sp or any m.inter element). Used as the leading part of the back
     and body content models. -->
63<!ENTITY % par.seq '(p | sp | %m.inter;)*' >
64
65
66
67<!-- Entities copied here from header.elt -->
68
<!-- a.header: plain alias for a.global.
     NOTE(review): not referenced by any declaration visible in this file;
     presumably consumed by the header declarations included through
     ids.header. Confirm. -->
69<!ENTITY % a.header '%a.global;' >
70
<!-- a.declarable: a single attribute, Default, with the values y or n and
     the default "n". Spliced into the bibl ATTLIST. -->
71<!ENTITY % a.declarable '
72 Default (y | n) "n"' >
73
74
<!-- Declares the external parameter entity ids.customization (system
     identifier ids.xcustomize.ent) and includes it at this point.
     ids.state.elem is not declared in this file; the same holds for
     ids.milestones, ids.opener.att, ids.head, ids.q.att.type and ids.gloss,
     which are referenced further down. Presumably all of them are declared
     in the customization file. Confirm.
     NOTE(review): in XML the first declaration of an entity is binding, so
     the entities declared above this include (a.global, x.token, m.inter,
     ...) cannot be overridden from the customization file. -->
75<!ENTITY % ids.customization SYSTEM "ids.xcustomize.ent" >
76%ids.customization;
77%ids.state.elem;
78
79<!-- -->
80<!-- ELEMENT DECLARATIONS -->
81<!-- -->
82
83<!-- HIGH-LEVEL COMPONENTS -->
84
85
<!-- idsCorpus: one idsHeader followed by one or more idsDoc elements.
     version is required; type is optional; TEIform defaults to
     'teiCorpus.2'. idsHeader is not declared in this file. -->
86<!ELEMENT idsCorpus (idsHeader,(idsDoc+)) >
87<!ATTLIST idsCorpus %a.global;
88 type CDATA #IMPLIED
89 version CDATA #REQUIRED
90 TEIform CDATA 'teiCorpus.2' >
91
<!-- idsDoc: one idsHeader followed by one or more idsText elements.
     version is required; type defaults to "text"; TEIform defaults to
     'TEI.2'. -->
92<!ELEMENT idsDoc (idsHeader, idsText+) >
93<!ATTLIST idsDoc %a.global;
94 type CDATA "text"
95 version CDATA #REQUIRED
96 TEIform CDATA 'TEI.2' >
97
98
<!-- Declares the external parameter entity ids.header (public identifier
     "-//CES//ENTITIES Header//EN", system identifier ids.xheader.elt) and
     includes it here. Presumably this is where idsHeader is declared.
     Confirm. -->
99<!ENTITY % ids.header PUBLIC "-//CES//ENTITIES Header//EN" "ids.xheader.elt" >
100%ids.header;
101
102
103<!-- WRITTEN TEXTS -->
104
<!-- idsText: exactly one idsHeader followed by exactly one text element.
     version is required. -->
105<!ELEMENT idsText ((idsHeader , text)) >
106<!ATTLIST idsText %a.global;
107 version CDATA #REQUIRED >
108
<!-- text: any number of front, body, back and ids.milestones elements in
     any order. The model is a repeated alternation, so it enforces neither
     the front/body/back order nor that each occurs at most once. -->
109<!ELEMENT text (front | body |back | %ids.milestones;)* >
110<!-- milestones...-->
111<!ATTLIST text %a.global; >
112
<!-- front: an optional titlePage followed by any number of div elements. -->
113<!ELEMENT front (titlePage?,div*) >
114<!ATTLIST front %a.global; >
115
116
<!-- titlePage: one or more of docTitle, byline, docEdition, docImprint and
     epigraph, in any order. -->
117<!ELEMENT titlePage ((docTitle|byline|docEdition|docImprint|epigraph)+) >
118<!ATTLIST titlePage %a.global; >
119
<!-- docTitle: one or more titlePart elements; optional type is main or sub. -->
120<!ELEMENT docTitle (titlePart+) >
121<!ATTLIST docTitle %a.global;
122 type (main | sub) #IMPLIED >
123
<!-- epigraph: exactly one quote. -->
124<!ELEMENT epigraph (quote) >
125<!ATTLIST epigraph %a.global; >
126
<!-- docEdition and docImprint: character data only. -->
127<!ELEMENT docEdition (#PCDATA) >
128<!ATTLIST docEdition %a.global; >
129
130<!ELEMENT docImprint (#PCDATA) >
131<!ATTLIST docImprint %a.global; >
132
<!-- titlePart: character data mixed with s elements; optional type is one
     of main, sub, desc or unspecified. -->
133<!ELEMENT titlePart (#PCDATA | s)* >
134
135<!ATTLIST titlePart %a.global;
136 type (main | sub | desc | unspecified) #IMPLIED >
137
<!-- back and body share one content model: the par.seq group (paragraph
     level material) followed by any number of div elements. body
     additionally accepts an optional decls attribute (IDREFS). -->
138<!ELEMENT back (%par.seq;, div*) >
139<!ATTLIST back %a.text; >
140
141<!ELEMENT body (%par.seq;, div*) >
142<!ATTLIST body %a.text;
143 decls IDREFS #IMPLIED >
144
<!-- div: any mix, in any order, of opener, head, byline, p, sp, stage, the
     m.inter elements, nested div, closer and ids.milestones.
     type is required; complete defaults to "y"; decls is optional. -->
145<!ELEMENT div (opener | head | byline | p | sp | stage | %m.inter; | div | closer | %ids.milestones; )* >
146
147<!ATTLIST div %a.text;
148 complete (y | n) "y"
149 type CDATA #REQUIRED
150 decls IDREFS #IMPLIED >
151
152
153
154<!-- Opening elements -->
155
<!-- opener: mixed content: phrase.seq plus dateline, keywords, salute and
     ids.milestones. No ATTLIST for opener and no declaration of head is
     written out here; ids.opener.att and ids.head are parameter entities
     that are not declared in this file and presumably supply them.
     Confirm against the customization file. -->
156<!ELEMENT opener (%phrase.seq;| dateline | keywords | salute | %ids.milestones;)* >
157%ids.opener.att;
158
159%ids.head;
160
161
162<!-- Keyword lists, bylines, datelines -->
163
<!-- keywords: either one or more term elements or a single list, never
     both. Optional scheme attribute is an IDREF. -->
164<!ELEMENT keywords (term+ | list) >
165<!ATTLIST keywords %a.text;
166 scheme IDREF #IMPLIED >
167
168
<!-- byline: mixed content: phrase.seq plus docAuthor and ids.milestones. -->
169<!ELEMENT byline (%phrase.seq; | docAuthor | %ids.milestones;)* >
170<!ATTLIST byline %a.text; >
171
<!-- docAuthor: mixed content restricted to base.seq plus ids.milestones. -->
172<!ELEMENT docAuthor (%base.seq; | %ids.milestones; )* >
173<!ATTLIST docAuthor %a.text; >
174
<!-- dateline: mixed content: base.seq plus date, time, dateRange,
     timeRange, name, address and ids.milestones. -->
175<!ELEMENT dateline (%base.seq; | date | time |
176 dateRange | timeRange |
177 name | address | %ids.milestones;)* >
178
179<!ATTLIST dateline %a.text; >
180
<!-- salute and signed: character data mixed with ids.milestones only.
     salute is allowed in opener and closer; signed only in closer. -->
181<!ELEMENT salute (#PCDATA | %ids.milestones;)* >
182<!ATTLIST salute %a.text; >
183
184
185<!ELEMENT signed (#PCDATA | %ids.milestones;)* >
186<!ATTLIST signed %a.text; >
187
188
189
<!-- address: mixed content restricted to base.seq. In this file it is
     referenced only from dateline. -->
190<!ELEMENT address (%base.seq;)* >
191<!ATTLIST address %a.text; >
192
193
194
195
196<!-- Closing element -->
197
<!-- closer: same mixed content as opener (phrase.seq, dateline, keywords,
     salute, ids.milestones) with signed added. -->
198<!ELEMENT closer (%phrase.seq; | dateline | keywords | salute | signed | %ids.milestones;)* >
199<!ATTLIST closer %a.text; >
200
201
202<!-- PARAGRAPH-LEVEL ELEMENTS THE CLASS M.INTER -->
203
204<!-- Written paragraphs -->
205
<!-- p: mixed content: phrase.seq plus ids.milestones. Takes only the
     a.text attributes. -->
206<!ELEMENT p (%phrase.seq; | %ids.milestones;)* >
207
208<!ATTLIST p %a.text; >
209
210
211<!-- Quotations -->
212
<!-- quote: mixed content: phrase.seq plus p, poem and ids.milestones.
     next and prev are optional IDREFs; type is optional CDATA; broken is
     yes or no and defaults to "no". -->
213<!ELEMENT quote (%phrase.seq; | p | poem | %ids.milestones; )* >
214<!ATTLIST quote %a.text;
215 next IDREF #IMPLIED
216 prev IDREF #IMPLIED
217 type CDATA #IMPLIED
218 broken (yes | no) "no" >
219
220
221<!-- Lists -->
222
223
<!-- list: an optional head, then any mix of (a) a bare item, (b) a label
     followed by its item, with ids.milestones allowed between the two, and
     (c) ids.milestones. A label can never occur without a following item. -->
224<!ELEMENT list (head?, (item | (label, (%ids.milestones;)* , item) | %ids.milestones;)*) >
225<!ATTLIST list %a.text;
226 type CDATA #IMPLIED >
227
<!-- item: mixed content: phrase.seq plus p and ids.milestones. -->
228<!ELEMENT item (%phrase.seq; | p | %ids.milestones;)* >
229<!ATTLIST item %a.text; >
230
<!-- label: mixed content restricted to phrase.seq (no milestones). -->
231<!ELEMENT label (%phrase.seq;)* >
232<!ATTLIST label %a.text; >
233
234
235<!-- As in TEI, poem and quote may occur inside note -->
236
<!-- note: mixed content: phrase.seq plus p, bibl, poem, quote, sp and
     ids.milestones. place is one of side, foot, end or unspec and defaults
     to "unspec" (the default value sits on its own line below). -->
237<!ELEMENT note (%phrase.seq; | p | bibl | poem | quote | sp | %ids.milestones;)* >
238<!ATTLIST note %a.text;
239 place (side | foot | end | unspec)
240
241 "unspec" >
242
<!-- bibl: mixed content: phrase.seq plus author and ids.milestones.
     Besides a.text it takes the Default attribute from a.declarable. -->
243<!ELEMENT bibl (%phrase.seq; | author | %ids.milestones;)* >
244<!ATTLIST bibl %a.text;
245 %a.declarable; >
246
<!-- author: mixed content restricted to base.seq. -->
247<!ELEMENT author (%base.seq;)* >
248<!ATTLIST author %a.text; >
249
250
251<!-- Poems -->
252
<!-- poem: an optional head followed by at least one lg, l or
     ids.milestones element. -->
253<!ELEMENT poem (head?, (lg | l | %ids.milestones;)+ ) >
254<!ATTLIST poem %a.text; >
255
<!-- lg: at least one l, nested lg or ids.milestones element.
     type is optional; part is y, n or u and defaults to "u". -->
256<!ELEMENT lg (l | lg | %ids.milestones;)+ >
257<!ATTLIST lg %a.text;
258 type CDATA #IMPLIED
259 part (y | n | u) "u" >
260
<!-- l: mixed content: phrase.seq plus ids.milestones.
     part is y, n or u and defaults to "u". -->
261<!ELEMENT l (%phrase.seq; | %ids.milestones;)* >
262<!ATTLIST l %a.text;
263 part (y | n | u) "u" >
264
265
266<!-- Figures -->
267
268<!-- Motivation: figure captions may also contain spoken passages
269 or quotations, including a speaker or title.
270 The previous structural description is insufficient
271 in this respect.
272-->
273
<!-- figure: in this order: an optional head; any mix of p, the m.inter
     elements and ids.milestones; an optional figDesc; an optional embedded
     text element. The optional entity attribute has the declared type
     ENTITY. -->
274<!ELEMENT figure (head?, (p| %m.inter; | %ids.milestones; )*, figDesc?, text?) >
275<!ATTLIST figure %a.text;
276 entity ENTITY #IMPLIED >
277
<!-- figDesc: mixed content restricted to phrase.seq. -->
278<!ELEMENT figDesc (%phrase.seq;)* >
279<!ATTLIST figDesc %a.text; >
280
281<!-- Tables -->
282
<!-- table: an optional head followed by at least one row or ids.milestones
     element. rows and cols are optional NMTOKENs. -->
283<!ELEMENT table (head?, (row | %ids.milestones;)+ ) >
284<!ATTLIST table %a.text;
285 rows NMTOKEN #IMPLIED
286 cols NMTOKEN #IMPLIED >
287
<!-- row: at least one cell or table; a nested table may therefore sit
     directly in a row, next to the cells. role defaults to "data". -->
288<!ELEMENT row (cell | table)+ >
289<!ATTLIST row %a.text;
290 role CDATA "data" >
291
<!-- cell: mixed content: phrase.seq plus ids.milestones.
     role defaults to "data"; rows and cols each default to "1". -->
292<!ELEMENT cell (%phrase.seq; | %ids.milestones;)* >
293<!ATTLIST cell %a.text;
294 role CDATA "data"
295 rows NMTOKEN "1"
296 cols NMTOKEN "1" >
297
298
299<!-- Captions -->
300
301<!-- Motivation: captions may contain arbitrary paragraph-level
302 structures as well as headings.
303 The previous structural description is entirely
304 inadequate in this respect, since it only allows
305 sentence-level structures.
306-->
<!-- caption: any number of head elements followed by at least one p,
     m.inter element or ids.milestones element. type is one of byline,
     display, attached or unspec and defaults to "unspec". -->
307<!ELEMENT caption ( head*, (p | %m.inter; | %ids.milestones; )+ ) >
308<!ATTLIST caption %a.text;
309 type ( byline | display |
310 attached | unspec ) "unspec" >
311
312
313
314<!-- As in TEI, poem and quote may also
315 occur inside sp -->
316
<!-- sp: element-only content: any mix of speaker, p, quote, poem, stage
     and ids.milestones; no character data directly inside sp.
     who is optional CDATA. -->
317<!ELEMENT sp (speaker | p | quote | poem | stage | %ids.milestones; )* >
318<!ATTLIST sp %a.text;
319 who CDATA #IMPLIED >
320
321
<!-- speaker: mixed content restricted to base.seq plus ids.milestones. -->
322<!ELEMENT speaker (%base.seq; | %ids.milestones; )* >
323<!ATTLIST speaker %a.text; >
324
<!-- stage: mixed content: base.seq plus p and ids.milestones.
     type is optional CDATA. -->
325<!ELEMENT stage (%base.seq; | p | %ids.milestones; )* >
326<!ATTLIST stage %a.text;
327 type CDATA #IMPLIED >
328
329
330
331<!-- SENTENCES, QUOTED DIALOGUE WITHIN PARAGRAPHS -->
332
<!-- s: mixed content: phrase.seq plus ids.milestones. Because s is itself
     listed in m.phrase, s elements can nest.
     next and prev are optional IDREFs; type is optional CDATA; broken is
     yes or no and defaults to "no". -->
333<!ELEMENT s (%phrase.seq; | %ids.milestones; )* >
334<!ATTLIST s %a.text;
335 next IDREF #IMPLIED
336 prev IDREF #IMPLIED
337 type CDATA #IMPLIED
338 broken (yes | no) "no" >
339
340
<!-- q: same content model as s. The ATTLIST splices in ids.q.att.type,
     which is not declared in this file; judging by its name it presumably
     supplies the type attribute. Confirm against the customization file.
     direct is y, n or unspecified and defaults to "unspecified"; broken
     defaults to "no". -->
341<!ELEMENT q (%phrase.seq; | %ids.milestones; )* >
342<!ATTLIST q %a.text; %ids.q.att.type;
343 next IDREF #IMPLIED
344 prev IDREF #IMPLIED
345 direct (y | n | unspecified)
346 "unspecified"
347 who CDATA #IMPLIED
348 broken (yes | no) "no" >
349
350
351
352<!-- PHRASE-LEVEL ELEMENTS THE CLASS M.PHRASE -->
353
354
355<!-- Editorial Changes -->
356
<!-- gap: empty element; desc, reason, resp and cert are optional CDATA. -->
357<!ELEMENT gap EMPTY >
358<!ATTLIST gap %a.text;
359 desc CDATA #IMPLIED
360 reason CDATA #IMPLIED
361 resp CDATA #IMPLIED
362 cert CDATA #IMPLIED >
363
<!-- reg: mixed content restricted to phrase.seq; orig, resp and cert are
     optional CDATA. -->
364<!ELEMENT reg (%phrase.seq;)* >
365<!ATTLIST reg %a.text;
366 orig CDATA #IMPLIED
367 resp CDATA #IMPLIED
368 cert CDATA #IMPLIED >
369
370<!-- Seubert, 07.03.05: extended with the attribute 'regalt' to cover
371 variants in so-called "Sparschreibung" -->
<!-- orig: mixed content restricted to phrase.seq; reg, regalt, resp and
     cert are optional CDATA. -->
372<!ELEMENT orig (%phrase.seq;)* >
373<!ATTLIST orig %a.text;
374 reg CDATA #IMPLIED
375 regalt CDATA #IMPLIED
376 resp CDATA #IMPLIED
377 cert CDATA #IMPLIED >
378
<!-- corr: mixed content restricted to phrase.seq; sic, resp and cert are
     optional CDATA. -->
379<!ELEMENT corr (%phrase.seq;)* >
380<!ATTLIST corr %a.text;
381 sic CDATA #IMPLIED
382 resp CDATA #IMPLIED
383 cert CDATA #IMPLIED >
384
385
386<!-- Highlighted text -->
387
<!-- hi: mixed content: phrase.seq plus ids.milestones. hi is listed in
     both base.seq and m.phrase, so it is available wherever either fragment
     is used, and it can nest. -->
388<!ELEMENT hi (%phrase.seq; | %ids.milestones;)* >
389<!ATTLIST hi %a.text; >
390
391
392
393<!-- Other Phrase-level Elements -->
394
<!-- date: mixed content restricted to base.seq; optional CDATA attribute
     ISO8601. -->
395<!ELEMENT date (%base.seq;)* >
396<!ATTLIST date %a.text;
397 ISO8601 CDATA #IMPLIED >
398
<!-- foreign, distinct and mentioned share one content model: phrase.seq
     plus ids.milestones. Only distinct adds an attribute (optional type). -->
399<!ELEMENT foreign (%phrase.seq; | %ids.milestones;)* >
400<!ATTLIST foreign %a.text; >
401
402<!ELEMENT distinct (%phrase.seq; | %ids.milestones;)* >
403<!ATTLIST distinct %a.text;
404 type CDATA #IMPLIED >
405
406<!ELEMENT mentioned (%phrase.seq;| %ids.milestones;)* >
407<!ATTLIST mentioned %a.text; >
408
<!-- measure: mixed content restricted to base.seq. Optional type is one of
     weight, length, count, area, volume, temperature or currency; value is
     optional CDATA. -->
409<!ELEMENT measure (%base.seq;)* >
410<!ATTLIST measure %a.text;
411 type (weight| length| count| area|
412 volume| temperature| currency)
413 #IMPLIED
414 value CDATA #IMPLIED >
415
<!-- name and term: base.seq plus ids.milestones; each has an optional
     CDATA type attribute. -->
416<!ELEMENT name (%base.seq; | %ids.milestones;)* >
417<!ATTLIST name %a.text;
418 type CDATA
419 #IMPLIED >
420
421<!ELEMENT term (%base.seq; | %ids.milestones;)* >
422<!ATTLIST term %a.text;
423 type CDATA #IMPLIED >
424
<!-- ids.gloss is a parameter entity that is not declared in this file;
     presumably it expands to the declarations for a gloss element.
     Confirm against the customization file. -->
425%ids.gloss;
426
<!-- time: mixed content: base.seq plus ids.milestones. ISO8601 is optional
     CDATA; optional type is one of am, pm, 24hour or descriptive. -->
427<!ELEMENT time (%base.seq; | %ids.milestones;)* >
428<!ATTLIST time %a.text;
429 ISO8601 CDATA #IMPLIED
430 type (am | pm | 24hour | descriptive)
431 #IMPLIED >
432
433<!-- provisionally added, Seubert (30.06.2004) -->
<!-- w: character data only; ana, ctag and type are optional CDATA. -->
434<!ELEMENT w (#PCDATA) >
435<!ATTLIST w %a.text;
436 ana CDATA #IMPLIED
437 ctag CDATA #IMPLIED
438 type CDATA #IMPLIED >
439
<!-- title: mixed content: phrase.seq plus ids.milestones; optional CDATA
     type attribute. -->
440<!ELEMENT title (%phrase.seq; | %ids.milestones;)* >
441<!ATTLIST title %a.text;
442 type CDATA #IMPLIED >
443
<!-- abbr: character data only; expan, cert and type are optional CDATA.
     NOTE(review): resp is declared as IDREF here, whereas gap, reg, orig,
     corr, ptr and ref declare resp as CDATA. Confirm whether the difference
     is intended before relying on it. -->
444<!ELEMENT abbr (#PCDATA) >
445<!ATTLIST abbr %a.text;
446 expan CDATA #IMPLIED
447 resp IDREF #IMPLIED
448 cert CDATA #IMPLIED
449 type CDATA #IMPLIED >
450
<!-- num: character data only; type and value are optional CDATA. -->
451<!ELEMENT num (#PCDATA) >
452<!ATTLIST num %a.text;
453 type CDATA #IMPLIED
454 value CDATA #IMPLIED >
455
456
457<!-- Eric Seubert, 03.03.06: provisionally added -->
458
<!-- dateRange, numRange and timeRange: each is mixed content restricted to
     base.seq with optional CDATA attributes from and to. Only numRange adds
     an optional CDATA type attribute. -->
459<!ELEMENT dateRange (%base.seq;)* >
460<!ATTLIST dateRange %a.text;
461 from CDATA #IMPLIED
462 to CDATA #IMPLIED >
463
464<!ELEMENT numRange (%base.seq;)* >
465<!ATTLIST numRange %a.text;
466 from CDATA #IMPLIED
467 to CDATA #IMPLIED
468 type CDATA #IMPLIED >
469
470<!ELEMENT timeRange (%base.seq;)* >
471<!ATTLIST timeRange %a.text;
472 from CDATA #IMPLIED
473 to CDATA #IMPLIED >
474
475
476
477
478
479<!-- SEGMENTATION, LINKING, ALIGNMENT -->
480
481<!-- Simple cross references -->
482
<!-- ptr: empty cross-reference element. target is required and has type
     IDREFS; targOrder is y, n or u and defaults to "u"; every other
     attribute is optional.
     NOTE(review): ptr is declared here but does not appear in any content
     model visible in this file (m.phrase lists ref and xref, not ptr).
     Confirm whether an included entity file makes it reachable. -->
483<!ELEMENT ptr EMPTY >
484<!ATTLIST ptr %a.text;
485 corresp IDREFS #IMPLIED
486 next IDREF #IMPLIED
487 prev IDREF #IMPLIED
488 type CDATA #IMPLIED
489 resp CDATA #IMPLIED
490 crdate CDATA #IMPLIED
491 targType NMTOKENS #IMPLIED
492 targOrder (y | n | u) "u"
493 evaluate (all | one | none) #IMPLIED
494 target IDREFS #REQUIRED >
495
<!-- ref: mixed content: phrase.seq plus ids.milestones. Same attribute
     list as ptr except for target, which here is optional CDATA instead of
     required IDREFS. -->
496<!ELEMENT ref (%phrase.seq; | %ids.milestones; )* >
497<!ATTLIST ref %a.text;
498 corresp IDREFS #IMPLIED
499 next IDREF #IMPLIED
500 prev IDREF #IMPLIED
501 type CDATA #IMPLIED
502 resp CDATA #IMPLIED
503 crdate CDATA #IMPLIED
504 targType NMTOKENS #IMPLIED
505 targOrder (y | n | u) "u"
506 evaluate (all | one | none) #IMPLIED
507 target CDATA #IMPLIED >
508
509
510<!-- PUBLIC ENTITY SETS -->
511
512
<!-- Declares the external parameter entity IDSlat1 (public identifier
     "-//IDS//ENTITIES Latin 1 Extension for IDS-CES//EN", system identifier
     ids-lat1.ent) and includes it as the last step of this DTD. -->
513<!ENTITY % IDSlat1 PUBLIC "-//IDS//ENTITIES Latin 1 Extension for IDS-CES//EN" "ids-lat1.ent">
514%IDSlat1;
515