Added text marker, added sentences from multiple foundries, changed paragraphs to base/para, some tests, some bugfixes
diff --git a/t/WPD/02035-substring/header.xml b/t/WPD/02035-substring/header.xml
new file mode 100644
index 0000000..b4689d7
--- /dev/null
+++ b/t/WPD/02035-substring/header.xml
@@ -0,0 +1,65 @@
+<?xml version="1.0" encoding="iso-8859-1"?>
+<?xml-model href="header.rng" type="application/xml" schematypens="http://relaxng.org/ns/structure/1.0"?>
+<!DOCTYPE idsCorpus PUBLIC "-//IDS//DTD IDS-XCES 1.0//EN" "http://corpora.ids-mannheim.de/idsxces1/DTD/ids.xcesdoc.dtd">
+<idsHeader type="text" pattern="text" status="new" version="1.1" TEIform="teiHeader">
+ <fileDesc>
+ <titleStmt>
+ <textSigle>A00/JAN.02035</textSigle>
+ <t.title assemblage="regular">A00/JAN.02035 St. Galler Tagblatt, 11.01.2000, Ressort: TB-RSP (Abk.)</t.title>
+ </titleStmt>
+ <publicationStmt>
+ <distributor/>
+ <pubAddress/>
+ <availability region="world" status="unknown"/>
+ <pubDate/>
+ </publicationStmt>
+ <sourceDesc>
+ <biblStruct>
+ <analytic>
+ <h.title type="main"/>
+ <h.author/>
+ <imprint/>
+ <biblScope type="pp"/>
+ <biblScope type="suppl"/>
+ <biblScope type="suppltitle"/>
+ <biblNote n="1"/>
+ </analytic>
+ <monogr>
+ <h.title type="main"/>
+ <imprint>
+ <pubDate type="year">2000</pubDate>
+ <pubDate type="month">01</pubDate>
+ <pubDate type="day">11</pubDate>
+ </imprint>
+ <biblScope type="issue"/>
+ <biblScope type="issueplace"/>
+ </monogr>
+ </biblStruct>
+ <reference type="complete" assemblage="regular">A00/JAN.02035 St. Galler Tagblatt, [Tageszeitung], 11.01.2000, Jg. 56. Originalressort: TB-RSP (Abk.), [Bericht]</reference>
+ <reference type="short" assemblage="regular">A00/JAN.02035 St. Galler Tagblatt, 11.01.2000</reference>
+ </sourceDesc>
+ </fileDesc>
+ <encodingDesc>
+ <samplingDecl/>
+ <tagsDecl>
+ <tagUsage gi="p" occurs="5"/>
+ <tagUsage gi="s" occurs="28"/>
+ </tagsDecl>
+ </encodingDesc>
+ <profileDesc>
+ <creation>
+ <creatDate>2000.01.11</creatDate>
+ </creation>
+ <textClass>
+ <catRef n="1" target="topic.sport.ballsport" scheme="topic"/>
+ <h.keywords>
+ <keyTerm/>
+ </h.keywords>
+ </textClass>
+ <textDesc>
+ <textTypeArt>Bericht</textTypeArt>
+ <textDomain/>
+ <column>TB-RSP (Abk.)</column>
+ </textDesc>
+ </profileDesc>
+ </idsHeader>