blob: aa5043de3b69e7ba5a8b60846ffb5f975e1518b8 [file] [log] [blame]
<xsl:stylesheet version="3.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
xmlns:xs="http://www.w3.org/2001/XMLSchema"
xmlns:opf="http://www.idpf.org/2007/opf"
xmlns:dc="http://purl.org/dc/elements/1.1/"
xmlns:ids="http://www.ids-mannheim.de/ids"
xmlns:hlu="http://www.ids-mannheim.de/hlu"
xmlns:saxon="http://saxon.sf.net/"
xmlns:xhtml="http://www.w3.org/1999/xhtml"
exclude-result-prefixes="xs opf dc ids hlu saxon xhtml">
<xsl:output method="xml" indent="yes" omit-xml-declaration="yes" saxon:line-length="1000"/>
<xsl:strip-space elements="*"/>
<xsl:variable name="ev"/>
<xsl:variable name="x"/>
<xsl:variable name="isbn" as="xs:string" select="replace(document-uri(), '.*([0-9]{13,}).*' , '$1')"/>
<xsl:variable name="dnbBookdata">
<xsl:copy-of select="doc(concat('https://services.dnb.de/sru/dnb?version=1.1&amp;operation=searchRetrieve&amp;query=NUM%3D', $isbn, '&amp;recordSchema=oai_dc'))"/>
</xsl:variable>
<xsl:variable name="autor"
select="replace(string-join($dnbBookdata//dc:creator[not(matches(., '\[(Erzähler)\]'))], ' ; '), ' *\[[^\]]*\]', '')"/>
<xsl:variable name="straight_autor" select="normalize-space(replace(hlu:reversedAuthors($autor), ',', ''))"/>
<xsl:variable name="ina"/>
<xsl:variable name="_corpus"/>
<xsl:variable name="ent_known"/>
<!-- added HLU 2012-02-09: -->
<xsl:variable name="ent">
<xsl:choose>
<xsl:when test="$ent_known">
<xsl:value-of select="$ent_known"/>
</xsl:when>
<xsl:when test="$ev">
<xsl:value-of select="$ev"/>
</xsl:when>
<xsl:otherwise>
<xsl:value-of select="$j"/>
</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<xsl:variable name="titel">
<xsl:variable name="title-with-subtitles">
<xsl:choose>
<xsl:when test="contains(($dnbBookdata//dc:title)[1],':')">
<xsl:value-of select="normalize-space(substring-before(substring-before(($dnbBookdata//dc:title)[1], '/'), ':'))"
/>
</xsl:when>
<xsl:otherwise>
<xsl:value-of select="normalize-space(substring-before(($dnbBookdata//dc:title)[1], '/'))"/>
</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<xsl:value-of select="normalize-space(replace($title-with-subtitles, '\|.*', ''))"/>
</xsl:variable>
<xsl:variable name="erscheinungsort">
<xsl:choose>
<xsl:when test="contains(($dnbBookdata//dc:publisher)[1], ':')">
<xsl:value-of select="normalize-space(substring-before(($dnbBookdata//dc:publisher)[1], ':'))"/>
</xsl:when>
<xsl:otherwise>
<xsl:value-of select="normalize-space(($dnbBookdata//dc:publisher)[1])"/>
</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<xsl:variable name="texttype" select="replace(($dnbBookdata//dc:subject[matches(., '^[A-Z] ')])[1], '^[A-Z] (.*)', '$1')"/>
<xsl:variable name="verlag">
<xsl:choose>
<xsl:when test="contains(($dnbBookdata//dc:publisher)[1], ':')">
<xsl:value-of select="normalize-space(substring-after(($dnbBookdata//dc:publisher)[1], ':'))"/>
</xsl:when>
<xsl:otherwise>
<xsl:value-of select="normalize-space(($dnbBookdata//dc:publisher)[1])"/>
</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<xsl:variable name="erscheinungsjahr">
<xsl:choose>
<xsl:when test="dnbBookdata//dc:date[matches(normalize-space(.), '^[0-9]{4}$')]">
<xsl:value-of select="$dnbBookdata//dc:date[matches(normalize-space(.), '^[0-9]{4}$')][1]"/>
</xsl:when>
<xsl:otherwise>
<xsl:value-of select="substring-before(($dnbBookdata//dc:date)[1], '-')"/>
</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<xsl:variable name="untertitel"
select="normalize-space(substring-after(substring-before(($dnbBookdata//dc:title)[1], '/'), ':'))"/>
<xsl:variable name="herausgeber">
<xsl:choose>
<xsl:when test="$dnbBookdata//dc:creator[ends-with(.,'[Hrsg.]')]">
<xsl:value-of
select="replace(string-join($dnbBookdata//dc:creator[ends-with(.,'[Hrsg.]')][1], ' ; '),'\s?\[Hrsg.\]','')"
/>
</xsl:when>
<xsl:otherwise>.</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<xsl:variable name="straight_herausgeber"
select="replace(hlu:reversedAuthors($herausgeber), ',', '')"/>
<xsl:variable name="j" select="$dnbBookdata//dc:date"/>
<!-- for BOT+s: -->
<xsl:variable name="seiten" select="replace($dnbBookdata//dc:format,'S\.','')"/>
<!-- fuer BOT+b: -->
<xsl:variable name="_b">
<xsl:variable name="regexp1" select="'(Band|Bd\.)\s*([0-9]?[0-9]?[0-9])'"/>
<xsl:choose>
<xsl:when test="matches($dnbBookdata, $regexp1)">
<xsl:analyze-string select="$dnbBookdata//dc:title" regex="{$regexp1}">
<xsl:matching-substring>
<xsl:value-of select="."/>
</xsl:matching-substring>
</xsl:analyze-string>
</xsl:when>
<xsl:otherwise>
<xsl:value-of select="'.'"/>
</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<!-- for BOT+x: -->
<xsl:variable name="txtart">
<xsl:choose>
<xsl:when test="$x">
<xsl:value-of select="concat('[', $x, ']')"/>
</xsl:when>
<xsl:when
test="matches($untertitel, '([Rr]oman|[Ee]rzhlung(en)?|[Aa]nthologie|[Gg]eschichte(n)?|[Nn]ovelle)')">
<xsl:value-of
select="concat('[', replace(replace($untertitel, '.*?(((^|\P{L})\p{L}+)?([Rr]oman|[Ee]rzhlung(en)?|[Aa]nthologie|[Gg]eschichte(n)?|[Nn]ovelle)).*', '$1'), '\P{L}*(.+)', '$1'), ']')"
/>
</xsl:when>
<xsl:otherwise>
<xsl:value-of>Roman</xsl:value-of>
</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<!-- fuer BOTd: -->
<xsl:variable name="dok"
select="concat((if(string-length($autor) &gt; 0) then concat($straight_autor, ': ') else ''), $titel, ', ', $txtart, ', (', $j, ')')"/>
<!-- END variables derived from sru request to dnb archive -->
<xsl:variable name="corpus_sigle" select="concat('DNB', substring($erscheinungsjahr, 3, 2))"/>
<!-- for BOTD: -->
<!-- Dokumentsigle muss zusammen mit Korpussigle (z.B DIV fuer loz-div und loz-div-pub) eindeutig sein -->
<xsl:variable name="doc_sigle">
<xsl:variable name="firstContentWordTitleInitial">
<xsl:variable name="helper">
<xsl:analyze-string select="$titel" regex="\w+">
<xsl:matching-substring>
<xsl:choose>
<xsl:when
test="matches(.,'^[A-Z]') and not(matches(.,'^(Der|Die|Das|Des|Ein|Eine|Eines|Einmal|Von|Mit|Zu|Zurck)$'))">
<!-- TODO: Fktnswoerter nachtragen -->
<xsl:sequence select="."/>
</xsl:when>
<xsl:otherwise/>
</xsl:choose>
</xsl:matching-substring>
</xsl:analyze-string>
</xsl:variable>
<xsl:value-of
select="upper-case(substring(normalize-space(replace($helper,'\s+.+$','')),1,1))"/>
<!-- longest match of .+ -->
</xsl:variable>
<xsl:choose>
<xsl:when test="contains($autor,';')">
<xsl:variable name="lastname_aut1"
select="upper-case(substring(normalize-space(substring-before(substring-before($autor,';'),',')), 1, 1))"/>
<xsl:variable name="lastname_aut2"
select="upper-case(substring(normalize-space(substring-before(substring-before(substring-after($autor, ';'),';'),',')), 1, 1))"/>
<xsl:value-of select="concat($lastname_aut1, $lastname_aut2)"/>
</xsl:when>
<xsl:otherwise>
<xsl:variable name="lastname_aut1"
select="upper-case(substring(normalize-space(substring-before($autor,',')),1,1))"/>
<xsl:variable name="firstname_aut1"
select="upper-case(substring(normalize-space(substring-after($autor,',')),1,1))"/>
<xsl:value-of select="concat($lastname_aut1, $firstname_aut1)"/>
</xsl:otherwise>
</xsl:choose>
<xsl:value-of select="$firstContentWordTitleInitial"/>
</xsl:variable>
<xsl:variable name="text_sigle" select="substring($isbn, 8, 5)"/>
<xsl:variable name="sigle" select="concat($corpus_sigle, '/', $doc_sigle, '.', $text_sigle)"/>
<!-- fuer BOT+xy: (?) -->
<xsl:variable name="xyref">
<xsl:value-of select="document-uri(.)"/>
<xsl:text>; </xsl:text>
<xsl:text>ISBN:</xsl:text>
<xsl:value-of select="$isbn"/>
<xsl:text>; </xsl:text>
<xsl:value-of select="string-join($dnbBookdata//dc:identifier)"/>
</xsl:variable>
<xsl:variable name="long-reference"
select="concat($sigle, ' ', $autor, ': ', $titel, '. ', $erscheinungsort, ': ', $verlag, ', ', $erscheinungsjahr)"/>
<xsl:variable name="short-reference"
select="concat($straight_autor, ': ', $titel, ' (', $erscheinungsjahr, ')')"/>
<xsl:template match="/">
<idsDoc TEIform="TEI.2" type="text" version="1.0">
<idsHeader TEIform="teiHeader" pattern="text" status="new" type="document" version="1.1">
<fileDesc>
<titleStmt>
<dokumentSigle><xsl:value-of select="string-join(($corpus_sigle, $doc_sigle), '/')"/></dokumentSigle>
<d.title><xsl:value-of select="$short-reference"/></d.title>
</titleStmt>
<publicationStmt>
<distributor/>
<pubAddress/>
<availability region="world" status="unknown">QAO-NC</availability>
<pubDate/>
</publicationStmt>
<sourceDesc>
<biblStruct>
<monogr>
<h.title type="main"/>
<imprint/>
</monogr>
</biblStruct>
</sourceDesc>
</fileDesc>
</idsHeader>
<idsText version="1.0">
<idsHeader TEIform="teiHeader" pattern="text" status="new" type="text" version="1.1">
<fileDesc>
<titleStmt>
<textSigle><xsl:sequence select="$sigle"/></textSigle>
<t.title assemblage="regular"><xsl:value-of select="$long-reference"/></t.title>
</titleStmt>
<publicationStmt>
<distributor/>
<pubAddress/>
<availability region="world" status="unknown">QAO-NC</availability>
<pubDate/>
</publicationStmt>
<sourceDesc>
<biblStruct>
<monogr>
<h.title type="main"><xsl:value-of select="$titel"/></h.title>
<h.title type="sub"><xsl:value-of select="$untertitel"/></h.title>
<h.author><xsl:value-of select="$autor"/></h.author>
<editor/>
<edition>
<further/>
<kind>E-Book-Ausgabe</kind>
<appearance>EPUB-Datei</appearance>
</edition>
<imprint>
<publisher><xsl:value-of select="$verlag"/></publisher>
<pubDate type="year"><xsl:value-of select="$j"/></pubDate>
<pubDate type="month"/>
<pubDate type="day"/>
<pubPlace key="DE"><xsl:value-of select="$erscheinungsort"/></pubPlace>
</imprint>
<biblScope type="subsume"/>
<biblScope type="pp"/>
<biblScope type="vol"/>
<biblScope type="volume-title"/>
</monogr>
</biblStruct>
<reference assemblage="regular" type="complete"><xsl:value-of select="concat($sigle, ' ', $autor, ': ', $titel, '. ', $erscheinungsort, ': ', $verlag, ', ', $erscheinungsjahr)"/></reference>
</sourceDesc>
</fileDesc>
<profileDesc>
<creation>
<creatDate><xsl:value-of select="$j"/></creatDate>
</creation>
<textClass/>
<textDesc>
<textType><xsl:value-of select="$texttype"/></textType>
<textTypeRef><xsl:value-of select="$texttype"/></textTypeRef>
<textDomain/>
</textDesc>
</profileDesc>
</idsHeader>
<text>
<body>
<!-- Call the template for each link in the TOC
<xsl:apply-templates select="//xhtml:ol[@class='toc']/xhtml:li/xhtml:a" mode="collect"/> -->
<xsl:apply-templates select="//opf:package/opf:manifest/opf:item[matches(@href, '\.x?html$') and not(matches(@href, '(cover|toc|copyright|feedback|inhalt|nav|titlepage).*'))]" mode="collect"/>
</body>
</text>
</idsText>
</idsDoc>
</xsl:template>
<xsl:template match="opf:item" mode="collect">
<xsl:variable name="href" select="@href"/>
<xsl:message>
<xsl:text>converting: </xsl:text><xsl:value-of select="$href"/><xsl:text> </xsl:text><xsl:value-of select="$isbn"/>
</xsl:message>
<xsl:apply-templates select="doc(resolve-uri($href, base-uri()))/xhtml:html/xhtml:body"/>
</xsl:template>
<xsl:template match="xhtml:body">
<div type="chapter">
<xsl:apply-templates/>
</div>
</xsl:template>
<xsl:template match="xhtml:title">
<head>
<xsl:apply-templates/>
</head>
</xsl:template>
<xsl:template match="xhtml:h1">
<head>
<xsl:apply-templates/>
</head>
</xsl:template>
<xsl:template match="xhtml:h2|xhtml:h3">
<head type="sub">
<xsl:apply-templates/>
</head>
</xsl:template>
<xsl:template match="xhtml:em">
<emph>
<xsl:apply-templates/>
</emph>
</xsl:template>
<xsl:template match="xhtml:span[matches(@class, '(bold|italic|big|kursiv| )+')]">
<xsl:variable name="class" select="replace(@class, 'kursiv', 'italic')"/>
<hi rend="{$class}">
<xsl:apply-templates/>
</hi>
</xsl:template>
<xsl:template match="xhtml:b">
<hi rend="bold">
<xsl:apply-templates/>
</hi>
</xsl:template>
<xsl:template match="xhtml:sub|xhtml:span[@class='sub']">
<hi rend="sub">
<xsl:apply-templates/>
</hi>
</xsl:template>
<xsl:template match="xhtml:sup|xhtml:span[@class='sup']">
<hi rend="sup">
<xsl:apply-templates/>
</hi>
</xsl:template>
<xsl:template match="xhtml:div">
<div type="section">
<xsl:apply-templates/>
</div>
</xsl:template>
<xsl:template match="xhtml:p">
<p>
<xsl:apply-templates/>
</p>
</xsl:template>
<xsl:template match="xhtml:nav">
<!-- <gap reason="toc"/> -->
</xsl:template>
<xsl:template match="xhtml:img">
<!-- <gap reason="image"/> -->
</xsl:template>
<xsl:template match="xhtml:audio">
<!-- <gap reason="audio"/> -->
</xsl:template>
<xsl:template match="xhtml:a">
<ref target="{@href}">
<xsl:apply-templates />
</ref>
</xsl:template>
<xsl:template match="xhtml:br"/>
<xsl:template match="xhtml:*">
<xsl:message>
<xsl:text>unhandled element: </xsl:text><xsl:value-of select="concat(name(), ' ', string-join(./@*[normalize-space(.) != '']/concat(name(), ':', ., ' '), '_'))"/>
</xsl:message>
<xsl:apply-templates/>
</xsl:template>
<xsl:function name="ids:reversedAuthors">
<xsl:param name="s" />
<xsl:value-of
select="
if (matches($s, ';')) then
concat(ids:reversedAuthors(substring-before($s, ' ; ')), ' ; ', ids:reversedAuthors(substring-after($s, ' ; ')))
else
replace($s, '(.+) (.+)', '$2, $1')"
/>
</xsl:function>
<xsl:function name="hlu:reversedAuthors">
<xsl:param name="s"/>
<xsl:value-of
select="if (matches($s, ';')) then concat(ids:reversedAuthors(substring-before($s, ' ; ')), ' ; ', ids:reversedAuthors(substring-after($s, ' ; '))) else replace($s, '(.+),(.+)', '$2, $1')"
/>
</xsl:function>
</xsl:stylesheet>