| <xsl:stylesheet version="3.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform" |
| xmlns:xs="http://www.w3.org/2001/XMLSchema" |
| xmlns:opf="http://www.idpf.org/2007/opf" |
| xmlns:dc="http://purl.org/dc/elements/1.1/" |
| xmlns:ids="http://www.ids-mannheim.de/ids" |
| xmlns:hlu="http://www.ids-mannheim.de/hlu" |
| xmlns:saxon="http://saxon.sf.net/" |
| xmlns:xhtml="http://www.w3.org/1999/xhtml" |
| exclude-result-prefixes="xs opf dc ids hlu saxon xhtml"> |
| |
| <xsl:output method="xml" indent="yes" omit-xml-declaration="yes" saxon:line-length="1000"/> |
| <xsl:strip-space elements="*"/> |
| |
| <xsl:variable name="ev"/> |
| <xsl:variable name="x"/> |
| |
| <xsl:variable name="isbn" as="xs:string" select="replace(document-uri(), '.*([0-9]{13,}).*' , '$1')"/> |
| |
| |
| <xsl:variable name="dnbBookdata"> |
| <xsl:copy-of select="doc(concat('https://services.dnb.de/sru/dnb?version=1.1&operation=searchRetrieve&query=NUM%3D', $isbn, '&recordSchema=oai_dc'))"/> |
| </xsl:variable> |
| |
| <xsl:variable name="autor" |
| select="replace(string-join($dnbBookdata//dc:creator[not(matches(., '\[(Erzähler)\]'))], ' ; '), ' *\[[^\]]*\]', '')"/> |
| |
| <xsl:variable name="straight_autor" select="normalize-space(replace(hlu:reversedAuthors($autor), ',', ''))"/> |
| |
| <xsl:variable name="ina"/> |
| <xsl:variable name="_corpus"/> |
| <xsl:variable name="ent_known"/> |
| |
| |
| <!-- added HLU 2012-02-09: --> |
| <xsl:variable name="ent"> |
| <xsl:choose> |
| <xsl:when test="$ent_known"> |
| <xsl:value-of select="$ent_known"/> |
| </xsl:when> |
| <xsl:when test="$ev"> |
| <xsl:value-of select="$ev"/> |
| </xsl:when> |
| <xsl:otherwise> |
| <xsl:value-of select="$j"/> |
| </xsl:otherwise> |
| </xsl:choose> |
| </xsl:variable> |
| |
| <xsl:variable name="titel"> |
| <xsl:variable name="title-with-subtitles"> |
| <xsl:choose> |
| <xsl:when test="contains(($dnbBookdata//dc:title)[1],':')"> |
| <xsl:value-of select="normalize-space(substring-before(substring-before(($dnbBookdata//dc:title)[1], '/'), ':'))" |
| /> |
| </xsl:when> |
| <xsl:otherwise> |
| <xsl:value-of select="normalize-space(substring-before(($dnbBookdata//dc:title)[1], '/'))"/> |
| </xsl:otherwise> |
| </xsl:choose> |
| </xsl:variable> |
| <xsl:value-of select="normalize-space(replace($title-with-subtitles, '\|.*', ''))"/> |
| </xsl:variable> |
| |
| <xsl:variable name="erscheinungsort"> |
| <xsl:choose> |
| <xsl:when test="contains(($dnbBookdata//dc:publisher)[1], ':')"> |
| <xsl:value-of select="normalize-space(substring-before(($dnbBookdata//dc:publisher)[1], ':'))"/> |
| </xsl:when> |
| <xsl:otherwise> |
| <xsl:value-of select="normalize-space(($dnbBookdata//dc:publisher)[1])"/> |
| </xsl:otherwise> |
| </xsl:choose> |
| </xsl:variable> |
| |
| <xsl:variable name="texttype" select="replace(($dnbBookdata//dc:subject[matches(., '^[A-Z] ')])[1], '^[A-Z] (.*)', '$1')"/> |
| |
| <xsl:variable name="verlag"> |
| <xsl:choose> |
| <xsl:when test="contains(($dnbBookdata//dc:publisher)[1], ':')"> |
| <xsl:value-of select="normalize-space(substring-after(($dnbBookdata//dc:publisher)[1], ':'))"/> |
| </xsl:when> |
| <xsl:otherwise> |
| <xsl:value-of select="normalize-space(($dnbBookdata//dc:publisher)[1])"/> |
| </xsl:otherwise> |
| </xsl:choose> |
| </xsl:variable> |
| |
| <xsl:variable name="erscheinungsjahr"> |
| <xsl:choose> |
| <xsl:when test="dnbBookdata//dc:date[matches(normalize-space(.), '^[0-9]{4}$')]"> |
| <xsl:value-of select="$dnbBookdata//dc:date[matches(normalize-space(.), '^[0-9]{4}$')][1]"/> |
| </xsl:when> |
| <xsl:otherwise> |
| <xsl:value-of select="substring-before(($dnbBookdata//dc:date)[1], '-')"/> |
| </xsl:otherwise> |
| </xsl:choose> |
| </xsl:variable> |
| |
| <xsl:variable name="untertitel" |
| select="normalize-space(substring-after(substring-before(($dnbBookdata//dc:title)[1], '/'), ':'))"/> |
| |
| <xsl:variable name="herausgeber"> |
| <xsl:choose> |
| <xsl:when test="$dnbBookdata//dc:creator[ends-with(.,'[Hrsg.]')]"> |
| <xsl:value-of |
| select="replace(string-join($dnbBookdata//dc:creator[ends-with(.,'[Hrsg.]')][1], ' ; '),'\s?\[Hrsg.\]','')" |
| /> |
| </xsl:when> |
| <xsl:otherwise>.</xsl:otherwise> |
| </xsl:choose> |
| </xsl:variable> |
| |
| <xsl:variable name="straight_herausgeber" |
| select="replace(hlu:reversedAuthors($herausgeber), ',', '')"/> |
| |
| <xsl:variable name="j" select="$dnbBookdata//dc:date"/> |
| |
| <!-- for BOT+s: --> |
| <xsl:variable name="seiten" select="replace($dnbBookdata//dc:format,'S\.','')"/> |
| |
| <!-- fuer BOT+b: --> |
| <xsl:variable name="_b"> |
| <xsl:variable name="regexp1" select="'(Band|Bd\.)\s*([0-9]?[0-9]?[0-9])'"/> |
| <xsl:choose> |
| <xsl:when test="matches($dnbBookdata, $regexp1)"> |
| <xsl:analyze-string select="$dnbBookdata//dc:title" regex="{$regexp1}"> |
| <xsl:matching-substring> |
| <xsl:value-of select="."/> |
| </xsl:matching-substring> |
| </xsl:analyze-string> |
| </xsl:when> |
| <xsl:otherwise> |
| <xsl:value-of select="'.'"/> |
| </xsl:otherwise> |
| </xsl:choose> |
| </xsl:variable> |
| |
| <!-- for BOT+x: --> |
| <xsl:variable name="txtart"> |
| <xsl:choose> |
| <xsl:when test="$x"> |
| <xsl:value-of select="concat('[', $x, ']')"/> |
| </xsl:when> |
| <xsl:when |
| test="matches($untertitel, '([Rr]oman|[Ee]rzhlung(en)?|[Aa]nthologie|[Gg]eschichte(n)?|[Nn]ovelle)')"> |
| <xsl:value-of |
| select="concat('[', replace(replace($untertitel, '.*?(((^|\P{L})\p{L}+)?([Rr]oman|[Ee]rzhlung(en)?|[Aa]nthologie|[Gg]eschichte(n)?|[Nn]ovelle)).*', '$1'), '\P{L}*(.+)', '$1'), ']')" |
| /> |
| </xsl:when> |
| <xsl:otherwise> |
| <xsl:value-of>Roman</xsl:value-of> |
| </xsl:otherwise> |
| </xsl:choose> |
| </xsl:variable> |
| |
| |
| |
| <!-- fuer BOTd: --> |
| <xsl:variable name="dok" |
| select="concat((if(string-length($autor) > 0) then concat($straight_autor, ': ') else ''), $titel, ', ', $txtart, ', (', $j, ')')"/> |
| |
| <!-- END variables derived from sru request to dnb archive --> |
| |
| |
| <xsl:variable name="corpus_sigle" select="concat('DNB', substring($erscheinungsjahr, 3, 2))"/> |
| |
| <!-- for BOTD: --> |
| <!-- Dokumentsigle muss zusammen mit Korpussigle (z.B DIV fuer loz-div und loz-div-pub) eindeutig sein --> |
| <xsl:variable name="doc_sigle"> |
| <xsl:variable name="firstContentWordTitleInitial"> |
| <xsl:variable name="helper"> |
| <xsl:analyze-string select="$titel" regex="\w+"> |
| <xsl:matching-substring> |
| <xsl:choose> |
| <xsl:when |
| test="matches(.,'^[A-Z]') and not(matches(.,'^(Der|Die|Das|Des|Ein|Eine|Eines|Einmal|Von|Mit|Zu|Zurck)$'))"> |
| <!-- TODO: Fktnswoerter nachtragen --> |
| <xsl:sequence select="."/> |
| </xsl:when> |
| <xsl:otherwise/> |
| </xsl:choose> |
| </xsl:matching-substring> |
| </xsl:analyze-string> |
| </xsl:variable> |
| <xsl:value-of |
| select="upper-case(substring(normalize-space(replace($helper,'\s+.+$','')),1,1))"/> |
| <!-- longest match of .+ --> |
| </xsl:variable> |
| <xsl:choose> |
| <xsl:when test="contains($autor,';')"> |
| <xsl:variable name="lastname_aut1" |
| select="upper-case(substring(normalize-space(substring-before(substring-before($autor,';'),',')), 1, 1))"/> |
| <xsl:variable name="lastname_aut2" |
| select="upper-case(substring(normalize-space(substring-before(substring-before(substring-after($autor, ';'),';'),',')), 1, 1))"/> |
| <xsl:value-of select="concat($lastname_aut1, $lastname_aut2)"/> |
| </xsl:when> |
| <xsl:otherwise> |
| <xsl:variable name="lastname_aut1" |
| select="upper-case(substring(normalize-space(substring-before($autor,',')),1,1))"/> |
| <xsl:variable name="firstname_aut1" |
| select="upper-case(substring(normalize-space(substring-after($autor,',')),1,1))"/> |
| <xsl:value-of select="concat($lastname_aut1, $firstname_aut1)"/> |
| </xsl:otherwise> |
| </xsl:choose> |
| <xsl:value-of select="$firstContentWordTitleInitial"/> |
| </xsl:variable> |
| |
| |
| <xsl:variable name="text_sigle" select="substring($isbn, 8, 5)"/> |
| <xsl:variable name="sigle" select="concat($corpus_sigle, '/', $doc_sigle, '.', $text_sigle)"/> |
| |
| <!-- fuer BOT+xy: (?) --> |
| <xsl:variable name="xyref"> |
| <xsl:value-of select="document-uri(.)"/> |
| <xsl:text>; </xsl:text> |
| <xsl:text>ISBN:</xsl:text> |
| <xsl:value-of select="$isbn"/> |
| <xsl:text>; </xsl:text> |
| <xsl:value-of select="string-join($dnbBookdata//dc:identifier)"/> |
| </xsl:variable> |
| |
| <xsl:variable name="long-reference" |
| select="concat($sigle, ' ', $autor, ': ', $titel, '. ', $erscheinungsort, ': ', $verlag, ', ', $erscheinungsjahr)"/> |
| |
| <xsl:variable name="short-reference" |
| select="concat($straight_autor, ': ', $titel, ' (', $erscheinungsjahr, ')')"/> |
| |
| <xsl:template match="/"> |
| <idsDoc TEIform="TEI.2" type="text" version="1.0"> |
| <idsHeader TEIform="teiHeader" pattern="text" status="new" type="document" version="1.1"> |
| <fileDesc> |
| <titleStmt> |
| <dokumentSigle><xsl:value-of select="string-join(($corpus_sigle, $doc_sigle), '/')"/></dokumentSigle> |
| <d.title><xsl:value-of select="$short-reference"/></d.title> |
| </titleStmt> |
| <publicationStmt> |
| <distributor/> |
| <pubAddress/> |
| <availability region="world" status="unknown">QAO-NC</availability> |
| <pubDate/> |
| </publicationStmt> |
| <sourceDesc> |
| <biblStruct> |
| <monogr> |
| <h.title type="main"/> |
| <imprint/> |
| </monogr> |
| </biblStruct> |
| </sourceDesc> |
| </fileDesc> |
| </idsHeader> |
| <idsText version="1.0"> |
| <idsHeader TEIform="teiHeader" pattern="text" status="new" type="text" version="1.1"> |
| <fileDesc> |
| <titleStmt> |
| <textSigle><xsl:sequence select="$sigle"/></textSigle> |
| <t.title assemblage="regular"><xsl:value-of select="$long-reference"/></t.title> |
| </titleStmt> |
| <publicationStmt> |
| <distributor/> |
| <pubAddress/> |
| <availability region="world" status="unknown">QAO-NC</availability> |
| <pubDate/> |
| </publicationStmt> |
| <sourceDesc> |
| <biblStruct> |
| <monogr> |
| <h.title type="main"><xsl:value-of select="$titel"/></h.title> |
| <h.title type="sub"><xsl:value-of select="$untertitel"/></h.title> |
| <h.author><xsl:value-of select="$autor"/></h.author> |
| <editor/> |
| <edition> |
| <further/> |
| <kind>E-Book-Ausgabe</kind> |
| <appearance>EPUB-Datei</appearance> |
| </edition> |
| <imprint> |
| <publisher><xsl:value-of select="$verlag"/></publisher> |
| <pubDate type="year"><xsl:value-of select="$j"/></pubDate> |
| <pubDate type="month"/> |
| <pubDate type="day"/> |
| <pubPlace key="DE"><xsl:value-of select="$erscheinungsort"/></pubPlace> |
| </imprint> |
| <biblScope type="subsume"/> |
| <biblScope type="pp"/> |
| <biblScope type="vol"/> |
| <biblScope type="volume-title"/> |
| </monogr> |
| </biblStruct> |
| <reference assemblage="regular" type="complete"><xsl:value-of select="concat($sigle, ' ', $autor, ': ', $titel, '. ', $erscheinungsort, ': ', $verlag, ', ', $erscheinungsjahr)"/></reference> |
| </sourceDesc> |
| </fileDesc> |
| <profileDesc> |
| <creation> |
| <creatDate><xsl:value-of select="$j"/></creatDate> |
| </creation> |
| <textClass/> |
| <textDesc> |
| <textType><xsl:value-of select="$texttype"/></textType> |
| <textTypeRef><xsl:value-of select="$texttype"/></textTypeRef> |
| <textDomain/> |
| </textDesc> |
| </profileDesc> |
| </idsHeader> |
| <text> |
| <body> |
| <!-- Call the template for each link in the TOC |
| <xsl:apply-templates select="//xhtml:ol[@class='toc']/xhtml:li/xhtml:a" mode="collect"/> --> |
| <xsl:apply-templates select="//opf:package/opf:manifest/opf:item[matches(@href, '\.x?html$') and not(matches(@href, '(cover|toc|copyright|feedback|inhalt|nav|titlepage).*'))]" mode="collect"/> |
| </body> |
| </text> |
| </idsText> |
| </idsDoc> |
| </xsl:template> |
| |
| <xsl:template match="opf:item" mode="collect"> |
| <xsl:variable name="href" select="@href"/> |
| <xsl:message> |
| <xsl:text>converting: </xsl:text><xsl:value-of select="$href"/><xsl:text> </xsl:text><xsl:value-of select="$isbn"/> |
| </xsl:message> |
| <xsl:apply-templates select="doc(resolve-uri($href, base-uri()))/xhtml:html/xhtml:body"/> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:body"> |
| <div type="chapter"> |
| <xsl:apply-templates/> |
| </div> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:title"> |
| <head> |
| <xsl:apply-templates/> |
| </head> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:h1"> |
| <head> |
| <xsl:apply-templates/> |
| </head> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:h2|xhtml:h3"> |
| <head type="sub"> |
| <xsl:apply-templates/> |
| </head> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:em"> |
| <emph> |
| <xsl:apply-templates/> |
| </emph> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:span[matches(@class, '(bold|italic|big|kursiv| )+')]"> |
| <xsl:variable name="class" select="replace(@class, 'kursiv', 'italic')"/> |
| <hi rend="{$class}"> |
| <xsl:apply-templates/> |
| </hi> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:b"> |
| <hi rend="bold"> |
| <xsl:apply-templates/> |
| </hi> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:sub|xhtml:span[@class='sub']"> |
| <hi rend="sub"> |
| <xsl:apply-templates/> |
| </hi> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:sup|xhtml:span[@class='sup']"> |
| <hi rend="sup"> |
| <xsl:apply-templates/> |
| </hi> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:div"> |
| <div type="section"> |
| <xsl:apply-templates/> |
| </div> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:p"> |
| <p> |
| <xsl:apply-templates/> |
| </p> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:nav"> |
| <!-- <gap reason="toc"/> --> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:img"> |
| <!-- <gap reason="image"/> --> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:audio"> |
| <!-- <gap reason="audio"/> --> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:a"> |
| <ref target="{@href}"> |
| <xsl:apply-templates /> |
| </ref> |
| </xsl:template> |
| |
| <xsl:template match="xhtml:br"/> |
| |
| <xsl:template match="xhtml:*"> |
| <xsl:message> |
| <xsl:text>unhandled element: </xsl:text><xsl:value-of select="concat(name(), ' ', string-join(./@*[normalize-space(.) != '']/concat(name(), ':', ., ' '), '_'))"/> |
| </xsl:message> |
| <xsl:apply-templates/> |
| </xsl:template> |
| |
| <xsl:function name="ids:reversedAuthors"> |
| <xsl:param name="s" /> |
| <xsl:value-of |
| select=" |
| if (matches($s, ';')) then |
| concat(ids:reversedAuthors(substring-before($s, ' ; ')), ' ; ', ids:reversedAuthors(substring-after($s, ' ; '))) |
| else |
| replace($s, '(.+) (.+)', '$2, $1')" |
| /> |
| </xsl:function> |
| |
| <xsl:function name="hlu:reversedAuthors"> |
| <xsl:param name="s"/> |
| <xsl:value-of |
| select="if (matches($s, ';')) then concat(ids:reversedAuthors(substring-before($s, ' ; ')), ' ; ', ids:reversedAuthors(substring-after($s, ' ; '))) else replace($s, '(.+),(.+)', '$2, $1')" |
| /> |
| </xsl:function> |
| |
| </xsl:stylesheet> |