Support expanded archives in multi‐step data
[Shushe] / lib / catalog2parser.xslt
index f35fbc12572d8e87794c64131f13129194b7fd7f..a2eab127f482dd3915bec5b167a087f2cfd5ec0c 100644 (file)
@@ -1,8 +1,12 @@
 <?xml version="1.0"?>
 <!--
 <?xml version="1.0"?>
 <!--
-⁌ ⛩️📰 书社 ∷ lib/catalog2parser.xslt
+SPDX-FileCopyrightText: 2023, 2024 Lady <https://www.ladys.computer/about/#lady>
+SPDX-License-Identifier: MPL-2.0
+-->
+<!--
+⁌ ⛩📰 书社 ∷ lib/catalog2parser.xslt
 
 
-© 2023–2024 Lady [@ Lady’s Computer]
+© 2023–2024 Lady [@ Ladys Computer].
 
 This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0.
 If a copy of the M·P·L was not distributed with this file, You can obtain one at <https://mozilla.org/MPL/2.0/>.
 
 This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0.
 If a copy of the M·P·L was not distributed with this file, You can obtain one at <https://mozilla.org/MPL/2.0/>.
@@ -10,14 +14,71 @@ If a copy of the M·P·L was not distributed with this file, You can obtain one
 <transform
        xmlns="http://www.w3.org/1999/XSL/Transform"
        xmlns:catalog="urn:oasis:names:tc:entity:xmlns:xml:catalog"
 <transform
        xmlns="http://www.w3.org/1999/XSL/Transform"
        xmlns:catalog="urn:oasis:names:tc:entity:xmlns:xml:catalog"
+       xmlns:exsl="http://exslt.org/common"
+       xmlns:exslstr="http://exslt.org/strings"
+       xmlns:html="http://www.w3.org/1999/xhtml"
+       xmlns:nfo="http://www.semanticdesktop.org/ontologies/2007/03/22/nfo#"
+       xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
+       xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
        xmlns:xslt="http://www.w3.org/1999/XSL/TransformAlias"
        xmlns:书社="urn:fdc:ladys.computer:20231231:Shu1She4"
        exclude-result-prefixes="catalog"
        xmlns:xslt="http://www.w3.org/1999/XSL/TransformAlias"
        xmlns:书社="urn:fdc:ladys.computer:20231231:Shu1She4"
        exclude-result-prefixes="catalog"
+       extension-element-prefixes="exslstr"
        version="1.0"
 >
        <namespace-alias stylesheet-prefix="xslt" result-prefix="#default"/>
        <template match="/">
        version="1.0"
 >
        <namespace-alias stylesheet-prefix="xslt" result-prefix="#default"/>
        <template match="/">
-               <xslt:transform version="1.0">
+               <xslt:transform extension-element-prefixes="exsl" version="1.0">
+                       <xslt:param name="BUILDTIME" select="'1972-12-31T00:00:00Z'"/>
+                       <xslt:param name="IDENTIFIER" select="false()"/>
+                       <xslt:param name="SRCREV" select="false()"/>
+                       <xslt:param name="THISREV" select="false()"/>
+                       <xslt:variable name="书社:parsers">
+                               <html:dl>
+                                       <for-each select="//catalog:uri">
+                                               <variable name="parser" select="document(@uri, .)"/>
+                                               <html:div>
+                                                       <html:dt>
+                                                               <value-of select="@name"/>
+                                                       </html:dt>
+                                                       <choose>
+                                                               <when test="$parser/*/@书社:supported-media-types">
+                                                                       <for-each select="exslstr:tokenize($parser/*/@书社:supported-media-types)">
+                                                                               <if test="not(translate(., '0123456789abcdefghijklmnopqrstuvwxyz!#$&#x26;-^_.+/', ''))">
+                                                                                       <html:dd>
+                                                                                               <value-of select="."/>
+                                                                                       </html:dd>
+                                                                               </if>
+                                                                       </for-each>
+                                                               </when>
+                                                               <otherwise>
+                                                                       <for-each select="$parser//xsl:template[not(@name) and not(@mode)]">
+                                                                               <variable name="match" select="@match"/>
+                                                                               <for-each select="namespace::*[local-name() and string()='http://www.w3.org/1999/xhtml']">
+                                                                                       <variable name="matchstart">
+                                                                                               <value-of select="local-name()"/>
+                                                                                               <text>:</text>
+                                                                                               <text>script[@type=</text>
+                                                                                       </variable>
+                                                                                       <if test="starts-with($match, $matchstart) and substring($match, string-length($match))=']' and contains($match, '/')">
+                                                                                               <variable name="inner" select="substring-before(substring-after($match, $matchstart), ']')"/>
+                                                                                               <if test="starts-with($inner, '&#x22;') and substring($inner, string-length($inner))='&#x22;' or starts-with($inner, &#x22;'&#x22;) and substring($inner, string-length($inner))=&#x22;'&#x22;">
+                                                                                                       <variable name="type" select="substring($inner, 2, string-length($inner)-2)"/>
+                                                                                                       <if test="not(translate($type, '0123456789abcdefghijklmnopqrstuvwxyz!#$&#x26;-^_.+/', ''))">
+                                                                                                               <html:dd>
+                                                                                                                       <value-of select="$type"/>
+                                                                                                               </html:dd>
+                                                                                                       </if>
+                                                                                               </if>
+                                                                                       </if>
+                                                                               </for-each>
+                                                                       </for-each>
+                                                               </otherwise>
+                                                       </choose>
+                                               </html:div>
+                                       </for-each>
+                               </html:dl>
+                       </xslt:variable>
                        <for-each select="//catalog:uri">
                                <xslt:include href="{@uri}">
                                        <if test="contains(@name, ':')">
                        <for-each select="//catalog:uri">
                                <xslt:include href="{@uri}">
                                        <if test="contains(@name, ':')">
@@ -27,11 +88,71 @@ If a copy of the M·P·L was not distributed with this file, You can obtain one
                                        </if>
                                </xslt:include>
                        </for-each>
                                        </if>
                                </xslt:include>
                        </for-each>
+                       <xslt:template name="书社:apply-parsed-by">
+                               <xslt:param name="id"/>
+                               <xslt:param name="media-type"/>
+                               <xslt:param name="result" select="/.."/>
+                               <xslt:for-each select="$result/node()">
+                                       <xslt:choose>
+                                               <xslt:when test="self::*">
+                                                       <xslt:copy>
+                                                               <xslt:if test="string($id)!=''">
+                                                                       <xslt:attribute name="书社:parsed-by">
+                                                                               <xslt:value-of select="$id"/>
+                                                                               <xslt:if test="@书社:parsed-by">
+                                                                                       <xslt:text>
+                                                                                               <text> </text>
+                                                                                       </xslt:text>
+                                                                                       <xslt:value-of select="@书社:parsed-by"/>
+                                                                               </xslt:if>
+                                                                       </xslt:attribute>
+                                                               </xslt:if>
+                                                               <xslt:if test="string($media-type)!=''">
+                                                                       <xslt:attribute name="书社:media-type">
+                                                                               <xslt:value-of select="$media-type"/>
+                                                                       </xslt:attribute>
+                                                               </xslt:if>
+                                                               <xslt:copy-of select="@*[namespace-uri()!='urn:fdc:ladys.computer:20231231:Shu1She4' or local-name()!='parsed-by' and local-name()!='media-type']|node()"/>
+                                                       </xslt:copy>
+                                               </xslt:when>
+                                               <xslt:otherwise>
+                                                       <xslt:copy-of select="."/>
+                                               </xslt:otherwise>
+                                       </xslt:choose>
+                               </xslt:for-each>
+                       </xslt:template>
+                       <xslt:template match="/">
+                               <xslt:apply-templates select="node()" mode="书社:parse"/>
+                       </xslt:template>
                        <xslt:template match="@*|node()" priority="-1">
                                <xslt:copy>
                        <xslt:template match="@*|node()" priority="-1">
                                <xslt:copy>
-                                       <xslt:apply-templates select="@*|node()"/>
+                                       <xslt:apply-templates select="@*|node()" mode="书社:parse"/>
                                </xslt:copy>
                        </xslt:template>
                                </xslt:copy>
                        </xslt:template>
+                       <xslt:template match="html:script[@type]" mode="书社:parse" priority="1">
+                               <xslt:variable name="parserdiv" select="exsl:node-set($书社:parsers)//html:div[html:dd=current()/@type]"/>
+                               <xslt:choose>
+                                       <xslt:when test="$parserdiv">
+                                               <xslt:variable name="result">
+                                                       <xslt:apply-templates select="."/>
+                                               </xslt:variable>
+                                               <xslt:variable name="reparsed-result">
+                                                       <xslt:apply-templates select="exsl:node-set($result)/node()" mode="书社:parse"/>
+                                               </xslt:variable>
+                                               <xslt:call-template name="书社:apply-parsed-by">
+                                                       <xslt:with-param name="id" select="string($parserdiv/html:dt)"/>
+                                                       <xslt:with-param name="media-type" select="string(@type)"/>
+                                                       <xslt:with-param name="result" select="exsl:node-set($reparsed-result)"/>
+                                               </xslt:call-template>
+                                       </xslt:when>
+                                       <xslt:otherwise>
+                                               <xslt:apply-templates select="."/>
+                                       </xslt:otherwise>
+                               </xslt:choose>
+                       </xslt:template>
+                       <xslt:template match="@*|node()" mode="书社:parse">
+                               <xslt:apply-templates select="."/>
+                       </xslt:template>
                </xslt:transform>
        </template>
        <output method="xml" encoding="UTF-8"/>
                </xslt:transform>
        </template>
        <output method="xml" encoding="UTF-8"/>
This page took 0.031077 seconds and 4 git commands to generate.