]> Lady’s Gitweb - Shushe/blobdiff - lib/catalog2parser.xslt
Drop CKSUM and SRCTIME params; add as attributes
[Shushe] / lib / catalog2parser.xslt
index ead56da91dab9bd2916beda213937a7100703e2c..f3afd7fa945d8a763e30cbe22f792269910e290c 100644 (file)
@@ -1,8 +1,12 @@
 <?xml version="1.0"?>
 <!--
+SPDX-FileCopyrightText: 2023, 2024 Lady <https://www.ladys.computer/about/#lady>
+SPDX-License-Identifier: MPL-2.0
+-->
+<!--
 ⁌ ⛩️📰 书社 ∷ lib/catalog2parser.xslt
 
-© 2023–2024 Lady [@ Lady’s Computer]
+© 2023–2024 Lady [@ Lady’s Computer].
 
 This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0.
 If a copy of the M·P·L was not distributed with this file, You can obtain one at <https://mozilla.org/MPL/2.0/>.
@@ -10,17 +14,25 @@ If a copy of the M·P·L was not distributed with this file, You can obtain one
 <transform
        xmlns="http://www.w3.org/1999/XSL/Transform"
        xmlns:catalog="urn:oasis:names:tc:entity:xmlns:xml:catalog"
+       xmlns:exsl="http://exslt.org/common"
        xmlns:exslstr="http://exslt.org/strings"
        xmlns:html="http://www.w3.org/1999/xhtml"
+       xmlns:nfo="http://www.semanticdesktop.org/ontologies/2007/03/22/nfo#"
+       xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
        xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
        xmlns:xslt="http://www.w3.org/1999/XSL/TransformAlias"
        xmlns:书社="urn:fdc:ladys.computer:20231231:Shu1She4"
-       exclude-result-prefixes="catalog exslstr"
+       exclude-result-prefixes="catalog"
+       extension-element-prefixes="exslstr"
        version="1.0"
 >
        <namespace-alias stylesheet-prefix="xslt" result-prefix="#default"/>
        <template match="/">
-               <xslt:transform version="1.0">
+               <xslt:transform extension-element-prefixes="exsl" version="1.0">
+                       <xslt:param name="BUILDTIME" select="'1972-12-31T00:00:00Z'"/>
+                       <xslt:param name="IDENTIFIER" select="false()"/>
+                       <xslt:param name="SRCREV" select="false()"/>
+                       <xslt:param name="THISREV" select="false()"/>
                        <xslt:variable name="书社:parsers">
                                <html:dl>
                                        <for-each select="//catalog:uri">
@@ -76,11 +88,94 @@ If a copy of the M·P·L was not distributed with this file, You can obtain one
                                        </if>
                                </xslt:include>
                        </for-each>
+                       <xslt:template name="书社:apply-parsed-by">
+                               <xslt:param name="id"/>
+                               <xslt:param name="media-type"/>
+                               <xslt:param name="result" select="/.."/>
+                               <xslt:for-each select="$result/node()">
+                                       <xslt:choose>
+                                               <xslt:when test="self::*">
+                                                       <xslt:copy>
+                                                               <xslt:if test="string($id)!=''">
+                                                                       <xslt:attribute name="书社:parsed-by">
+                                                                               <xslt:value-of select="$id"/>
+                                                                               <xslt:if test="@书社:parsed-by">
+                                                                                       <xslt:text>
+                                                                                               <text> </text>
+                                                                                       </xslt:text>
+                                                                                       <xslt:value-of select="@书社:parsed-by"/>
+                                                                               </xslt:if>
+                                                                       </xslt:attribute>
+                                                               </xslt:if>
+                                                               <xslt:if test="string($media-type)!=''">
+                                                                       <xslt:attribute name="书社:media-type">
+                                                                               <xslt:value-of select="$media-type"/>
+                                                                       </xslt:attribute>
+                                                               </xslt:if>
+                                                               <xslt:copy-of select="@*[namespace-uri()!='urn:fdc:ladys.computer:20231231:Shu1She4' or local-name()!='parsed-by' and local-name()!='media-type']|node()"/>
+                                                       </xslt:copy>
+                                               </xslt:when>
+                                               <xslt:otherwise>
+                                                       <xslt:copy-of select="."/>
+                                               </xslt:otherwise>
+                                       </xslt:choose>
+                               </xslt:for-each>
+                       </xslt:template>
+                       <xslt:template match="/">
+                               <xslt:variable name="parsedroot">
+                                       <xslt:apply-templates select="node()" mode="书社:parse"/>
+                               </xslt:variable>
+                               <xslt:for-each select="exsl:node-set($parsedroot)/node()">
+                                       <xslt:choose>
+                                               <xslt:when test="self::*">
+                                                       <xslt:copy>
+                                                               <xslt:attribute name="书社:cksum">
+                                                                       <xslt:value-of select="document('metadata')//*[@rdf:about=$IDENTIFIER]/nfo:hasHash[@nfo:hashAlgorithm='CRC32']/@nfo:hashValue"/>
+                                                               </xslt:attribute>
+                                                               <xslt:attribute name="书社:identifier">
+                                                                       <xslt:value-of select="$IDENTIFIER"/>
+                                                               </xslt:attribute>
+                                                               <xslt:attribute name="书社:mtime">
+                                                                       <xslt:value-of select="document('metadata')//*[@rdf:about=$IDENTIFIER]/nfo:fileLastModified"/>
+                                                               </xslt:attribute>
+                                                               <xslt:copy-of select="@*[namespace-uri()!='urn:fdc:ladys.computer:20231231:Shu1She4' or not(contains(' cksum identifier mtime ', concat(' ', local-name(), ' ')))]|node()"/>
+                                                       </xslt:copy>
+                                               </xslt:when>
+                                               <xslt:otherwise>
+                                                       <xslt:copy-of select="."/>
+                                               </xslt:otherwise>
+                                       </xslt:choose>
+                               </xslt:for-each>
+                       </xslt:template>
                        <xslt:template match="@*|node()" priority="-1">
                                <xslt:copy>
-                                       <xslt:apply-templates select="@*|node()"/>
+                                       <xslt:apply-templates select="@*|node()" mode="书社:parse"/>
                                </xslt:copy>
                        </xslt:template>
+                       <xslt:template match="html:script[@type]" mode="书社:parse" priority="1">
+                               <xslt:variable name="parserdiv" select="exsl:node-set($书社:parsers)//html:div[html:dd=current()/@type]"/>
+                               <xslt:choose>
+                                       <xslt:when test="$parserdiv">
+                                               <xslt:variable name="result">
+                                                       <xslt:apply-templates select="."/>
+                                               </xslt:variable>
+                                               <xslt:variable name="reparsed-result">
+                                                       <xslt:apply-templates select="exsl:node-set($result)/node()" mode="书社:parse"/>
+                                               </xslt:variable>
+                                               <xslt:call-template name="书社:apply-parsed-by">
+                                                       <xslt:with-param name="id" select="string($parserdiv/html:dt)"/>
+                                                       <xslt:with-param name="media-type" select="string(@type)"/>
+                                                       <xslt:with-param name="result" select="exsl:node-set($reparsed-result)"/>
+                                               </xslt:call-template>
+                                       </xslt:when>
+                                       <xslt:otherwise>
+                                               <xslt:apply-templates select="."/>
+                                       </xslt:otherwise>
+                               </xslt:choose>
+                       </xslt:template>
+                       <xslt:template match="@*|node()" mode="书社:parse">
+                               <xslt:apply-templates select="."/>
+                       </xslt:template>
                </xslt:transform>
        </template>
        <output method="xml" encoding="UTF-8"/>
This page took 0.026082 seconds and 4 git commands to generate.