From: kibigo! <redacted> Date: Mon, 1 Jan 2024 04:07:41 +0000 (-0500) Subject: Initial commit; minimal working implementation X-Git-Url: Initial commit; minimal working implementation

--- 61c43d3c26846f6415751c0c00848c3c2bc44829 diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..33687b1 --- /dev/null +++ b/.gitignore @@ -0,0 +1,2 @@ +/build +/public diff --git a/COPYING b/COPYING new file mode 100644 index 0000000..a612ad9 --- /dev/null +++ b/COPYING @@ -0,0 +1,373 @@ +Mozilla Public License Version 2.0 If a copy of the MPL was not distributed with this + file, You can obtain one at

If it is not possible or desirable to put the notice in a particular +file, then You may include the notice in a location (such as a LICENSE +file in a relevant directory) where a recipient would be likely to look +for such a notice.

You may add additional accurate notices of copyright ownership.

Exhibit B - "Incompatible With Secondary Licenses" Notice +---------------------------------------------------------

+ This Source Code Form is "Incompatible With Secondary Licenses", as + defined by the Mozilla Public License, v. 2.0. Beyond this, only programs │║ +║│ required by Posix are used, altho there is a chance of │║ +║│ version incompatibilities. The full list of program │║ +║│ requirements is as follows :— │║ +║│ │║ +║│ • cat │║ +║│ • cp │║ +║│ • echo │║ +║│ • file │║ +║│ • find │║ +║│ • mkdir (requires support for `-p´) │║ +║│ • mv │║ +║│ • printf │║ +║│ • sed │║ +║│ • test │║ +║│ • touch │║ +║│ • tr (requires support for `-d´) │║ +║│ • uuencode (requires support for `-m´ and `-r´) │║ +║│ • xmlcatalog (provided by libxml2) │║ +║│ • xmllint (provided by libxml2) │║ +║│ • xsltproc (provided by libxslt) │║ +║│ │║ +║│ In all cases, you can supply your own version of any │║ +║│ program `program´ by overriding the corresponding variable │║ +║│ `PROGRAM´ when calling Make. │║ +║╰────────────────────────────────────────────────────────────╯║ +╟┬ ¶ Usage ───────────────────────────────────────────────────┬╢ +║│ │║ +║│ • `make all´: Compile, but do not install, all files. │║ +║│ │║ +║│ • `make clean´: Remove `BUILDDIR´. │║ +║│ │║ +║│ • `make gone´: Remove installed files. │║ +║│ │║ +║│ • `make help´ (default): Print this message. │║ +║│ │║ +║│ • `make install´: Compile all files and install in │║ +║│ `DESTDIR´. │║ +║│ │║ +║│ • `make list´: List all recognized source files and their │║ +║│ classification (including media type and dependencies). │║ +║│ │║ +║│ Set `VERBOSE=1´ to see the text of commands as they are │║ +║│ executed. │║ +║│ │║ +║│ See `README.markdown´ for a more involved description of │║ +║│ the capabilities and configuration of this program. │║ +║╰────────────────────────────────────────────────────────────╯║ +╟┬ ¶ License ─────────────────────────────────────────────────┬╢ +║│ This Source Code Form is subject to the terms of the │║ +║│ Mozilla Public License, v 2.0. 
If a copy of the M·P·L was │║ +║│ not distributed with this file, You can obtain one at │║ +║│ <>. Instead, link or copy just the files you expect to need for +# your project. They may have multiple. Requiring it ensures that file classifications are +# up‐to‐date immediately after the reload. -d $(call quote,$1); then $(MKDIR) -p $(call quote,$1); fi Restarting…\0033[22m' Restarting…\0033[22m' Asset files +# are turned into H·T·M·L embeds pointing to `data:´ U·R·I's. This does not depend on actually transforming the files. quote,$(THISDIR)/lib/catalog2dependencies.xslt) $(call quote,$<) + $(silent)$(TOUCH) -A -000001 -am $(THISDIR)/GNUmakefile + +# Generate the main transform. +$(BUILDDIR)/transform.catalog: $(TRANSFORMS) + @$(ECHO) "Generating catalog of transforms…" + $(silent)$(XMLCATALOG) --create --noout $(call quote,$@) + $(foreach transform,$(TRANSFORMS),$(silent)$(XMLCATALOG) --add uri $(call quote,$(basename $(notdir $(transform)))) $(call quote,../$(transform)) --noout $(call quote,$@)$(newline)) +$(BUILDDIR)/transform.xslt: $(BUILDDIR)/transform.catalog $(THISDIR)/lib/catalog2transform.xslt + @$(ECHO) "Generating main transform…" + $(silent)$(XSLTPROC) -o $(call quote,$@) $(call quote,$(THISDIR)/lib/catalog2transform.xslt) $(call quote,$<) + +# Generate the output files using the dependencies as necessary. 
+$(call compiled,$(compilablefiles)): $(BUILDDIR)/public/%: $$(call parsed,$(SRCDIR)/%) $(BUILDDIR)/transform.xslt $$(call parsed,$$(call dependencies,$(SRCDIR)/%)) + $(silent)$(call ensuredirectory,$(dir $@)) + @$(PRINTF) '%s\n' $(call quote,Compiling `$*´…) + $(silent)$(XSLTPROC) -o $(call quote,$@) --stringparam catalog 'catalog' $(call quote,$(BUILDDIR)/transform.xslt) $(call quote,$<) +$(call compiled,$(filter $(assetfiles),$(sourcefiles))): $(BUILDDIR)/public/%: $(SRCDIR)/% + @$(PRINTF) '%s\n' $(call quote,Compiling `$*´…) + $(silent)$(call ensuredirectory,$(dir $@)) + $(silent)$(CP) $(call quote,$<) $(call quote,$@) + +# Install compiled files (or error in the case of recursive ones). +$(call installed,$(filter $(assetfiles),$(sourcefiles)) $(recursivefiles) $(compilablefiles)): $(DESTDIR)/%: $(BUILDDIR)/public/% + @$(PRINTF) '%s\n' $(call quote,Installing `$*´…) + $(silent)$(call ensuredirectory,$(dir $@)) + $(silent)$(CP) $(call quote,$<) $(call quote,$@) diff --git a/README.markdown b/README.markdown new file mode 100644 index 0000000..51aca8d --- /dev/null +++ b/README.markdown @@ -0,0 +1,323 @@ +# ⛩️📰 书社 + +<b>An X·S·L·T‐based static site generator.</b> +

<dfn>⛩️📰 书社</dfn> aims to make it easy to generate websites with + X·S·L·T and G·N·U Make. +It is consequently only a good choice for people who like X·S·L·T and + G·N·U Make and wish it were easier to make websites with them.

It makes things easier by :—

- Automatically identifying source files and characterizing them by + type (X·M·L, text, or asset).

- Parsing supported text types into X·M·L trees.

- Enabling easy inclusion of source files within each other.

It aims to do this with zero dependencies beyond the programs already + installed on your computer.

## Nomenclature

<i lang="cmn-Hans">书社</i> is a Chinese word meaning "publishing + house".

The first character, <i lang="cmn-Hans">书</i>, is the simplified form + of "document".

The second character, <i lang="cmn-Hans">社</i>, contemporarily means + "association", but historically referred to the god of the soil and + related altars or festivities. +In Japanese, it is an alternate spelling for <i lang="ja">やしろ</i>, + the word for "Shinto shrine".

The name <i lang="cmn-Hans">书社</i> was chosen to play on this pun, as + it is intended as a publishing program for webshrines.

In Ascii environments, ⛩️📰 书社 should be written `Shushe`, following + the pinyin transliteration.

## Basic Usage

Place source files in `sources/` and run `make install` to compile + the result to `public/`. +Compilation involves the following steps :—

1. ⛩️📰 书社 compiles all of the magic files in `magic/` into a single + file, `build/magic.mgc`.

2. ⛩️📰 书社 processes all of the parsers in `parsers/` and determines + the list of supported plaintext types.

3. ⛩️📰 书社 identifies all of the source files and includes and uses + `build/magic.mgc` to classify them by media type.

4. ⛩️📰 书社 parses all plaintext and X·M·L source files and includes + and then builds a dependency tree between them.

5. ⛩️📰 书社 uses the dependency tree to establish prerequisites for + each output file.

6. ⛩️📰 书社 compiles each output file to `build/public`.

7. ⛩️📰 书社 copies the output files to `public`.

You can use `make list` to list each identified source file or include + alongside its computed type and dependencies. +As this is a Make‐based program, steps will only be run if the + corresponding buildfile or output file is older than its + prerequisites.

## Namespaces

The ⛩️📰 书社 namespace is ``.

This document uses a few namespace prefixes, with the following + meanings :—

| Prefix | Expansion | +| -------: | :----------------------------------------- | +| `html:` | `` | +| `xlink:` | `` | +| `xslt:` | `` | +| `书社:` | `` |

## Setup and Configuration

⛩️📰 书社 depends on the following programs to run. +In every case, you may supply your own implementation by overriding the + corresponding (allcaps) variable (e·g, set `MKDIR` to supply your own + `mkdir` implementation).

- `cat` +- `cp` +- `echo` +- `file` +- `find` +- `mkdir` (requires support for `-p`) +- `mv` +- `printf` +- `sed` +- `test` +- `touch` +- `tr` (requires support for `-d`) +- `uuencode` (requires support for `-m` and `-r`) +- `xmlcatalog` (provided by `libxml2`) +- `xmllint` (provided by `libxml2`) +- `xsltproc` (provided by `libxslt`)

The following additional variables can be used to control the behaviour + of ⛩️📰 书社 :—

- **`SRCDIR`:** + The location of the source files (default: `sources`).

- **`INCLUDEDIR`:** + The location of the source includes (default: `sources/includes`). + This can be inside of `SRCDIR`, but needn't be.

- **`BUILDDIR`:** + The location of the (temporary) build directory (default: `build`).

- **`DESTDIR`:** + The location of the directory to output files to (default: `public`).

- **`THISDIR`:** + The location of the ⛩️📰 书社 `GNUmakefile`. + This should be set automatically when calling Make and shouldn't ever + need to be set manually. + This variable is used to find the ⛩️📰 书社 `lib/` folder, which is + expected to be in the same location.

- **`MAGICDIR`:** + The location of the magic files to use (default: `$(THISDIR)/magic`).

- **`FINDOPTS`:** + Options to pass to `find` when searching for source files (default: + `-LE`).

- **`FINDRULES`:** + Rules to use with `find` when searching for source files (default: + `-flags -nohidden -and -not -name '.*'`).

- **`PARSERS`:** + A white·space‐separated list of parsers to use (default: + `$(THISDIR)/parsers/*.xslt`).

- **`TRANSFORMS`:** + A white·space‐separated list of transforms to use (default: + `$(THISDIR)/transforms/*.xslt`).

- **`XMLTYPES`:** + A white·space‐separated list of media types to consider X·M·L + (default: `application/xml text/xml`).

- **`VERBOSE`:** + If this variable has a value, every recipe instruction will be + printed when it runs (default: empty). + This is helpful for debugging, but typically too noisy for general + usage.

## Source Files

Source files may be placed in `SRCDIR` in any manner; the file + structure used there will match the output. +The type of source files is *not* determined by file extension, but + rather by magic number; this means that files **must** begin with + something recognizable. +Supported magic numbers include :—

- `<?xml` for `application/xml` files +- `#!js` for `text/javascript` files +- `@charset "` for `text/css` files +- `#!tsv` for `text/tab-separated-values` files

Text formats with associated X·S·L·T parsers are wrapped in a H·T·M·L + `<script>` element whose `@type` gives its media type, and then + passed to the parser to process. +Source files whose media type does not have an associated X·S·L·T + parser are considered "assets" and will not be transformed.

For compatibility with this program, source filenames should conform to + the following rules :—

- They should not start with a hyphen‐minus. + This is to prevent confusion between filenames and options on the + commandline.

- They should not contain spaces, colons, percent signs, backticks, + question marks, hashes, or backslashes.

In general, filenames should be such that they do not require + percent‐encoding in the path component of an i·r·i.

## Parsers

Parsers are used to convert plaintext files into X·M·L trees, as well + as convert plaintext formats which are already included inline in + existing source X·M·L documents. +⛩️📰 书社 comes with some parsers; namely :—

- **`parsers/plain.xslt`:** + Wraps `text/plain` contents in a `<html:pre>` element.

- **`parsers/tsv.xslt`:** + Converts `text/tab-separated-values` contents into an `<html:table>` + element.

New ⛩️📰 书社 parsers should have a `<xslt:template>` element with no + `@name` or `@mode` and whose `@match` attribute…

- Starts with an appropriately‐namespaced qualified name for a + `<html:script>` element.

- Follows this with the string `[@type=`.

- Follows this with a quoted string giving a media type supported by + the parser. + Media type parameters are *not* supported.

- Follows this with the string `]`.

For example, the trivial `text/plain` parser is defined as follows :—

```xml +<?xml version="1.0"?> +<transform + xmlns="" + xmlns:html="" + version="1.0" +> + <template match="html:script[@type='text/plain']"> + <html:pre><value-of select="."/></html:pre> + </template> +</transform> +```

⛩️📰 书社 will scan the provided parsers for this pattern to determine + the set of allowed plaintext file types. +Multiple such `<xslt:template>` elements may be provided in a single + parser, for example if the parser supports multiple media types.

It is **strongly recommended** that all templates in parsers other than + those described above be namespaced (by `@name` or `@mode`), to avoid + conflicts between templates in multiple parsers.

## Embedding

Documents can be embedded in other documents using a `<书社:link>` + element with `@xlink:show="embed"`. +The `@xlink:href`s of these elements should have the format + `about:shushe?source=<path>`, where `<path>` provides the path to the + file within `SRCDIR`. +Includes, which do not generate outputs of their own but may still be + freely embedded, instead use the format + `about:shushe?include=<path>`, where `<path>` provides the path + within `INCLUDEDIR`.

Embeds are replaced with the parsed contents of a file, unless the file + is an asset, in which case an `<html:object>` element is produced + instead (with the contents of the asset file provided as a base64 + `data:` u·r·i).

Embedding takes place after parsing but before transformation, so + parsers are able to generate their own embeds. +⛩️📰 书社 is able to detect the transitive embed dependencies of files + and update them accordingly; it will signal an error if the + dependencies are recursive.

## Transforms

Transforms are used to convert X·M·L files into their final output, + after all necessary parsing and embedding has taken place. +⛩️📰 书社 comes with some transforms; namely :—

- **`transforms/asset.xslt`:** + Converts `<html:object type="text/css">` elements into corresponding + `<html:link rel="stylesheet">` elements and + `<html:object type="text/javascript">` elements into corresponding + `<html:script>` elements. + This transform enables embedding of `text/css` and `text/javascript` + files, which ordinarily are considered assets (as they lack + associated parsers).

- **`transforms/metadata.xslt`:** + Provides basic `<html:head>` metadata. + This metadata is generated from `<html:meta>` descendants of the + first element with an `@itemscope` attribute (recommended to just + be the root element). + Such elements can provide metadata using the following `@itemprop` + attributes :—

+ - **``:** + Provides the title of the page.

The following are recommendations on effective creation of + transforms :—

- Make template matchers as specific as possible. + It is likely an error if two transforms have templates which match + the same element (unless the templates have different priority).

- Namespace templates (with `@name` or `@mode`) whenever possible.

- Set `@exclude-result-prefixes` on the root `xslt:transform` element + to reduce the number of declared namespaces in the final result.

## Output Wrapping

⛩️📰 书社 will wrap the final output of the transforms in appropriate b/lib/catalog2dependencies.xslt @@ -0,0 +1,113 @@ +<?xml version="1.0"?> +<!-- +⁌ ⛩️📰 书社 ∷ lib/catalog2dependencies.xslt + +© 2023 Lady [@ Lady’s Computer] + +This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0. +If a copy of the M·P·L was not distributed with this file, You can obtain one at <>. +--> +<transform + xmlns="" + xmlns:catalog="urn:oasis:names:tc:entity:xmlns:xml:catalog" + xmlns:exsl="" + xmlns:xlink="" + xmlns:书社="" + version="1.0" +> + <variable name="uris" select="//catalog:uri"/> + <template name="书社:process-dependencies"> + <param name="processed"/> + <param name="unprocessed"/> + <variable name="queue"> + <copy-of select="exsl:node-set($unprocessed)/书社:dependency-root"/> + <for-each select="exsl:node-set($unprocessed)/书社:dependency"> + <if test="not((exsl:node-set($processed)/书社:*|preceding-sibling::书社:*|following-sibling::书社:recursive-dependency)[string()=string(current())])"> + <copy-of select="."/> + </if> + </for-each> + </variable> + <variable name="old"> + <copy-of select="exsl:node-set($processed)/书社:dependency-root"/> + <copy-of select="exsl:node-set($processed)/书社:recursive-dependency"/> + <for-each select="exsl:node-set($unprocessed)/书社:recursive-dependency"> + <if test="not((exsl:node-set($processed)/书社:recursive-dependency|preceding-sibling::书社:recursive-dependency)[string()=string(current())])"> + <copy-of select="."/> + </if> + </for-each> + <for-each select="exsl:node-set($processed)/书社:dependency"> + <if test="not(exsl:node-set($unprocessed)/书社:recursive-dependency[string()=string(current())])"> + <copy-of select="."/> + </if> + </for-each> + <copy-of select="$queue"/> + </variable> + <variable name="new"> + <for-each select="exsl:node-set($queue)/书社:*"> + <for-each select="$uris[@name=string(current()) and substring-after(@uri, '#')!='asset']"> + <variable name="parent" select="@name"/> + <for-each 
select="document(substring-before(@uri, '#'), .)//书社:link[@xlink:show='embed']"> + <if test="exsl:node-set($old)/书社:dependency-root[string()=string(current()/@xlink:href)]"> + <书社:recursive-dependency> + <value-of select="$parent"/> + </书社:recursive-dependency> + </if> + <if test="$uris/@name[string()=string(current()/@xlink:href)]"> + <书社:dependency> + <value-of select="@xlink:href"/> + </书社:dependency> + </if> + </for-each> + </for-each> + </for-each> + </variable> + <choose> + <when test="exsl:node-set($new)/书社:dependency"> + <call-template name="书社:process-dependencies"> + <with-param name="processed"> + <copy-of select="$old"/> + </with-param> + <with-param name="unprocessed"> + <copy-of select="$new"/> + </with-param> + </call-template> + </when> + <otherwise> + <copy-of select="$old"/> + </otherwise> + </choose> + </template> + <template match="catalog:uri" mode="书社:dependencies"> + <if test="substring-after(@uri, '#')!='asset'"> + <call-template name="书社:process-dependencies"> + <with-param name="unprocessed"> + <书社:dependency-root> + <value-of select="@name"/> + </书社:dependency-root> + </with-param> + </call-template> + </if> + </template> + <template match="/"> + <for-each select="$uris[not(substring-after(@uri, '#')='asset')]"> + <variable name="parent" select="@name"/> + <variable name="dependencies"> + <apply-templates select="." mode="书社:dependencies"/> + </variable> + <value-of select="@name"/> + <text>
</text> + <for-each select="exsl:node-set($dependencies)/书社:recursive-dependency"> + <text>	</text> + <text>!</text> + <value-of select="."/> + <text>
</text> + </for-each> + <for-each select="exsl:node-set($dependencies)/书社:dependency"> + <text>	</text> + <value-of select="."/> + <text>
</text> + </for-each> + </for-each> + </template> + <output method="text" encoding="UTF-8"/> +</transform> diff --git a/lib/catalog2parser.xslt b/lib/catalog2parser.xslt new file mode 100644 index 0000000..d044503 --- /dev/null +++ b/lib/catalog2parser.xslt @@ -0,0 +1,30 @@ +<?xml version="1.0"?> +<!-- +⁌ ⛩️📰 书社 ∷ lib/catalog2parser.xslt + +© 2023 Lady [@ Lady’s Computer] + +This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0. +If a copy of the M·P·L was not distributed with this file, You can obtain one at <>. +--> +<transform + xmlns="" + xmlns:catalog="urn:oasis:names:tc:entity:xmlns:xml:catalog" + xmlns:xsla="" + exclude-result-prefixes="catalog" + version="1.0" +> + <namespace-alias stylesheet-prefix="xsla" result-prefix="#default"/> + <template match="/"> + <xsla:transform version="1.0"> + <for-each select="//catalog:uri"> + <xsla:include href="{@uri}"/> + </for-each> + <xsla:template match="@*|node()" priority="-1"> + <xsla:copy> + <xsla:apply-templates select="@*|node()"/> + </xsla:copy> + </xsla:template> + </xsla:transform> + </template> +</transform> diff --git a/lib/catalog2transform.xslt b/lib/catalog2transform.xslt new file mode 100644 index 0000000..4a09235 --- /dev/null +++ b/lib/catalog2transform.xslt @@ -0,0 +1,84 @@ +<?xml version="1.0"?> +<!-- +⁌ ⛩️📰 书社 ∷ lib/catalog2transform.xslt + +© 2023 Lady [@ Lady’s Computer] + +This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0. +If a copy of the M·P·L was not distributed with this file, You can obtain one at <>. 
+--> +<transform + xmlns="" + xmlns:html="" + xmlns:catalog="urn:oasis:names:tc:entity:xmlns:xml:catalog" + xmlns:exsl="" + xmlns:xlink="" + xmlns:xslt="" + xmlns:书社="" + version="1.0" +> + <namespace-alias stylesheet-prefix="xslt" result-prefix="#default"/> + <template match="/"> + <xslt:transform exclude-result-prefixes="catalog exsl" version="1.0"> + <xslt:param name="catalog" select="'catalog'"/> + <for-each select="//catalog:uri"> + <xslt:include href="{@uri}"/> + </for-each> + <xslt:template match="/" priority="1"> + <xslt:variable name="expansion"> + <xslt:apply-templates select="." mode="书社:expand"/> + </xslt:variable> + <xslt:variable name="result"> + <xslt:apply-templates select="exsl:node-set($expansion)/*"/> + </xslt:variable> + <xslt:variable name="metadata"> + <xslt:copy-of select="exsl:node-set($result)/html:html/html:head/*"/> <!-- Keep children of an existing head: the names must carry the html: prefix, as unprefixed XPath names only match no-namespace elements. --> + <xslt:apply-templates select="exsl:node-set($result)" mode="书社:metadata"/> + </xslt:variable> + <html:html> + <xslt:copy-of select="exsl:node-set($result)/html:html/@*"/> + <html:head> + <xslt:copy-of select="exsl:node-set($result)/html:html/html:head/@*"/> + <html:title> + <xslt:for-each select="exsl:node-set($metadata)/html:title"> + <xslt:value-of select="."/> + </xslt:for-each> + </html:title> + <xslt:copy-of select="exsl:node-set($metadata)/*[not(self::html:title)]"/> + <xslt:if test="not(exsl:node-set($metadata)/html:meta[@name='generator'])"> + <html:meta name="generator" content="⛩️📰 书社"/> + </xslt:if> + </html:head> + <html:body> + <xslt:copy-of select="exsl:node-set($result)/*[not(self::html:html or self::html:body)]|exsl:node-set($result)/html:html/*[not(self::html:head or self::html:body)]|exsl:node-set($result)/html:html/html:body/*|exsl:node-set($result)/html:body/*"/> + </html:body> + </html:html> + </xslt:template> + <xslt:template match="@*|node()" priority="-1"> + <xslt:copy> + <xslt:apply-templates select="@*|node()"/> + </xslt:copy> + </xslt:template> + <xslt:template match="书社:link[@xlink:show='embed']" 
mode="书社:expand"> + <xslt:variable name="uri" select="substring-before(document($catalog)//catalog:uri[@name=current()/@xlink:href]/@uri[1], '#')"/> + <xslt:choose> + <xslt:when test="$uri"> + <xslt:apply-templates select="document($uri)" mode="书社:expand"/> + </xslt:when> + <xslt:otherwise> + <xslt:copy> + <xslt:apply-templates select="@*|node()" mode="书社:expand"/> + </xslt:copy> + </xslt:otherwise> + </xslt:choose> + </xslt:template> + <xslt:template match="@*|text()|*[not(self::书社:link) or not(@xlink:show='embed')]" mode="书社:expand"> + <xslt:copy> + <xslt:apply-templates select="@*|node()" mode="书社:expand"/> + </xslt:copy> + </xslt:template> + <xslt:template match="text()" mode="书社:metadata"/> + <xslt:output method="xml" encoding="UTF-8" cdata-section-elements="html:script html:style html:textarea"/> + </xslt:transform> + </template> +</transform> diff --git a/lib/parser2types.xslt b/lib/parser2types.xslt new file mode 100644 index 0000000..ee107e4 --- /dev/null +++ b/lib/parser2types.xslt @@ -0,0 +1,42 @@ +<?xml version="1.0"?> +<!-- +⁌ ⛩️📰 书社 ∷ lib/parser2types.xslt + +© 2023 Lady [@ Lady’s Computer] + +This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0. +If a copy of the M·P·L was not distributed with this file, You can obtain one at <>. 
+--> +<transform + xmlns="" + xmlns:catalog="urn:oasis:names:tc:entity:xmlns:xml:catalog" + xmlns:xslt="" + xmlns:书社="" + version="1.0" +> + <template match="/"> + <for-each select="//xslt:include"> + <for-each select="document(@href, .)//xslt:template[not(@name) and not(@mode)]"> + <variable name="match" select="@match"/> + <for-each select="namespace::*[local-name() and string()='']"> + <variable name="matchstart"> + <value-of select="local-name()"/> + <text>:</text> + <text>script[@type=</text> + </variable> + <if test="starts-with($match, $matchstart) and substring($match, string-length($match))=']' and contains($match, '/')"> + <variable name="inner" select="substring-before(substring-after($match, $matchstart), ']')"/> + <if test="starts-with($inner, '"') and substring($inner, string-length($inner))='"' or starts-with($inner, "'") and substring($inner, string-length($inner))="'""> + <variable name="type" select="substring($inner, 2, string-length($inner)-2)"/> + <if test="not(translate($type, '0123456789abcdefghijklmnopqrstuvwxyz!#$&-^_.+/', ''))"> + <value-of select="$type"/> + <text>
</text> + </if> + </if> + </if> + </for-each> + </for-each> + </for-each> + </template> + <output method="text" encoding="UTF-8"/> +</transform> diff --git a/magic/css b/magic/css new file mode 100644 index 0000000..24bbf5a --- /dev/null +++ b/magic/css @@ -0,0 +1,14 @@ +0 string /*css CSS text +!:mime text/css +!:strength + 255 + +0 string @charset\ " CSS text +!:mime text/css +!:strength + 255 + +0 byte 0xEF +>1 byte 0xBB +>>2 byte 0xBF +>>>3 string @charset\ " CSS text +!:mime text/css +!:strength + 255 diff --git a/magic/js b/magic/js new file mode 100644 index 0000000..971c95f --- /dev/null +++ b/magic/js @@ -0,0 +1,7 @@ +0 string #!js Javascript text +!:mime text/javascript +!:strength + 255 + +0 string #!javascript Javascript text +!:mime text/javascript +!:strength + 255 diff --git a/magic/tsv b/magic/tsv new file mode 100644 index 0000000..de72924 --- /dev/null +++ b/magic/tsv @@ -0,0 +1,10 @@ +0 string #!tsv TSV text +!:mime text/tab-separated-values +!:strength + 255 + +0 byte 0xEF +>1 byte 0xBB +>>2 byte 0xBF +>>>3 string #!tsv TSV text +!:mime text/tab-separated-values +!:strength + 255 diff --git a/magic/xml b/magic/xml new file mode 100644 index 0000000..d441701 --- /dev/null +++ b/magic/xml @@ -0,0 +1,10 @@ +0 string \<?xml XML data +!:mime application/xml +!:strength + 255 + +0 byte 0xEF +>1 byte 0xBB +>>2 byte 0xBF +>>>3 string \<?xml XML data +!:mime application/xml +!:strength + 255 diff --git a/parsers/plain.xslt b/parsers/plain.xslt new file mode 100644 index 0000000..0f61bfe --- /dev/null +++ b/parsers/plain.xslt @@ -0,0 +1,18 @@ +<?xml version="1.0"?> +<!-- +⁌ ⛩️📰 书社 ∷ parsers/plain.xslt + +© 2023 Lady [@ Lady’s Computer] + +This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0. +If a copy of the M·P·L was not distributed with this file, You can obtain one at <>. 
+--> +<transform + xmlns="" + xmlns:html="" + version="1.0" +> + <template match="html:script[@type='text/plain']"> + <html:pre><value-of select="."/></html:pre> + </template> +</transform> diff --git a/parsers/tsv.xslt b/parsers/tsv.xslt new file mode 100644 index 0000000..4de3b98 --- /dev/null +++ b/parsers/tsv.xslt @@ -0,0 +1,45 @@ +<?xml version="1.0"?> +<!-- +⁌ ⛩️📰 书社 ∷ parsers/tsv.xslt + +© 2023 Lady [@ Lady’s Computer] + +This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0. +If a copy of the M·P·L was not distributed with this file, You can obtain one at <>. +--> +<transform + xmlns="" + xmlns:exsl="" + xmlns:exslstr="" + xmlns:html="" + exclude-result-prefixes="exsl exslstr" + version="1.0" +> + <template match="html:script[@type='text/tab-separated-values']"> + <variable name="rows" select="exslstr:tokenize(., '
')[normalize-space(.) and not(starts-with(., '#'))]"/> + <variable name="head" select="exsl:node-set($rows)[1]"/> + <variable name="body" select="exsl:node-set($rows)[not(position()=1)]"/> + <html:table> + <html:thead> + <html:tr> + <for-each select="exslstr:tokenize($head, '	')"> + <html:th scope="col"> <!-- Each cell of the first row heads a column, so its scope is "col". --> + <value-of select="."/> + </html:th> + </for-each> + </html:tr> + </html:thead> + <html:tbody> + <for-each select="exsl:node-set($body)"> + <html:tr> + <for-each select="exslstr:tokenize(., '	')"> + <html:td> + <value-of select="."/> + </html:td> + </for-each> + </html:tr> + </for-each> + </html:tbody> + </html:table> + </template> +</transform> diff --git a/transforms/asset.xslt b/transforms/asset.xslt new file mode 100644 index 0000000..a85c891 --- /dev/null +++ b/transforms/asset.xslt @@ -0,0 +1,29 @@ +<?xml version="1.0"?> +<!-- +⁌ ⛩️📰 书社 ∷ transforms/asset.xslt + +© 2023 Lady [@ Lady’s Computer] + +This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0. +If a copy of the M·P·L was not distributed with this file, You can obtain one at <>. 
+--> +<transform + xmlns="" + xmlns:html="" + xmlns:书社="" + exclude-result-prefixes="书社" + version="1.0" +> + <template match="html:object[@type='text/css']"> + <comment> + <text>[书社:CSS] </text> + <value-of select="@data"/> + </comment> + </template> + <template match="comment()[starts-with(., '[书社:CSS] ')]" mode="书社:metadata"> + <html:link rel="stylesheet" type="text/css" href="{substring-after(., '[书社:CSS] ')}"/> + </template> + <template match="html:object[@type='text/javascript']"> + <html:script type="{@type}" src="{@data}"/> + </template> +</transform> diff --git a/transforms/metadata.xslt b/transforms/metadata.xslt new file mode 100644 index 0000000..d4be493 --- /dev/null +++ b/transforms/metadata.xslt @@ -0,0 +1,36 @@ +<?xml version="1.0"?> +<!-- +⁌ ⛩️📰 书社 ∷ transforms/metadata.xslt + +© 2023 Lady [@ Lady’s Computer] + +This Source Code Form is subject to the terms of the Mozilla Public License, v 2.0. +If a copy of the M·P·L was not distributed with this file, You can obtain one at <>. +--> +<transform + xmlns="" + xmlns:html="" + xmlns:书社="" + exclude-result-prefixes="书社" + version="1.0" +> + <template match="html:*[@itemscope][1]//html:meta[not(@name) and starts-with(@itemprop, '')]"> + <comment> + <text>[书社:META] </text> + <value-of select="substring-after(@itemprop, '')"/> + <text>: </text> + <value-of select="@content"/> + </comment> + </template> + <template match="comment()[starts-with(., '[书社:META] ')]" mode="书社:metadata"> + <variable name="property" select="substring-before(substring-after(., '[书社:META] '), ': ')"/> + <variable name="value" select="substring-after(., concat('[书社:META] ', $property, ': '))"/> + <choose> + <when test="$property='title'"> + <html:title> + <value-of select="$value"/> + </html:title> + </when> + </choose> + </template> +</transform>