
59 lines
2.3 KiB
Raw Permalink Normal View History

2023-04-27 12:08:25 -04:00
<?xml version="1.0" encoding="UTF-8"?>
<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
exclude-result-prefixes="xs math"
<!-- <xsl:output method="xhtml" html-version="5" omit-xml-declaration="yes"
include-content-type="no" indent="yes"/>-->
<!-- 2023-04-27 ebb: This is XSLT Stage 1: fixing paragraphs in the XML.
It is an XML-to-XML identity transformation, leaving the files intact but adding paragraph markup where it is missing. -->
<xsl:variable name="conspiracy" as="document-node()+" select="collection('../regexConspTest')"/>
<xsl:mode on-no-match="shallow-copy"/>
<xsl:template match="/">
2023-04-28 02:15:04 -04:00
2023-04-27 12:08:25 -04:00
<xsl:for-each select="$conspiracy">
<xsl:variable name="filename" as="xs:string" select="current() ! base-uri() ! tokenize(., '/')[last()]"/>
<xsl:result-document method="xml" indent="yes" href="../pre-src-xml/{$filename}">
2023-04-28 02:15:04 -04:00
<!-- 2023-04-28 ebb: Corrected xml root element to sit inside the individual documents. -->
2023-04-27 12:08:25 -04:00
<xsl:when test="count(descendant::p) gt 1">
<div class="article"><xsl:apply-templates select=".//p" mode="multiparagraph"/></div>
<xsl:apply-templates select=".//p"/>
2023-04-28 02:15:04 -04:00
2023-04-27 13:30:47 -04:00
2023-04-27 12:08:25 -04:00
<xsl:template match="p" mode="multiparagraph">
<xsl:template match="p">
<div class="article">
<xsl:analyze-string select="." regex="(.+?)\n\n" flags="s">
<p><xsl:value-of select="regex-group(1)"/></p>
<!-- If we wanted to save the \n\n we could, but why? <xsl:non-matching-substring>
<xsl:value-of select="."/>