Skip to content

Commit

Permalink
Some XProc for running XSpec (usnistgov#94)
Browse files Browse the repository at this point in the history
* Towards usnistgov#93: support for calling XSpec using XProc and bash scripting (calling XML Calabash under Maven), with batch processing.

Includes XProc and XSLT-based pipelines for executing XSpec as well as shell scripting and utility code. With aggregation capabilities and a new HTML format for XSpec results.
  • Loading branch information
wendellpiez authored Jan 30, 2024
1 parent a36144f commit 2515000
Show file tree
Hide file tree
Showing 25 changed files with 2,211 additions and 0 deletions.
11 changes: 11 additions & 0 deletions bin/metaschema-xslt
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,11 @@ Subcommands:
Generate converter transformations (XSLT) between JSON and XML for a given metaschema
- composition-validate METASCHEMA_XML [ADDITIONAL_ARGS]
Test metaschema composition (assembling modules and linking definitions) and report issues
- xpec-test XSPEC_XML [ADDITIONAL_ARGS]
Compile and run a (single) XSpec test set, producing a report in a folder named xspec
- xpec-batch [ADDITIONAL_ARGS]
Compile and run a collection of XSpec test sets, echoing a summary report to the console
Parameters: folder, pattern, stop-on-error (TODO: UPDATE ME)
EOF
}

Expand Down Expand Up @@ -69,6 +74,12 @@ case "$SUBCOMMAND" in
;;
composition-validate)
"$SRC_DIR"/validate/mvn-composition-validate-xpl.sh "$@"
;;
xspec-batch)
"$ROOT_DIR"/support/xspec-dev/mvn-saxon-xspec-batch.sh "$@"
;;
xspec-test)
"$ROOT_DIR"/support/xspec-dev/mvn-saxon-xspec-html.sh "$@"
;;
?)
msg "Unknown subcommand: $SUBCOMMAND"
Expand Down
25 changes: 25 additions & 0 deletions support/pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,10 @@
redirect. https://github.com/restlet/restlet-framework-java/issues/1390
-->
<repositories>
<repository>
<id>Maven Central</id>
<url>https://repo1.maven.org/maven2</url>
</repository>
<repository>
<id>maven.restlet.org</id>
<name>maven.restlet.org</name>
Expand All @@ -41,6 +45,27 @@
<artifactId>xmlcalabash</artifactId>
<version>1.5.3-110</version>
</dependency>

<!-- https://mvnrepository.com/artifact/org.nineml/coffeegrinder -->
<dependency>
<groupId>org.nineml</groupId>
<artifactId>coffeegrinder</artifactId>
<version>3.2.6</version>
<scope>runtime</scope>
</dependency>
<dependency>
<groupId>org.nineml</groupId>
<artifactId>coffeefilter</artifactId>
<version>3.2.6</version>
<scope>runtime</scope>
</dependency>
<dependency>
<groupId>org.nineml</groupId>
<artifactId>coffeesacks</artifactId>
<version>3.2.6</version>
<scope>runtime</scope>
</dependency>

</dependencies>

<build>
Expand Down
236 changes: 236 additions & 0 deletions support/xspec-dev/XSPEC-BATCH.xsl
Original file line number Diff line number Diff line change
@@ -0,0 +1,236 @@
<?xml version="1.0" encoding="UTF-8"?>
<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
xmlns:xs="http://www.w3.org/2001/XMLSchema"
xmlns:mx="http://csrc.nist.gov/ns/csd/metaschema-xslt"
xmlns:err="http://www.w3.org/2005/xqt-errors"
exclude-result-prefixes="#all"
version="3.0">


<!--Q: redirect STDERR so as not to see runtime messages in the console?
-->

<!--Main outputs are to be returned to console or file as plain text
Reports are written as side effects -->
<xsl:output method="text"/>

<!-- NOTE TO DEVS: this is the point of dependency on released XSpec
If the referenced code moves or changes, this XSLT must be adapted accordingly. -->
<xsl:param name="compiler-xslt-path" as="xs:string">../xspec/src/compiler/compile-xslt-tests.xsl</xsl:param>

<!-- in no mode, the imported stylesheet makes HTML reports from XSpec execution results -->
<xsl:import href="XSPEC-SINGLE.xsl"/>

<!--
call template "go" for the full effect - it will do its best
current impressions are that runtime is fast but no indication of memory consumption
for diagnostic info including paths to resources that the XSLT will use
(for reading and writing) use initial template "nogo"
Parameters:
$baseURI: a URI indicating runtime context - relative to which XSpecs are found
$folder: a folder, relative to baseURI - defaults to 'src'
hint - if you want your script to run in the current directory or any arbitrary directory
and wish to hardwire its location
and it's not inside ../../src (in which case designating $folder works)
set baseURI to the script's file: URI e.g. file:/mnt/c/Users/wap1/Documents/usnistgov/metaschema-xslt/support/xspec-dev/script.sh
(or to the folder with closing slash)
and folder to '.'
this parameterization is necessary so the XSLT can locate resource
even located elsewhere from where the script is called)
$pattern: glob-like syntax for file name matching
cf https://www.saxonica.com/html/documentation12/sourcedocs/collections/collection-directories.html '?select'
use a single file name for a single file
use (file1.xspec|file2.xspec|...|fileN.xspec) for file name literals (with URI escaping)
defaults to *.xspec (all files suffixed xspec)
$recurse (yes|no) identify files recursively - defaults to 'yes'
$stop-on-error (yes|no) hard stop on any failure, or keep going
does not stop if a test successfully runs and returns a false result
only if tests fail to run for any reason
default to 'hard'
$report-to - if ends in '.html', a single aggregated report is written to this path relative to baseURI
otherwise a non-empty $report-to results in each XSpec getting its own report written into a folder of that name
they will all be together and no precaution is taken for XSpecs with colliding names - take care
as Saxon will refuse (so rename one of the files or report in aggregate)
if $report is not given, no external reports are written
$theme works as it does in XSPEC-SINGLE.xsl (clean|classic|toybox|uswds)
results:
A failure to read, parse, compile or process any XSpec will drop it with warnings
unless $stop-on-error=yes in which case the run stops with an error condition
A run that completes delivers plain text results to -o or STDOUT
Depending on settings, XSpec reports are formatted and written out as HTML (single or multiple)
-->

<xsl:param name="baseURI" as="xs:string" select="resolve-uri('../..', static-base-uri())"/>

<xsl:param name="folder" as="xs:string">src</xsl:param>

<xsl:param name="pattern" as="xs:string">*.xspec</xsl:param>

<xsl:param name="recurse" as="xs:string">no</xsl:param>

<xsl:param name="report-to" as="xs:string?"/>
<!-- non-null values produce either a single HTML report, when ending in '.html'
or one report for each XSpec, to a separate file
nb memory usage may be heavy under the first scenario, untested! -->
<xsl:variable name="reporting" as="xs:boolean" select="boolean($report-to)"/>
<xsl:variable name="reporting-aggregate" as="xs:boolean" select="ends-with($report-to,'.html')"/>

<xsl:param name="stop-on-error" as="xs:string">no</xsl:param>
<xsl:variable name="stopping-on-error" as="xs:boolean" select="$stop-on-error=('yes','true')"/>


<xsl:variable name="collection-location" select="resolve-uri($folder, $baseURI)"/>

<xsl:variable name="collection-args" as="xs:string" expand-text="true">
<xsl:variable name="s">select={$pattern}</xsl:variable>
<xsl:variable name="r">recurse={ if ($recurse=('no','false')) then 'no' else 'yes' }</xsl:variable>
<xsl:variable name="e">on-error={ if ($stopping-on-error) then 'fail' else 'warning' }</xsl:variable>
<xsl:value-of select="($s,$r,$e,'metadata=yes') => string-join(';')"/>
</xsl:variable>

<xsl:variable name="collection-uri" select="($collection-location, $collection-args) => string-join('?')"/>

<xsl:variable name="collection-in" as="map(*)*">

<xsl:try select="collection( $collection-uri )">
<xsl:catch>
<xsl:message terminate="{ if ($stopping-on-error) then 'yes' else 'no' }" expand-text="true">ERROR: Unable to resolve collection at URI {$collection-uri} - getting {$err:code} '{$err:description}'</xsl:message>
</xsl:catch>
</xsl:try>
</xsl:variable>

<xsl:template name="nogo" expand-text="true">
<xsl:text>Param $baseURI is: { $baseURI }&#xA;</xsl:text>
<xsl:text>Static base URI is: { static-base-uri() }&#xA;</xsl:text>

</xsl:template>

<xsl:template name="go">
<!--<xsl:call-template name="report-locations"/>-->
<xsl:text expand-text="true">Acquiring collection from { $collection-uri }&#xA;</xsl:text>

<xsl:variable name="all-compiled" as="document-node()*">
<xsl:iterate select="$collection-in">
<xsl:variable name="my" as="map(*)" select="."/>
<!-- we could execute $my?fetch(), except it has the wrong static context and does not produce
a viable (self-executing) XSLT stylesheet as the compiled results -
the path to the XSLT being tested is broken.
Accordingly, we use collection() only to get our name list, then compile
each XSpec from its own context. -->
<xsl:try select="$my?name => xs:anyURI() => mx:compile-xspec-at-uri()">
<xsl:catch>
<xsl:message terminate="{ if ($stopping-on-error) then 'yes' else 'no' }" expand-text="true">ERROR: Unable to compile XSpec at { $my?name } - getting {$err:code} '{$err:description}'</xsl:message>
</xsl:catch>
</xsl:try>
</xsl:iterate>
</xsl:variable>
<xsl:variable name="all-executed" as="document-node()*">
<xsl:iterate select="$all-compiled">
<xsl:try select="mx:execute-xspec(.)">
<xsl:catch>
<!--<xsl:variable name="Q{http://www.jenitennison.com/xslt/xspec}xspec-uri"-->
<xsl:message terminate="{ if ($stopping-on-error) then 'yes' else 'no' }" expand-text="true">ERROR:
Unable to execute compiled XSpec from { /*/xsl:variable[@name='Q{{http://www.jenitennison.com/xslt/xspec}}xspec-uri'] } - getting {$err:code}
'{$err:description}'</xsl:message>
</xsl:catch>
</xsl:try>
</xsl:iterate>
</xsl:variable>
<xsl:variable name="aggregated-results" as="document-node()">
<xsl:document>
<RESULTS>
<xsl:sequence select="$all-executed"/>
</RESULTS>
</xsl:document>
</xsl:variable>

<xsl:apply-templates select="$aggregated-results/RESULTS" mode="emit-reports"/>

<!-- An aggregated report is produced for -o or STDOUT using transformations xspec-summarize.xsl and xspec-summary-reduce.xsl over $aggregated-results -->
<xsl:sequence select="$aggregated-results => mx:transform-with(xs:anyURI('xspec-summarize.xsl')) => mx:transform-with(xs:anyURI('xspec-summary-reduce.xsl'))"/>

<!-- As extra, we report if we can see that tests were dropped along the way - this goes into main output,
post summary, not the message stream -->
<xsl:variable name="reported-xspecs" select="$aggregated-results/RESULTS/*/@xspec"/>
<xsl:variable name="dropped" select="$collection-in[not(.?name = $reported-xspecs)]"/>
<xsl:if test="exists($dropped)" expand-text="true">
<xsl:text>WARNING: of { count($collection-in) } { if (count($collection-in)=1) then 'file' else 'files' }, { count($dropped) } { if (count($dropped) = 1) then 'file selected was' else 'were' } dropped - either unavailable, would not compile (XSpec to XSLT), or would not execute (XSLT):&#xA;</xsl:text>
<xsl:text expand-text="true"> { $dropped?name => string-join(',&#xA; ') }&#xA;</xsl:text>
</xsl:if>

</xsl:template>

<xsl:template priority="101" match="RESULTS[not($reporting)]" mode="emit-reports"/>

<xsl:template priority="99" match="RESULTS[$reporting-aggregate]" mode="emit-reports">
<xsl:call-template name="write-html-file">
<xsl:with-param name="filename" select="resolve-uri($report-to,$collection-location)"/>
<!-- nb in this application, html is in no namespace -->
<xsl:with-param name="payload" as="element(html)">
<xsl:call-template name="html-report"/>
</xsl:with-param>
</xsl:call-template>
</xsl:template>

<xsl:template priority="91" match="RESULTS" mode="emit-reports">
<xsl:apply-templates mode="produce-html" select="*"/>
</xsl:template>

<xsl:template mode="produce-html" match="x:report" xmlns:x="http://www.jenitennison.com/xslt/xspec">
<!--xspec="file:/C:/Users/wap1/Documents/usnistgov/metaschema-xslt/support/xspec-dev/xspec-shell.xspec"-->

<xsl:variable name="xspec-basename" select="@xspec => replace('.*/', '') => replace('\.[^.]*$', '')"/>
<xsl:variable name="html-filename" expand-text="true">{$report-to}/{$xspec-basename}.html</xsl:variable>
<xsl:variable name="write-to" select="resolve-uri($html-filename, $collection-location)"/>

<xsl:call-template name="write-html-file">
<xsl:with-param name="filename" select="$write-to"/>
<xsl:with-param name="payload" as="element(html)">
<xsl:call-template name="html-report"/>
</xsl:with-param>
</xsl:call-template>
</xsl:template>

<xsl:template name="write-html-file">
<xsl:param name="filename" as="xs:anyURI"/>
<xsl:param name="payload" as="element(html)"/>
<xsl:message expand-text="true">Writing report {$filename} ...</xsl:message>
<xsl:result-document href="{$filename}" method="html" html-version="5.0" indent="yes">
<xsl:sequence select="$payload"/>
</xsl:result-document>
</xsl:template>

<xsl:function name="mx:compile-xspec-at-uri" as="document-node()?" cache="true">
<xsl:param name="xspec-uri" as="xs:anyURI"/>
<xsl:sequence select="doc($xspec-uri) => mx:compile-xspec()"/>
</xsl:function>

<xsl:function name="mx:transform-with" as="document-node()?" cache="true">
<xsl:param name="source" as="document-node()"/>
<xsl:param name="stylesheet-location" as="xs:anyURI"/>

<xsl:variable name="runtime-params" as="map(xs:QName,item()*)">
<xsl:map/>
</xsl:variable>
<xsl:variable name="runtime" as="map(xs:string, item())">
<!-- call template t:main xmlns:t="http://www.jenitennison.com/xslt/xspec"-->
<xsl:map>
<xsl:map-entry key="'xslt-version'" select="3.0"/>
<xsl:map-entry key="'source-node'" select="$source"/>
<xsl:map-entry key="'stylesheet-location'" select="$stylesheet-location"/>
<xsl:map-entry key="'stylesheet-params'" select="$runtime-params"/>
</xsl:map>
</xsl:variable>
<xsl:sequence select="transform($runtime)?output"/>
</xsl:function>


</xsl:stylesheet>
Loading

0 comments on commit 2515000

Please sign in to comment.