/usr/local/CPAN/XML-EP/XML/EP/Processor/XSLTParser.pm
################################################################################
#
# Perl module: XML::XSLT
#
# By Geert Josten, gjosten@sci.kun.nl
# and Egon Willighagen, egonw@sci.kun.nl
#
################################################################################
######################################################################
package XML::EP::Processor::XSLTParser;
######################################################################
use strict;
use XML::DOM;
use XML::DOM ();
use vars qw ( $_indent $_indent_incr $debug $warnings );
$_indent = 0;
$_indent_incr = 1;
sub new {
my $proto = shift;
my $parser = bless {@_}, (ref($proto) || $proto);
$parser->__add_default_templates__($parser->{xslDocument})
if $parser->{xslDocument};
$parser;
}
sub openproject {
my ($parser, $xmlfile, $xslfile) = @_;
my $domParser = XML::DOM::Parser->new();
$parser->{xslDocument} = $domParser->parsefile($xslfile);
$parser->{xmlDocument} = $domParser->parsefile($xmlfile);
$parser->__add_default_templates__($parser->{xslDocument});
}
sub process_project {
my ($parser) = @_;
$parser->{resultNode} = $parser->{xmlDocument}->createDocumentFragment();
my $root_template = $parser->_find_template ('/');
if ($root_template) {
$parser->_evaluate_template (
$root_template, # starting template, the root template
$parser->{xmlDocument}, # current XML node, the root
'', # current XML selection path, the root
$parser->{resultNode} # current result tree node, the root
);
}
$parser->{resultNode};
}
sub print_result {
my ($parser, $file) = @_;
my $output = $parser->{resultNode}->toString();
$output =~ s/\n\s*\n(\s*)\n/\n$1\n/g; # Substitute multiple empty lines by one
$output =~ s/\/\>/ \/\>/g; # Insert a space before all />
if ($file) {
print $file $output;
} else {
print $output;
}
}
######################################################################
sub __add_default_templates__ {
my $parser = shift;
# Add the default templates for match="/" and match="*" #
my $root_node = shift;
my $stylesheet = $root_node->getElementsByTagName('xsl:stylesheet',0)->item(0);
my $first_template = $stylesheet->getElementsByTagName('xsl:template',0)->item(0);
my $root_template = $root_node->createElement('xsl:template');
$root_template->setAttribute('match','/');
$root_template->appendChild ($root_node->createElement('xsl:apply-templates'));
$stylesheet->insertBefore($root_template,$first_template);
my $any_element_template = $root_node->createElement('xsl:template');
$any_element_template->setAttribute('match','*');
$any_element_template->appendChild ($root_node->createElement('xsl:apply-templates'));
$stylesheet->insertBefore($any_element_template,$first_template);
}
sub _find_template {
my $parser = shift;
my $current_xml_selection_path = shift;
my $attribute_name = shift;
$attribute_name = "match" unless defined $attribute_name;
print " "x$_indent,"searching template for \"$current_xml_selection_path\": " if $debug;
my $stylesheet = $parser->{xslDocument}->getElementsByTagName('xsl:stylesheet',0)->item(0);
my $templates = $stylesheet->getElementsByTagName('xsl:template',0);
for (my $i = ($templates->getLength - 1); $i >= 0; $i--) {
my $template = $templates->item($i);
my $template_attr_value = $template->getAttribute ($attribute_name);
if (&__template_matches__ ($template_attr_value, $current_xml_selection_path)) {
print "found #$i \"$template_attr_value\"$/" if $debug;
return $template;
}
}
print "no template found! $/" if $debug;
warn ("No template matching $current_xml_selection_path found !!$/") if $debug;
return "";
}
sub __template_matches__ {
my $template = shift;
my $path = shift;
if ($template ne $path) {
if ($path =~ /\/.*(\@\*|\@\w+)$/) {
# attribute selection #
my $attribute = $1;
return ($template eq "\@*" || $template eq $attribute);
} elsif ($path =~ /\/(\*|\w+)$/) {
# element selection #
my $element = $1;
return ($template eq "*" || $template eq $element);
} else {
return "";
}
} else {
return "True";
}
}
sub _evaluate_template {
my $parser = shift;
my $template = shift;
my $current_xml_node = shift;
my $current_xml_selection_path = shift;
my $current_result_node = shift;
print " "x$_indent,"evaluating template content for \"$current_xml_selection_path\": $/" if $debug;
$_indent += $_indent_incr;;
foreach my $child ($template->getChildNodes) {
my $ref = ref $child;
print " "x$_indent,"$ref$/" if $debug;
$_indent += $_indent_incr;
if ($child->getNodeType == ELEMENT_NODE) {
$parser->_evaluate_element ($child,
$current_xml_node,
$current_xml_selection_path,
$current_result_node);
} elsif ($child->getNodeType == TEXT_NODE) {
$parser->_add_node($child, $current_result_node);
} else {
my $name = $template->getTagName;
print " "x$_indent,"Cannot evaluate node $name of type $ref !$/" if $debug;
warn ("evaluate-template: Dunno what to do with node of type $ref !!! ($name; $current_xml_selection_path)$/") if $warnings;
}
$_indent -= $_indent_incr;
}
$_indent -= $_indent_incr;
}
sub _add_node {
my $parser = shift;
my $node = shift;
my $parent = shift;
my $deep = (shift || "");
my $owner = (shift || $parser->{'xmlDocument'});
if ($debug) {
print " "x$_indent,"adding (deep): " if $deep;
print " "x$_indent,"adding (non-deep): " if !$deep;
}
$node = $node->cloneNode($deep);
$node->setOwnerDocument($owner);
$parent->appendChild($node);
print "done$/" if $debug;
}
sub _apply_templates {
my $parser = shift;
my $current_xml_node = shift;
my $current_xml_selection_path = shift;
my $current_result_node = shift;
print " "x$_indent,"applying templates on children of \"$current_xml_selection_path\":$/" if $debug;
$_indent += $_indent_incr;
foreach my $child ($current_xml_node->getChildNodes) {
my $ref = ref $child;
print " "x$_indent,"$ref$/" if $debug;
$_indent += $_indent_incr;
my $child_xml_selection_path = $child->getNodeName;
$child_xml_selection_path = "$current_xml_selection_path/$child_xml_selection_path";
if ($child->getNodeType == ELEMENT_NODE) {
my $template = $parser->_find_template ($child_xml_selection_path);
if ($template) {
$parser->_evaluate_template ($template,
$child,
$child_xml_selection_path,
$current_result_node);
}
} elsif ($child->getNodeType == TEXT_NODE) {
$parser->_add_node($child, $current_result_node);
} elsif ($child->getNodeType == DOCUMENT_TYPE_NODE) {
# skip #
} elsif ($child->getNodeType == COMMENT_NODE) {
# skip #
} else {
print " "x$_indent,"Cannot apply templates on nodes of type $ref$/" if $debug;
warn ("apply-templates: Dunno what to do with nodes of type $ref !!! ($child_xml_selection_path)$/") if $warnings;
}
$_indent -= $_indent_incr;
}
$_indent -= $_indent_incr;
}
sub _evaluate_element {
my $parser = shift;
my $xsl_node = shift;
my $current_xml_node = shift;
my $current_xml_selection_path = shift;
my $current_result_node = shift;
my $xsl_tag = $xsl_node->getTagName;
print " "x$_indent,"evaluating element $xsl_tag for \"$current_xml_selection_path\": $/" if $debug;
$_indent += $_indent_incr;
if ($xsl_tag =~ /^xsl:/i) {
if ($xsl_tag =~ /^xsl:apply-templates/i) {
$parser->_apply_templates ($current_xml_node,
$current_xml_selection_path,
$current_result_node);
# } elsif ($xsl_tag =~ /^xsl:call-template/i) {
# } elsif ($xsl_tag =~ /^xsl:choose/i) {
# } elsif ($xsl_tag =~ /^xsl:for-each/i) {
# } elsif ($xsl_tag =~ /^xsl:include/i) {
# } elsif ($xsl_tag =~ /^xsl:output/i) {
# } elsif ($xsl_tag =~ /^xsl:processing-instruction/i) {
} elsif ($xsl_tag =~ /^xsl:value-of/i) {
$parser->_value_of ($xsl_node, $current_xml_node,
$current_xml_selection_path,
$current_result_node);
} else {
$parser->_add_and_recurse ($xsl_node, $current_xml_node,
$current_xml_selection_path,
$current_result_node);
}
} else {
$parser->_add_and_recurse ($xsl_node, $current_xml_node,
$current_xml_selection_path,
$current_result_node);
}
$_indent -= $_indent_incr;
}
sub _add_and_recurse {
my $parser = shift;
my $xsl_node = shift;
my $current_xml_node = shift;
my $current_xml_selection_path = shift;
my $current_result_node = shift;
$parser->_add_node ($xsl_node, $current_result_node);
$parser->_evaluate_template ($xsl_node,
$current_xml_node,
$current_xml_selection_path,
$current_result_node->getLastChild);
}
sub _value_of {
my($parser, $xsl_node, $xml_node, $current_path, $result_node) = @_;
my $path = $xsl_node->getAttribute('select');
my $start = ($path =~ /^\//) ?
$xml_node : $parser->{xmlDocument};
my $value = $parser->CollectValues($start, $path);
if ($value ne "") {
$result_node->appendChild($parser->{xmlDocument}->createTextNode($value));
}
}
sub CollectValues {
my($parser, $xmlNode, $path) = @_;
if ($path =~ s/^\/\///) {
# Beginning with the current node, start a recursive collection
return $parser->CollectValuesDeep($xmlNode, $path);
}
$path =~ s/^\///;
if ($path =~ s/^\.\.//) {
my $parent = $xmlNode->getParent();
return defined $parent ? $parser->CollectValues($parent, $path) : "";
}
if ($path =~ s/^\.//) {
return $parser->CollectValues($xmlNode, $path);
}
if ($path =~ s/^\@//) {
return "" unless $xmlNode->getNodeType() == XML::DOM::ELEMENT_NODE();
my $value = $xmlNode->getAttribute($path);
return defined $value ? $value : "";
}
if ($path =~ s/^([\w\-\:\.]+)(?:\[(\d+)\])?//) {
my $name = $1;
my $index = $2;
my @elements = $parser->FindElementsByName($xmlNode, $name);
if ($index) { @elements = @elements > $index ? $elements[$index] : () }
my $value = "";
foreach my $elem (@elements) {
$value .= $parser->CollectValues($elem, $path);
}
return $value;
}
return "" unless $path eq ""; # Dunno how to handle $path
$parser->ElemValue($xmlNode);
}
sub ElemValue {
my($parser, $node) = @_;
my $type = $node->getNodeType();
if ($type == XML::DOM::ATTRIBUTE_NODE() ||
$type == XML::DOM::TEXT_NODE() ||
$type == XML::DOM::CDATA_SECTION_NODE()) {
$node->getData();
} elsif ($type == XML::DOM::ELEMENT_NODE() ||
$type == XML::DOM::DOCUMENT_NODE() ||
$type == XML::DOM::DOCUMENT_FRAGMENT_NODE()) {
my $value = "";
for (my $child = $node->getFirstChild(); $child;
$child = $child->getNextSibling()) {
$value .= $parser->ElemValue($child);
}
$value;
}
}
sub FindElementsByName {
my($parser, $node, $name) = @_;
my @result;
for (my $child = $node->getFirstChild(); $child;
$child = $child->getNextSibling()) {
if ($child->getNodeType() == XML::DOM::ELEMENT_NODE()) {
push(@result, $child) if $child->getTagName() eq $name;
} elsif ($child->getNodeType() == XML::DOM::DOCUMENT_NODE() ||
$child->getNodeType() == XML::DOM::DOCUMENT_FRAGMENT_NODE()) {
push(@result, $parser->FindElementsByName($child, $name));
}
}
@result;
}
sub CollectValuesDeep {
my($parser, $xmlNode, $path) = @_;
my $values = $parser->CollectValues($xmlNode, $path);
for (my $child = $xmlNode->getFirstChild(); $child;
$child = $child->getNextSibling()) {
$values .= $child->CollectValues_deep($xmlNode, $path);
}
$values;
}
1;