# $Id: XSP.pm,v 1.45.2.1 2003/07/28 22:51:19 matts Exp $ package Apache::AxKit::Language::XSP; use strict; use AxKit; use Apache::AxKit::Language; use Apache::Request; use Apache::AxKit::Exception; use Apache::AxKit::Cache; use Fcntl; BEGIN { $INC{'utf8.pm'}++ if $] < 5.006 } use utf8; use vars qw/@ISA/; @ISA = ('Apache::AxKit::Language'); sub stylesheet_exists () { 0; } sub get_mtime { return 30; # 30 days in the cache? } my $cache; # useful for debugging - not actually used by AxKit: # sub get_code { # my $filename = shift; # # # cannot register - no $AxKit::Cfg... # # _register_me_and_others(); # __PACKAGE__->register(); # # my $package = get_package_name($filename); # my $parser = get_parser($package, $filename); # return $parser->parsefile($filename); # } sub handler { my $class = shift; my ($r, $xml, undef, $last_in_chain) = @_; _register_me_and_others(); # warn "XSP Parse: $xmlfile\n"; my $key = $xml->key(); my $package = get_package_name($key); my $handler = AxKit::XSP::SAXHandler->new_handler( XSP_Package => $package, XSP_Line => $key, XSP_Debug => 0, ); my $parser = AxKit::XSP::SAXParser->new( provider => $xml, Handler => $handler, ); local $Apache::AxKit::Language::XSP::ResNamespaces = $r->dir_config('XSPResNamespaces'); my $to_eval; eval { if (my $dom_tree = $r->pnotes('dom_tree')) { AxKit::Debug(5, 'XSP: parsing dom_tree'); $to_eval = $parser->parse($dom_tree); delete $r->pnotes()->{'dom_tree'}; } elsif (my $xmlstr = $r->pnotes('xml_string')) { if ($r->no_cache() || !defined &{"${package}::xml_generator"}) { AxKit::Debug(5, 'XSP: parsing xml_string'); $to_eval = $parser->parse($xmlstr); } else { AxKit::Debug(5, 'XSP: not reparsing xml_string (cached)'); } } else { my $xcache = Apache::AxKit::Cache->new($r, $package, 'compiled XSP'); # check mtime. my $mtime = $xml->mtime(); no strict 'refs'; if (exists($cache->{$key}) && !$xml->has_changed($cache->{$key}{mtime}) && defined &{"${package}::xml_generator"} ) { # cached AxKit::Debug(5, 'XSP: xsp script cached in memory'); } elsif (!$xml->has_changed($xcache->mtime())) { AxKit::Debug(5, 'XSP: xsp script cached on disk'); $to_eval = $xcache->read(); } else { AxKit::Debug(5, 'XSP: parsing fh'); $to_eval = eval { $parser->parse($xml->get_fh()); } || $parser->parse(${ $xml->get_strref() }); $cache->{$key}{mtime} = $mtime; $xcache->write($to_eval); } } }; if ($@) { throw Apache::AxKit::Exception::Error( -text => "Parse of '$key' failed: $@" ); } if ($to_eval) { eval { require Perl::Tidy; AxKit::Debug(5,'Running PerlTidy...'); my $errors; my $res; Perl::Tidy::perltidy( source => \$to_eval, destination => \$res, stderr => \$errors, argv => '-se -npro -f -nsyn -pt=2 -sbt=2 -csc -csce=2 -vt=1 -lp -cab=3 -iob'); if ($errors) { AxKit::Debug(1,"PerlTidy warnings: $errors"); } else { AxKit::Debug(5,"PerlTidy successful"); } $to_eval = $res; } if $AxKit::Cfg->DebugTidy; AxKit::Debug(1,"AxDebugTidy unavailable for Perl code: $@") if $@; if (my $ti = $AxKit::Cfg->TraceIntermediate) { my $interm_prefix = $r->uri; $interm_prefix =~ s{%}{%25}g; $interm_prefix =~ s{/}{%2f}g; $interm_prefix =~ s/[^0-9a-zA-Z.,_|-]/_/g; $interm_prefix = $ti.'/'.$interm_prefix; if (!-d $ti) { if (!mkdir($ti, 0777)) { AxKit::Debug(1, "Can't create AxTraceIntermediate directory '$ti': $!"); } } my $fh = Apache->gensym(); # this is duplicated work: the cache has it as well, but with a # different filename and hard to find. if (AxKit::open($fh, '>'.$interm_prefix.'.XSP')) { print($fh $to_eval); } else { AxKit::Debug(1,"could not open $interm_prefix.XSP for writing: $!"); } } undef &{"${package}::xml_generator"}; AxKit::Debug(5, 'Recompiling XSP script'); AxKit::Debug(10, $to_eval); eval $to_eval; if ($@) { my $line = 1; $to_eval =~ s/\n/"\n".++$line." "/eg; warn("Script:\n1 $to_eval\n"); throw Apache::AxKit::Exception::Error( -text => "Compilation failed: $@" ); } AxKit::Debug(5, 'XSP Compilation finished'); } no strict 'refs'; # make sure we use inheritance to get this my $cv = $package->can('handler'); my $cgi = Apache::Request->instance($r); $r->no_cache(1); my $xsp_cache = Apache::AxKit::Cache->new($r, $package, $package->cache_params($r, $cgi)); if (!$package->has_changed($xsp_cache->mtime()) && !$xml->has_changed($xsp_cache->mtime())) { AxKit::Debug(3, "XSP results cached"); $r->print($xsp_cache->read); return; } my $dom = XML::LibXML::Document->createDocument("1.0", "UTF-8"); my $rc = eval { $package->$cv($r, $cgi, $dom); }; if ($@) { die $@ if (ref($@)); if ($to_eval) { my $line = 1; $to_eval =~ s/\n/"\n".++$line." "/eg; warn("Script:\n1 $to_eval\n"); } throw Apache::AxKit::Exception::Error( -text => "Execution failed: $@" ); } $r->pnotes('dom_tree', $dom); $r->print($dom->toString) if $last_in_chain; $xsp_cache->write( $dom->toString ); return $rc; } sub register { my $class = shift; no strict 'refs'; $class->register_taglib(${"${class}::NS"}); } sub _register_me_and_others { # warn "Loading taglibs\n"; foreach my $package ($AxKit::Cfg->XSPTaglibs()) { # warn "Registering taglib: $package\n"; AxKit::load_module($package); $package->register(); } } sub register_taglib { my $class = shift; my $namespace = shift; # warn "Register taglib: $namespace => $class\n"; $Apache::AxKit::Language::XSP::tag_lib{$namespace} = $class; } sub is_xsp_namespace { my ($ns) = @_; # a uri of the form "res:perl/" turns into an implicit loading of # the module indicated by (after slashes are turned into # double-colons). an example uri is "res:perl/My/Cool/Module". if ($Apache::AxKit::Language::XSP::ResNamespaces && $ns =~ m/^res:perl\/(.*)$/) { my $package = $1; $package =~ s/\//::/g; AxKit::load_module($package); $package->register(); } return 1 if $ns && $Apache::AxKit::Language::XSP::tag_lib{$ns}; } sub get_package_name { my $filename = shift; # Escape everything into valid perl identifiers $filename =~ s/([^A-Za-z0-9_\/])/sprintf("_%2x",unpack("C",$1))/eg; # second pass cares for slashes and words starting with a digit $filename =~ s{ (/+) # directory (\d?) # package's first character }[ "::" . (length $2 ? sprintf("_%2x",unpack("C",$2)) : "") ]egx; return "Apache::AxKit::Language::XSP::ROOT$filename"; } sub makeSingleQuoted($) { my $value = shift; $value =~ s/([\\|])/\\$1/g; return 'q|'.$value.'|'; } ############################################################ # SAX Handler code ############################################################ package AxKit::XSP::SAXHandler; sub new_handler { my ($type, %self) = @_; return bless \%self, $type; } sub start_expr { my ($e) = @_; my $element = { Name => "expr", NamespaceURI => $AxKit::XSP::Core::NS, Attributes => [ ], Parent => $e->{Current_Element}->{Parent}, # OldParent => $e->{Current_Element}, }; # warn "start_expr: $e->{Current_Element}->{Name}\n"; $e->start_element($element); } sub end_expr { my ($e) = @_; my $parent = $e->{Current_Element}->{Parent}; my $element = { Name => "expr", NamespaceURI => $AxKit::XSP::Core::NS, Attributes => [ ], Parent => $parent, }; # warn "end_expr: $parent->{Name}\n"; $e->end_element($element); } sub append_to_script { my ($e, $code) = @_; my (undef, $file, $line) = caller; $e->{XSP_Script} .= $e->location_debug_string($file,$line).$code; } sub manage_text { my ($e, $set, $go_back) = @_; $go_back ||= 0; my $depth = $e->depth(); if (defined($set) && $set >= 0) { $e->{XSP_Manage_Text}[$depth - $go_back] = $set; } else { if (defined($set) && $set == -1) { # called from characters handler, rather than expr return $e->{XSP_Manage_Text}[$depth]; } return $e->{XSP_Manage_Text}[$depth - 1]; } } sub depth { my ($e) = @_; my $element = $e->{Current_Element}; my $depth = 0; while ($element = $element->{Parent}) { $depth++; } return $depth; } sub current_element { my $e = shift; my $tag = $e->{Current_Element}{Name}; $tag =~ s/^(.*:)//; return $tag; } sub location_debug_string { my ($e, $file, $line) = @_; return '' if !$e->{XSP_Debug} || $file =~ m/^AxKit::XSP::Core::/; (undef, $file, $line) = caller if (@_ < 3); $file =~ s/"/''/; $file =~ s/\n/ /; return "\n# line $line \"XSP generated by $file\"\n"; } sub start_document { my $e = shift; $e->{XSP_chars} = 0; $e->{XSP_Script} = join("\n", $e->location_debug_string, "package $e->{XSP_Package};", "use Apache;", "use Apache::Constants qw(:common);", "use XML::LibXML;", "Apache::AxKit::Language::XSP::Page->import( qw(__mk_text_node __mk_comment_node __mk_ns_element_node __mk_element_node) );", ($] >= 5.008?"use utf8;":""), ); foreach my $ns (keys %Apache::AxKit::Language::XSP::tag_lib) { my $pkg = $Apache::AxKit::Language::XSP::tag_lib{$ns}; my $sub; local $AxKit::XSP::TaglibPkg = $pkg; if (($sub = $pkg->can("start_document")) && ($sub != \&start_document)) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::start_document",1).$sub->($e); } elsif ($sub = $pkg->can("parse_init")) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::parse_init",1).$sub->($e); } } } sub end_document { my $e = shift; $e->{XSP_chars} = 0; foreach my $ns (keys %Apache::AxKit::Language::XSP::tag_lib) { my $pkg = $Apache::AxKit::Language::XSP::tag_lib{$ns}; my $sub; local $AxKit::XSP::TaglibPkg = $pkg; if (($sub = $pkg->can("end_document")) && ($sub != \&end_document)) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::end_document",1).$sub->($e); } elsif ($sub = $pkg->can("parse_final")) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::parse_final",1).$sub->($e); } } ## we assume that if $e->{XSP_User_Root} is true, somebody, somewhere ## (most likely the default start_element() sub) must have started the ## "sub xml_generator {" declaration, and that we need to close it if ($e->{XSP_User_Root}) { $e->{XSP_Script} .= $e->location_debug_string."return OK;\n}\n"; } else { throw Apache::AxKit::Exception::Error( -text => "No user root element found" ) unless $Apache::AxKit::Language::XSP::AllowNoUserRoot; } return $e->{XSP_Script}; } sub start_element { my $e = shift; my $element = shift; $e->{XSP_chars} = 0; $element->{Parent} ||= $e->{Current_Element}; $e->{Current_Element} = $element; my $ns = $element->{NamespaceURI}; # warn "START-NS: $ns : $element->{Name}\n"; my @attribs; for my $attr (@{$element->{Attributes}}) { if ($attr->{Name} eq 'xmlns') { unless (Apache::AxKit::Language::XSP::is_xsp_namespace($attr->{Value})) { $e->{Current_NS}{'#default'} = $attr->{Value}; } } elsif ($attr->{Name} =~ /^xmlns:(.*)$/) { my $prefix = $1; unless (Apache::AxKit::Language::XSP::is_xsp_namespace($attr->{Value})) { $e->{Current_NS}{$prefix} = $attr->{Value}; } } else { push @attribs, $attr; } } $element->{Attributes} = \@attribs; if (!defined($ns) || !exists($Apache::AxKit::Language::XSP::tag_lib{ $ns })) { $e->manage_text(0); # set default for non-xsp tags $e->{XSP_Script} .= AxKit::XSP::DefaultHandler::start_element($e, $element); } else { # local $^W; $element->{Name} =~ s/^(.*)://; my $prefix = $1; my $tag = $element->{Name}; my %attribs; # this is probably a bad hack to turn xsp:name="value" into name="value" for my $attr (@{$element->{Attributes}}) { $attr->{Name} =~ s/^\Q$prefix\E://; $attribs{$attr->{Name}} = $attr->{Value}; } $e->manage_text(1); # set default for xsp tags my $pkg = $Apache::AxKit::Language::XSP::tag_lib{ $ns }; my $sub; local $AxKit::XSP::TaglibPkg = $pkg; if (($sub = $pkg->can("start_element")) && ($sub != \&start_element)) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::start_element",1).$sub->($e, $element); } elsif ($sub = $pkg->can("parse_start")) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::parse_start",1).$sub->($e, $tag, %attribs); } } } sub end_element { my $e = shift; my $element = shift; $e->{XSP_chars} = 0; my $ns = $element->{NamespaceURI}; # warn "END-NS: $ns : $_[0]\n"; if (!defined($ns) || !exists($Apache::AxKit::Language::XSP::tag_lib{ $ns })) { $e->{XSP_Script} .= AxKit::XSP::DefaultHandler::end_element($e, $element); } else { # local $^W; $element->{Name} =~ s/^(.*)://; my $tag = $element->{Name}; my $pkg = $Apache::AxKit::Language::XSP::tag_lib{ $ns }; my $sub; local $AxKit::XSP::TaglibPkg = $pkg; if (($sub = $pkg->can("end_element")) && ($sub != \&end_element)) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::end_element",1).$sub->($e, $element); } elsif ($sub = $pkg->can("parse_end")) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::parse_end",1).$sub->($e, $tag); } } $e->{Current_Element} = $element->{Parent} || $e->{Current_Element}->{Parent}; } sub characters { my $e = shift; my $text = shift; my $ns = $e->{Current_Element}->{NamespaceURI}; # warn "CHAR-NS: $ns\n"; if (!defined($ns) || !exists($Apache::AxKit::Language::XSP::tag_lib{ $ns }) || !$e->manage_text(-1)) { $e->{XSP_Script} .= AxKit::XSP::DefaultHandler::characters($e, $text); } else { my $pkg = $Apache::AxKit::Language::XSP::tag_lib{ $ns }; my $sub; local $AxKit::XSP::TaglibPkg = $pkg; if (($sub = $pkg->can("characters")) && ($sub != \&characters)) { $e->{XSP_Script} .= $sub->($e, $text); } elsif ($sub = $pkg->can("parse_char")) { $e->{XSP_Script} .= $sub->($e, $text->{Data}); } } $e->{XSP_chars} = 1; } sub comment { my $e = shift; my $comment = shift; my $ns = $e->{Current_Element}->{NamespaceURI}; if (!defined($ns) || !exists($Apache::AxKit::Language::XSP::tag_lib{ $ns })) { $e->{XSP_Script} .= AxKit::XSP::DefaultHandler::comment($e, $comment); } else { # local $^W; my $pkg = $Apache::AxKit::Language::XSP::tag_lib{ $ns }; my $sub; local $AxKit::XSP::TaglibPkg = $pkg; if (($sub = $pkg->can("comment")) && ($sub != \&comment)) { $e->{XSP_Script} .= $sub->($e, $comment); } elsif ($sub = $pkg->can("parse_comment")) { $e->{XSP_Script} .= $sub->($e, $comment->{Data}); } } } sub processing_instruction { my $e = shift; my $pi = shift; my $ns = $e->{Current_Element}->{NamespaceURI}; if (!defined($ns) || !exists($Apache::AxKit::Language::XSP::tag_lib{ $ns })) { $e->{XSP_Script} .= AxKit::XSP::DefaultHandler::processing_instruction($e, $pi); } else { # local $^W; my $pkg = $Apache::AxKit::Language::XSP::tag_lib{ $ns }; my $sub; local $AxKit::XSP::TaglibPkg = $pkg; if (($sub = $pkg->can("processing_instruction")) && ($sub != \&processing_instruction)) { $e->{XSP_Script} .= $sub->($e, $pi); } elsif ($sub = $pkg->can("parse_pi")) { $e->{XSP_Script} .= $sub->($e, $pi->{Target}, $pi->{Data}); } } } ############################################################ # Functions implementing xsp:* processing ############################################################ package AxKit::XSP::Core; use vars qw/@ISA $NS/; *makeSingleQuoted = \&Apache::AxKit::Language::XSP::makeSingleQuoted; @ISA = ('Apache::AxKit::Language::XSP'); $NS = 'http://apache.org/xsp/core/v1'; __PACKAGE__->register(); # hack for backwards compatibility: __PACKAGE__->register_taglib("http://www.apache.org/1999/XSP/Core"); sub start_document { return "#initialize xsp namespace\n"; } sub end_document { return ''; } sub comment { return ''; } sub processing_instruction { return ''; } sub characters { my ($e, $node) = @_; local $^W; my $text = $node->{Data}; # Ricardo writes: " produces either an [object] # _expression_ (not necessarily a String) or a character event depending # on context. When is enclosed in another XSP tag (except # ), it's replaced by the code it contains. Otherwise it # should be treated as a text node and, therefore, coerced to String to be # output through a characters SAX event." if ($e->current_element() =~ /^(content|element)$/) { if ($text =~ /\S/ || $e->{XSP_Indent}) { $text = makeSingleQuoted($text); return "__mk_text_node(\$document,\$parent,$text);"; } return ''; } elsif ($e->current_element() =~ /^(attribute|comment|name)$/) { return '' if ($e->current_element() eq 'attribute' && !$e->{attrib_seen_name}); $text =~ s/^\s*//; $text =~ s/\s*$//; $text = makeSingleQuoted($text); return ". $text"; } # return '' unless $e->{XSP_User_Root}; my $debug = ""; if (!$e->{XSP_chars}) { $e->{XSP_Debug_Section} ||= 1; my $lineno = $node->{LineNumber}; if (!$lineno) { $debug = $e->location_debug_string("expr|logic section nr. ".$e->{XSP_Debug_Section},1); } else { $debug = $e->location_debug_string("XSP page",$lineno); } $e->{XSP_Debug_Section}++; } return $debug.$text; } sub start_element { my ($e, $node) = @_; my ($tag, %attribs); $tag = $node->{Name}; foreach my $attrib (@{$node->{Attributes}}) { $attribs{$attrib->{Name}} = $attrib->{Value}; } if ($tag eq 'page') { if ($attribs{language} && lc($attribs{language}) ne 'perl') { die "Only Perl XSP pages supported at this time!"; } local $^W; if ($attribs{'indent-result'} eq 'yes') { $e->{XSP_Indent} = 1; } if (exists $attribs{'base-class'}) { $e->{XSP_Base_Class} = $attribs{'base-class'}; } if (my $i = lc $attribs{'attribute-value-interpolate'}) { if ($i eq 'no') { $e->{XSP_No_Attr_Interpolate} = 1; } elsif ($i eq 'yes') { $e->{XSP_No_Attr_Interpolate} = 0; } else { die "Unknown value for attribute-value-interpolate: $i"; } } } elsif ($tag eq 'structure') { } elsif ($tag eq 'dtd') { } elsif ($tag eq 'include') { return "warn \"xsp:include is deprecated\"; use "; } elsif ($tag eq 'content') { } elsif ($tag eq 'logic') { } elsif ($tag eq 'import') { return "use "; } elsif ($tag eq 'element') { if ($node->{Parent}->{Name} eq 'attribute' && Apache::AxKit::Language::XSP::is_xsp_namespace($node->{Parent}->{NamespaceURI})) { throw Apache::AxKit::Exception( -text => "[Core] Can't have element as child of attributes!" ); } if (my $name = $attribs{name}) { $e->manage_text(0); return '$parent = __mk_element_node($document, $parent, ' . makeSingleQuoted($name) . ');'; } } elsif ($tag eq 'attribute') { if (my $name = $attribs{name}) { $e->{attrib_seen_name} = 1; return '$parent->setAttribute('.makeSingleQuoted($name).', ""'; } $e->{attrib_seen_name} = 0; } elsif ($tag eq 'name') { if ($node->{Parent}->{Name} =~ /^(.*:)?element$/) { return '$parent = __mk_element_node($document, $parent, ""'; } elsif ($node->{Parent}->{Name} =~ /^(.*:)?attribute$/) { $e->{attrib_seen_name} = 1; return '$parent->setAttribute(""'; } else { die "xsp:name parent node: $node->{Parent}->{Name} not valid"; } } elsif ($tag eq 'pi') { } elsif ($tag eq 'comment') { return '__mk_comment_node($document, $parent, ""'; } elsif ($tag eq 'text') { return '__mk_text_node($document, $parent, ""'; } elsif ($tag eq 'expr') { #warn "expr: parent = {", $node->{Parent}->{NamespaceURI}, "}", $node->{Parent}->{Name}, "\n"; if (Apache::AxKit::Language::XSP::is_xsp_namespace($node->{Parent}->{NamespaceURI})) { if (!$e->manage_text() || $node->{Parent}->{Name} =~ /^(?:.*:)?(?:content|element)$/) { return '__mk_text_node($document, $parent, "" . do {'; } elsif ($node->{Parent}->{Name} =~ /^(.*:)?(logic|expr)$/) { return 'do {'; } return ' . do {'; } else { return '__mk_text_node($document, $parent, "" . do {'; } warn("EEEK - Should never get here!!!"); # warn "start Expr: CurrentEl: ", $e->current_element, "\n"; } else { warn("Unrecognised tag: $tag"); } return ''; } sub end_element { my ($e, $node) = @_; my $tag = $node->{Name}; if ($tag eq 'page') { } elsif ($tag eq 'structure') { } elsif ($tag eq 'dtd') { } elsif ($tag eq 'include') { return ";\n"; } elsif ($tag eq 'import') { return ";\n"; } elsif ($tag eq 'content') { } elsif ($tag eq 'logic') { } elsif ($tag eq 'element') { return '$parent = $parent->getParentNode;' . "\n"; } elsif ($tag eq 'attribute') { # ends function from either start('attribute') or end('name) # as in either # vs foo return ");\n"; } elsif ($tag eq 'name') { if ($node->{Parent}->{Name} =~ /^(.*:)?element$/) { return ");\n"; } elsif ($node->{Parent}->{Name} =~ /^(.*:)?attribute$/) { return ', ""'; } } elsif ($tag eq 'pi') { } elsif ($tag eq 'comment') { return ");\n"; } elsif ($tag eq 'text') { return ");\n"; } elsif ($tag eq 'expr') { # warn "expr: -2 = {", $node->{Parent}->{NamespaceURI}, "}", $node->{Parent}->{Name}, "\n"; if (Apache::AxKit::Language::XSP::is_xsp_namespace($node->{Parent}->{NamespaceURI})) { if (!$e->manage_text() || $node->{Parent}->{Name} =~ /^(?:.*:)?(?:content|element)$/) { return "}); # xsp tag\n"; } elsif ($node->{Parent}->{Name} =~ /^(.*:)?(logic|expr)$/) { return '}'; } else { return '}'; } } else { return "}); # non xsp tag\n"; } } return ''; } 1; ############################################################ ## Default (non-xsp-namespace) handlers ############################################################ package AxKit::XSP::DefaultHandler; *makeSingleQuoted = \&Apache::AxKit::Language::XSP::makeSingleQuoted; sub _undouble_curlies { my $value = shift; $value =~ s/\{\{/\{/g; $value =~ s/\}\}/\}/g; return $value; } sub _attr_value_template { my ($e, $value) = @_; if ($e->{XSP_No_Attr_Interpolate}) { return makeSingleQuoted($value); } # warn("Transforming: '$value'\n"); return makeSingleQuoted($value) unless $value =~ /{/; my $output = "''"; while ($value =~ /\G([^{]*){/gc) { $output .= "." . makeSingleQuoted(_undouble_curlies($1)) if $1; if ($value =~ /\G{/gc) { $output .= ".q|{|"; next; } # otherwise we're in code now... $output .= ".do{"; while ($value =~ /\G([^}]*)}/gc) { $output .= _undouble_curlies($1); if ($value =~ /\G}/gc) { $output .= "}"; next; } $output .= "}"; } } $value =~ /\G(.*)$/gc and $output .= "." . makeSingleQuoted(_undouble_curlies($1)); # warn("Changed to: $output\n"); return $output; } sub start_element { my ($e, $node) = @_; my $code; if (!$e->{XSP_User_Root}) { my $base_class = $e->{XSP_Base_Class} || 'Apache::AxKit::Language::XSP::Page'; $e->{XSP_Script} .= join("\n", $e->location_debug_string(), "\@$e->{XSP_Package}::ISA = ('$base_class');", 'sub xml_generator {', 'my $class = shift;', 'my ($r, $cgi, $document, $parent) = @_;', "\n", ); $e->{XSP_User_Root} = 1; foreach my $ns (keys %Apache::AxKit::Language::XSP::tag_lib) { my $pkg = $Apache::AxKit::Language::XSP::tag_lib{$ns}; local $AxKit::XSP::TaglibPkg = $pkg; if (my $sub = $pkg->can("start_xml_generator")) { $e->{XSP_Script} .= $e->location_debug_string("${pkg}::start_xml_generator",1).$sub->($e); } } # Note: No debugging here, to reduce bloat. Shouldn't be neccessary anyways. if ($node->{NamespaceURI}) { $code = '$parent = __mk_ns_element_node($document, $parent, '. makeSingleQuoted($node->{NamespaceURI}).','. makeSingleQuoted($node->{Name}).");\n"; } else { $code = '$parent = __mk_element_node($document, $parent, '. makeSingleQuoted($node->{Name}).");\n"; } } else { if ($node->{Parent}->{Name} eq 'attribute' && Apache::AxKit::Language::XSP::is_xsp_namespace($node->{Parent}->{NamespaceURI})) { throw Apache::AxKit::Exception( -text => "[Default] Can't have element as child of attributes!" ); } if ($node->{NamespaceURI}) { $code = '$parent = __mk_ns_element_node($document, $parent, ' . makeSingleQuoted($node->{NamespaceURI}).','. makeSingleQuoted($node->{Name}).");\n"; } else { $code = '$parent = __mk_element_node($document, $parent, ' . makeSingleQuoted($node->{Name}).");\n"; } } for my $attr (@{$node->{Attributes}}) { my $value = _attr_value_template($e, $attr->{Value}); $code .= '$parent->setAttribute('.makeSingleQuoted($attr->{Name}). ",$value);\n"; } for my $ns (keys %{$e->{Current_NS}}) { if ($ns eq '#default') { $code .= '$parent->setAttributeNS("","xmlns",' . makeSingleQuoted($e->{Current_NS}{$ns}) . ');'; } else { $code .= '$parent->setAttribute("xmlns:" . '.makeSingleQuoted($ns).',' . makeSingleQuoted($e->{Current_NS}{$ns}) . ');'; } } push @{ $e->{NS_Stack} }, { %{ $e->{Current_NS} || {} } }; $e->{Current_NS} = {}; return $code; } sub end_element { my ($e, $element) = @_; $e->{Current_NS} = pop @{ $e->{NS_Stack} }; return '$parent = $parent->getParentNode;' . "\n"; } sub characters { my ($e, $node) = @_; my $text = $node->{Data}; return '' unless $e->{XSP_User_Root}; # should not happen! if (!$e->{XSP_Indent}) { return '' unless $text =~ /\S/; } return '__mk_text_node($document, $parent, '.makeSingleQuoted($text).");\n"; } sub comment { return ''; } sub processing_instruction { return ''; } 1; ###################################################### ## SAXParser ###################################################### package AxKit::XSP::SAXParser; use XML::LibXML 1.30; use Apache::AxKit::LibXMLSupport; sub new { my ($type, %self) = @_; return bless \%self, $type; } sub parse { my ($self, $thing) = @_; my $doc; if (ref($thing) ne 'XML::LibXML::Document') { my $parser = XML::LibXML->new(); local($XML::LibXML::match_cb, $XML::LibXML::open_cb, $XML::LibXML::read_cb, $XML::LibXML::close_cb); Apache::AxKit::LibXMLSupport->reset($parser); $parser->expand_entities(1); eval { $parser->line_numbers(1); AxKit::Debug(6,"enabled line numbers"); } if $self->{Handler}->{XSP_Debug}; if (ref($thing)) { $doc = $parser->parse_fh($thing); } else { $doc = $parser->parse_string($thing); } AxKit::Debug(10, 'XSP: Parser returned doc'); $doc->process_xinclude; } else { $doc = $thing; } my $encoding = $doc->getEncoding() || 'UTF-8'; my $document = { Parent => undef }; $self->{Handler}->start_document($document); my $root = $doc->getDocumentElement; if ($root) { process_node($self->{Handler}, $root, $encoding); } $self->{Handler}->end_document($document); } sub process_node { my ($handler, $node, $encoding) = @_; my $lineno = eval { $node->lineNumber; } if $handler->{XSP_Debug}; my $node_type = $node->getType(); if ($node_type == XML_COMMENT_NODE) { $handler->comment( { Data => $node->getData, LineNumber => $lineno } ); } elsif ($node_type == XML_TEXT_NODE || $node_type == XML_CDATA_SECTION_NODE) { # warn($node->getData . "\n"); $handler->characters( { Data => encodeToUTF8($encoding,$node->getData()), LineNumber => $lineno } ); } elsif ($node_type == XML_ELEMENT_NODE) { # warn("<" . $node->getName . ">\n"); process_element($handler, $node, $encoding); # warn("getName . ">\n"); } elsif ($node_type == XML_ENTITY_REF_NODE) { foreach my $kid ($node->getChildnodes) { # warn("child of entity ref: " . $kid->getType() . " called: " . $kid->getName . "\n"); process_node($handler, $kid, $encoding); } } elsif ($node_type == XML_DOCUMENT_NODE) { # just get root element. Ignore other cruft. foreach my $kid ($node->getChildnodes) { if ($kid->getType() == XML_ELEMENT_NODE) { process_element($handler, $kid, $encoding); last; } } } elsif ($node_type == XML_XINCLUDE_START || $node_type == XML_XINCLUDE_END) { # ignore } else { warn("unknown node type: $node_type"); } } sub process_element { my ($handler, $element, $encoding) = @_; my @attr; my $debug = $handler->{XSP_Debug}; foreach my $attr ($element->getAttributes) { my $lineno = eval { $attr->lineNumber; } if $debug; if ($attr->getName) { push @attr, { Name => encodeToUTF8($encoding,$attr->getName), Value => encodeToUTF8($encoding,$attr->getData), NamespaceURI => encodeToUTF8($encoding,$attr->getNamespaceURI), Prefix => encodeToUTF8($encoding,$attr->getPrefix), LocalName => encodeToUTF8($encoding,$attr->getLocalName), LineNumber => $lineno, }; } else { push @attr, { Name => "xmlns", Value => "", NamespaceURI => "", Prefix => "", LocalName => "", LineNumber => $lineno, }; } } my $lineno = eval { $element->lineNumber; } if $debug; my $node = { Name => encodeToUTF8($encoding,$element->getName), Attributes => \@attr, NamespaceURI => encodeToUTF8($encoding,$element->getNamespaceURI), Prefix => encodeToUTF8($encoding,$element->getPrefix), LocalName => encodeToUTF8($encoding,$element->getLocalName), LineNumber => $lineno, }; $handler->start_element($node); foreach my $child ($element->getChildnodes) { process_node($handler, $child, $encoding); } $handler->end_element($node); } ############################################################ # Base page class ############################################################ package Apache::AxKit::Language::XSP::Page; use Exporter; @Apache::AxKit::Language::XSP::Page::ISA = qw(Exporter); @Apache::AxKit::Language::XSP::Page::EXPORT_OK = qw( __mk_text_node __mk_element_node __mk_comment_node __mk_ns_element_node ); sub has_changed { my $class = shift; my $mtime = shift; return 1; } sub cache_params { my $class = shift; my ($r, $cgi) = @_; return ''; } sub handler { my $class = shift; $class->xml_generator(@_); } sub __mk_text_node { my ($document, $parent, $text) = @_; my $node = $document->createTextNode($text); $parent->appendChild($node); } sub __mk_element_node { my ($document, $parent, $name) = @_; my $elem = $document->createElement($name); if ($parent) { $parent->appendChild($elem); } else { $document->setDocumentElement($elem); } return $elem; } sub __mk_ns_element_node { my ($document, $parent, $ns, $name) = @_; my $elem = $document->createElementNS($ns, $name); if ($parent) { $parent->appendChild($elem); } else { $document->setDocumentElement($elem); } return $elem; } sub __mk_comment_node { my ($document, $parent, $text) = @_; my $node = $document->createComment($text); $parent->appendChild($node); } 1; __END__ =pod =head1 NAME Apache::AxKit::Language::XSP - eXtensible Server Pages =head1 SYNOPSIS Time::Object XSP Test Hello World! Good if (localtime->hour >= 12) { Afternoon } else { Morning } =head1 DESCRIPTION XSP implements a tag-based dynamic language that allows you to develop your own tags, examples include sendmail and sql taglibs. It is AxKit's way of providing an environment for dynamic pages. XSP is originally part of the Apache Cocoon project, and so you will see some Apache namespaces used in XSP. Also, use only one XSP processor in a pipeline. XSP is powerful enough that you should only need one stage, and this implementation allows only one stage. If you have two XSP processors, perhaps in a pipeline that looks like: ... => XSP => XSLT => XSLT => XSP => ... it is pretty likely that the functionality of the intermediate XSLT stages can be factored in to either upstream or downstream XSLT: ... => XSLT => XSP => XSLT => ... This design is likely to lead to a clearer and more maintainable implementation, if only because generating code, especially embedded Perl code, in one XSP processor and consuming it in another is often confusing and even more often a symptom of misdesign. Likewise, you may want to lean towards using Perl taglib modules instead of upstream XSLT "LogicSheets". Upstream XSLT LogicSheets work fine, mind you, but using Perl taglib modules results in a simpler pipeline, simpler configuration (just load the taglib modules in httpd.conf, no need to have the correct LogicSheet XSLT page included whereever you need that taglib), a more flexible coding environment, the ability to pretest your taglibs before installing them on a server, and better isolation of interface (the taglib API) and implementation (the Perl module behind it). LogicSheets work, and can be useful, but are often the long way home. That said, people used to the Cocoon environment may prefer them. =head2 Result Code You can specify the result code of the request in two ways. Both actions go inside a tag. If you want to completely abort the current request, throw an exception: throw Apache::AxKit::Exception::Retval(return_code => FORBIDDEN); If you want to send your page but have a custom result code, return it: return FORBIDDEN; In that case, only the part of the document that was processed so far gets sent/processed further. =head2 Debugging If you have PerlTidy installed (get it from L), the compiled XSP scripts can be formatted nicely to spot errors easier. Enable AxDebugTidy for this, but be warned that reformatting is quite slow, it can take 20 seconds or more I for large scripts. If you enable AxTraceIntermediate, your script will be dumped alongside the other intermediate files, with an extension of ".XSP". These are unnumbered, thus only get one dump per request. If you have more than one XSP run in a single request, the last one will overwrite the dumps of earlier runs. =head1 Tag Reference =head2 C<< >> This is the top level element, although it does not have to be. AxKit's XSP implementation can process XSP pages even if the top level element is not there, provided you use one of the standard AxKit ways to turn on XSP processing for that page. See L. The attribute C can be present, to mandate the language. This is useful if you expect people might mistakenly try and use this page on a Cocoon system. The default value of this attribute is "Perl". XSP normally swallows all whitespace in your output. If you don't like this feature, or it creates invalid output, then you can add the attribute: C By default all non-XSP and non-taglib attributes are interpolated in a similar way to XSLT attributes - by checking for C<{ code }> in the attributes. The C can be any perl code, and is treated exactly the same as having an C<< code >> in the attribute value. In order to turn this I, simply specify the attribute C. The default is C which enables the interpolation. =head2 C<< >> parent: This element appears at the root level of your page before any non-XSP tags. It defines page-global "things" in the C<> and C<> tags. =head2 C<< >> parent: Use this tag for including modules into your code, for example: DBI =head2 C<< >> parent: , any The C<> tag introduces some Perl code into your page. As a child of C<>, this element allows you to define page global variables, or functions that get used in the page. Placing functions in here allows you to get around the Apache::Registry closures problem (see the mod_perl guide at http://perl.apache.org/guide for details). Elsewhere the perl code contained within the tags is executed on every view of the XSP page. B Be careful - the Perl code contained within this tag is still subject to XML's validity constraints. Most notably to Perl code is that the & and < characters must be escaped into & and < respectively. You can get around this to some extent by using CDATA sections. This is especially relevant if you happen to think something like this will work: if ($some_condition) { print "Condition True!"; } else { print "Condition False!"; } The correct way to write that is simply: if ($some_condition) { Condition True! } else { Condition False! } The reason is that XSP intrinsically knows about XML! =head2 C<< >> parent: This tag allows you to temporarily "break out" of logic sections to generate some XML text to go in the output. Using something similar to the above example, but without the surrounding C<> tag, we have: if ($some_condition) { Condition True! } else { Condition False! } =head2 C<< >> This tag generates an element of name equal to the value in the attribute C. Alternatively you can use a child element C<> to specify the name of the element. Text contents of the C<> are created as text node children of the new element. =head2 C<< >> Generates an attribute. The name of the attribute can either be specified in the C attribute, or via a child element C<>. The value of the attribute is the text contents of the tag. =head2 C<< >> Normally XML comments are stripped from the output. So to add one back in you can use the C<> tag. The contents of the tag are the value of the comment. =head2 C<< >> Create a plain text node. The contents of the tag are the text node to be generated. This is useful when you wish to just generate a text node while in an C<> section. =head2 C<< >> This is probably the most useful, and most important (and also the most complex) tag. An expression is some perl code that executes, and the results of which are added to the output. Exactly how the results are added to the output depends very much on context. The default method for output for an expression is as a text node. So for example:

It is now: localtime

Will generate a text node containing the time. If the expression is contained within an XSP namespaces, that is either a tag in the xsp:* namespace, or a tag implementing a tag library, then an expression generally does not create a text node, but instead is simply wrapped in a Perl C block, and added to the perl script. However, there are anti-cases to this. For example if the expression is within a C<> tag, then a text node is created. Needless to say, in every case, C<> should just "do the right thing". If it doesn't, then something (either a taglib or XSP.pm itself) is broken and you should report a bug. =head1 Writing Taglibs Writing your own taglibs can be tricky, because you're using an event based API to write out Perl code. You may want to take a look at the Apache::AxKit::Language::XSP::TaglibHelper module, which comes with AxKit and allows you to easily publish a taglib without writing XML event code. Recently, another taglib helper has been developed, Apache::AxKit::Language::XSP::SimpleTaglib. The latter manages all the details described under 'Design Patterns' for you, so you don't really need to bother with them anymore. A warning about character sets: All string values are passed in and expected back as UTF-8 encoded strings. So you cannot use national characters in a different encoding, like the widespread ISO-8859-1. This applies to Taglib source code only. The XSP XML-source is of course interpreted according to the XML rules. Your taglib module may want to 'use utf8;' as well, see L and L for more information. =head1 Design Patterns These patterns represent the things you may want to achieve when authoring a tag library "from scratch". =head2 1. Your tag is a wrapper around other things. Example: ... Solution: Start a new block, so that you can store lexical variables, and declare any variables relevant to your tag: in parse_start: if ($tag eq 'sendmail') { return '{ my ($to, $from, $sender);'; } Often it will also be relevant to execute that code when you see the end tag: in parse_end: if ($tag eq 'sendmail') { return 'Mail::Sendmail::sendmail( to => $to, from => $from, sender => $sender ); }'; } Note there the closing of that original opening block. =head2 2. Your tag indicates a parameter for a surrounding taglib. Example: ... Solution: Having declared the variable as above, you simply set it to the empty string, with no semi-colon: in parse_start: if ($tag eq 'to') { return '$to = ""'; } Then in parse_char: sub parse_char { my ($e, $text) = @_; $text =~ s/^\s*//; $text =~ s/\s*$//; return '' unless $text; $text = Apache::AxKit::Language::XSP::makeSingleQuoted($text); return ". $text"; } Note there's no semi-colon at the end of all this, so we add that: in parse_end: if ($tag eq 'to') { return ';'; } All of this black magic allows other taglibs to set the thing in that variable using expressions. =head2 3. You want your tag to return a scalar (string) that does the right thing depending on context. For example, generates a Text node in one place or generates a scalar in another context. Solution: use $e->start_expr(), $e->append_to_script(), $e->end_expr(). Example: in parse_start: if ($tag eq 'get-datetime') { $e->start_expr($tag); # creates a new { ... } block my $local_format = lc($attribs{format}) || '%a, %d %b %Y %H:%M:%S %z'; return 'my ($format); $format = q|' . $local_format . '|;'; } in parse_end: if ($tag eq 'get-datetime') { $e->append_to_script('use Time::Object; localtime->strftime($format);'); $e->end_expr(); return ''; } Explanation: This is more complex than the first 2 examples, so it warrants some explanation. I'll go through it step by step. $e->start_expr($tag) This tells XSP that this really generates a tag. Now we don't really generate that tag, we just execute the handler for it. So what happens is the handler gets called, and it looks to see what the current calling context is. If its supposed to generate a text node, it generates some code to do that. If its supposed to generate a scalar, it does that too. Ultimately both generate a do {} block, so we'll summarise that by saying the code now becomes: do { (the end of the block is generated by end_expr()). Now the next step (ignoring the simple gathering of the format variable), is a return, which appends more code onto the generated perl script, so we get: do { my ($format); $format = q|%a, %d %b %Y %H:%M:%S %z|; Now we immediately receive an end_expr, because this is an empty element (we'll see why we formatted it this way in #5 below). The first thing we get is: $e->append_to_script('use Time::Object; localtime->strftime($format);'); This does exactly what it says, and the script becomes: do { my ($format); $format = q|%a, %d %b %Y %H:%M:%S %z|; use Time::Object; localtime->strftime($format); Finally, we call: $e->end_expr(); which closes the do {} block, leaving us with: do { my ($format); $format = q|%a, %d %b %Y %H:%M:%S %z|; use Time::Object; localtime->strftime($format); } Now if you execute that in Perl, you'll see the do {} returns the last statement executed, which is the Cstrftime()> bit there, thus doing exactly what we wanted. =head2 4. Your tag can take as an option either an attribute, or a child tag. Example: or $some_uri Solution: There are several parts to this. The simplest is to ensure that whitespace is ignored. We have that dealt with in the example parse_char above. Next we need to handle that variable. Do this by starting a new block with the tag, and setting up the variable: in parse_start: if ($tag eq 'include-uri') { my $code = '{ my ($uri);'; if ($attribs{uri}) { $code .= '$uri = q|' . $attribs{uri} . '|;'; } return $code; } Now if we don't have the attribute, we can expect it to come in the C<> tag: in parse_start: if ($tag eq 'uri') { return '$uri = ""'; # note the empty string! } Now you can see that we're not explicitly setting C<$uri>, that's because the parse_char we wrote above handles it by returning '. q|$text|'. And if we have a C<> in there, that's handled automagically too. Now we just need to wrap things up in the end handlers: in parse_end: if ($tag eq 'uri') { return ';'; } if ($tag eq 'include-uri') { return 'Taglib::include_uri($uri); # execute the code } # close the block '; } =head2 5. You want to return a scalar that does the right thing in context, but also can take a parameter as an attribute I a child tag. Example: vs $some_column Solution: This is a combination of patterns 3 and 4. What we need to do is change #3 to simply allow our variable to be added as in #4 above: in parse_start: if ($tag eq 'get-column') { $e->start_expr($tag); my $code = 'my ($col);' if ($attribs{col}) { $code .= '$col = q|' . $attribs{col} . '|;'; } return $code; } if ($tag eq 'column') { return '$col = ""'; } in parse_end: if ($tag eq 'column') { return ';'; } if ($tag eq 'get-column') { $e->append_to_script('Full::Package::get_column($col)'); $e->end_expr(); return ''; } =head2 6. You have a conditional tag Example: No results! Solution: The problem here is that taglibs normally recieve character/text events so that they can manage variables. With a conditional tag, you want character events to be handled by the core XSP and generate text events. So we have a switch for that: if ($tag eq 'no-results') { $e->manage_text(0); return 'if (AxKit::XSP::ESQL::get_count() == 0) {'; } Turning off manage_text with a zero simply ensures that immediate children text nodes of this tag don't fire text events to the tag library, but instead get handled by XSP core, thus creating text nodes (and doing the right thing, generally). =head2 (and start_expr, end_expr) Notes B consider adding in the 'do {' ... '}' bits yourself. Always leave this to the start_expr, and end_expr functions. This is because the implementation could change, and you really don't know better than the underlying XSP implementation. You have been warned. =cut