655
|
1 |
############################################################################
|
|
2 |
# Copyright (c) 1998,1999 Enno Derksen
|
|
3 |
# All rights reserved.
|
|
4 |
# This program is free software; you can redistribute it and/or modify it
|
|
5 |
# under the same terms as Perl itself.
|
|
6 |
############################################################################
|
|
7 |
#
|
|
8 |
# To do (in no particular order):
|
|
9 |
#
|
|
10 |
# - Element tag names that are the same as a XQL keyword (e.g. "or", "not", ..)
|
|
11 |
# are currently not supported. The parser and lexer needs to be smarter and
|
|
12 |
# know what context they are in.
|
|
13 |
# - output using xql:result etc.
|
|
14 |
# - xml:space=preserve still needs to be adhered to in text() etc.
|
|
15 |
# - I already added xql_preserveSpace. Still need to use it in (raw)text() etc.
|
|
16 |
# - XQL functions (like value()) should probably work on input lists > 1 node
|
|
17 |
# (The code was changed, but it needs to be tested. ancestor() wasn't fixed)
|
|
18 |
# - verify implementation of xql_namespace
|
|
19 |
# - verify implementation of end, index
|
|
20 |
# - check passing of context to the solve() methods
|
|
21 |
# - functions/methods may be wrong. They receive the entire LHS set,
|
|
22 |
# so count() is right, but the rest may be wrong!
|
|
23 |
# - may need to use different comment delimiters, '#' may be used in future XQL
|
|
24 |
# definition (according to Joe Lapp, one of the XQL spec authors)
|
|
25 |
# - caching of Node xql_values (?)
|
|
26 |
# - finish the Date class
|
|
27 |
# - discuss which classes: Date, Time, and/or DateTime ?
|
|
28 |
# - conversion of Query result to Perl primitives, i.e. how do we return the
|
|
29 |
# result of a query.
|
|
30 |
# - add support for ordering/formatting the query results, see XML-QL
|
|
31 |
# - discuss typecasting mechanism
|
|
32 |
# - error reporting mechanism
|
|
33 |
# - yyerror handler doesn't seem to work
|
|
34 |
# - passing intermediate exceptions ($@) to the user
|
|
35 |
# - more debugging support
|
|
36 |
# - subst, map etc.
|
|
37 |
# - use rawText for Nodes?
|
|
38 |
# - recurse or not?
|
|
39 |
# - text/rawText default - recurse or not?
|
|
40 |
# - what should default value() implementation use?
|
|
41 |
# - check if all Syntactic Constraints in XQL spec are implemented
|
|
42 |
# - support all node types, i.e. Notation, Attlist etc.
|
|
43 |
# - sorting in 'document order' doesn't work yet for 'other' DOM nodes
|
|
44 |
# - generateFunction - support functions that return lists?
|
|
45 |
# - match() function - what should it return?
|
|
46 |
# - keeping track of reference nodes not always done right
|
|
47 |
# - also think about Perl builtin functions
|
|
48 |
# - conversion to Perl number throws warnings with -w (in comparisons etc.)
|
|
49 |
# - sorting
|
|
50 |
# - add sorting by attribute name (within same element)
|
|
51 |
# (or other criteria)
|
|
52 |
# - optional sorting in $union$ ?
|
|
53 |
# - could add a flag that says "don't worry about document order for $union$"
|
|
54 |
# - user defined sort?
|
|
55 |
# - OPTIMIZE!
|
|
56 |
# - Subscript operator
|
|
57 |
# - Filter operator
|
|
58 |
# - etc.
|
|
59 |
|
|
60 |
package XML::XQL;
|
|
61 |
use strict;
|
|
62 |
|
|
63 |
use Carp;
|
|
64 |
use XML::RegExp;
|
|
65 |
|
|
66 |
use vars qw( @EXPORT $VERSION
|
|
67 |
$ContextStart $ContextEnd $BoldOn $BoldOff
|
|
68 |
%Func %Method %FuncArgCount
|
|
69 |
%AllowedOutsideSubquery %ConstFunc %ExpandedType
|
|
70 |
$Restricted $Included $ReXQLName
|
|
71 |
%CompareOper $Token_q $Token_qq $LAST_SORT_KEY
|
|
72 |
);
|
|
73 |
|
|
74 |
@EXPORT = qw( $VERSION $Restricted $Included );
|
|
75 |
|
|
76 |
BEGIN
|
|
77 |
{
|
|
78 |
$VERSION = '0.63';
|
|
79 |
|
|
80 |
die "XML::XQL is already used/required" if defined $Included;
|
|
81 |
$Included = 1;
|
|
82 |
|
|
83 |
# From XQL spec (The '-' was added to allow XPath style function names.)
|
|
84 |
$ReXQLName = "(?:[-a-zA-Z_]+\\w*)";
|
|
85 |
|
|
86 |
$Token_q = undef;
|
|
87 |
$Token_qq = undef;
|
|
88 |
|
|
89 |
$Restricted = 0 unless defined $Restricted;
|
|
90 |
|
|
91 |
if (not $Restricted)
|
|
92 |
{
|
|
93 |
# Allow names with Perl package prefixes
|
|
94 |
$ReXQLName = "(?:$ReXQLName(?:::$ReXQLName)*)";
|
|
95 |
|
|
96 |
# Support q// and qq// strings
|
|
97 |
$Token_q = "q";
|
|
98 |
$Token_qq = "qq";
|
|
99 |
}
|
|
100 |
};
|
|
101 |
|
|
102 |
# To save the user some typing for the simplest cases
|
|
103 |
sub solve
|
|
104 |
{
|
|
105 |
my ($expr, @args) = @_;
|
|
106 |
my $query = new XML::XQL::Query (Expr => $expr);
|
|
107 |
my @result = $query->solve (@args);
|
|
108 |
$query->dispose;
|
|
109 |
|
|
110 |
@result;
|
|
111 |
}
|
|
112 |
|
|
113 |
#---------- Parser related stuff ----------------------------------------------
|
|
114 |
|
|
115 |
# Find (nested) closing delimiter in q{} or qq{} strings
|
|
116 |
sub parse_q
|
|
117 |
{
|
|
118 |
my ($qname, $q, $str, $d1, $d2) = @_;
|
|
119 |
my ($match) = "";
|
|
120 |
my ($found);
|
|
121 |
|
|
122 |
while ($str =~ /^([^$d1$d2]*)($d1|($d2))(.*)/s)
|
|
123 |
{
|
|
124 |
defined ($3) and return ($4, $match . $1); # $d2 found
|
|
125 |
|
|
126 |
# match delimiters recursively
|
|
127 |
$match .= $1 . $2;
|
|
128 |
|
|
129 |
($str, $found) = parse_q ($qname, $q, $4, $d1, $d2);
|
|
130 |
$match .= $found . $d2;
|
|
131 |
}
|
|
132 |
XML::XQL::parseError ("no $qname// closing delimiter found near '$q$d1'");
|
|
133 |
}
|
|
134 |
|
|
135 |
# To support nested delimiters in q{} and qq() strings
|
|
136 |
my %MatchingCloseDelim =
|
|
137 |
(
|
|
138 |
'{' => '}',
|
|
139 |
'(' => ')',
|
|
140 |
'<' => '>',
|
|
141 |
'[' => ']'
|
|
142 |
);
|
|
143 |
|
|
144 |
sub Lexer
|
|
145 |
{
|
|
146 |
my($parser)=shift;
|
|
147 |
|
|
148 |
exists($parser->YYData->{LINE})
|
|
149 |
or $parser->YYData->{LINE} = 1;
|
|
150 |
|
|
151 |
$parser->YYData->{INPUT}
|
|
152 |
or return('', undef);
|
|
153 |
|
|
154 |
print "Lexer input=[" . $parser->YYData->{INPUT} . "]\n"
|
|
155 |
if $parser->{yydebug};
|
|
156 |
|
|
157 |
if ($Restricted)
|
|
158 |
{
|
|
159 |
# strip leading whitespace
|
|
160 |
$parser->YYData->{INPUT} =~ s/^\s*//;
|
|
161 |
}
|
|
162 |
else
|
|
163 |
{
|
|
164 |
# strip leading whitespace and comments
|
|
165 |
$parser->YYData->{INPUT} =~ s/^(\s|#.*)*//;
|
|
166 |
}
|
|
167 |
|
|
168 |
|
|
169 |
for ($parser->YYData->{INPUT})
|
|
170 |
{
|
|
171 |
s#^"([^"]*)"##o and return ('TEXT', $1);
|
|
172 |
s#^'([^']*)'##o and return ('TEXT', $1);
|
|
173 |
|
|
174 |
if (not $Restricted)
|
|
175 |
{
|
|
176 |
# Support q// and qq// string delimiters
|
|
177 |
for my $qname ('q', 'qq')
|
|
178 |
{
|
|
179 |
my ($q) = $parser->{Query}->{$qname};
|
|
180 |
if (defined ($q) and s/^$q(\[\(\{\<#!=-\+|'":;\.,\?\/!@\%^\*)//)
|
|
181 |
{
|
|
182 |
my ($d1, $d2) = ($1, $MatchingCloseDelim{$1});
|
|
183 |
my ($str);
|
|
184 |
if (defined $d2)
|
|
185 |
{
|
|
186 |
($parser->YYData->{INPUT}, $str) = parse_q (
|
|
187 |
$qname, $q, $_, $d1, $d2);
|
|
188 |
}
|
|
189 |
else # close delim is same open delim
|
|
190 |
{
|
|
191 |
$d2 = $d1;
|
|
192 |
s/([^$d2])*$d2// or XML::XQL::parseError (
|
|
193 |
"no $qname// closing delimiter found near '$q$d1'");
|
|
194 |
$str = $1;
|
|
195 |
}
|
|
196 |
return ('TEXT', eval "$q$d1$str$d2");
|
|
197 |
}
|
|
198 |
}
|
|
199 |
}
|
|
200 |
|
|
201 |
s/^(-?\d+\.(\d+)?)// and return ('NUMBER', $1);
|
|
202 |
s/^(-?\d+)// and return ('INTEGER', $1);
|
|
203 |
|
|
204 |
s/^(\$|\b)(i?(eq|ne|lt|le|gt|ge))\1(?=\W)//i
|
|
205 |
and return ('COMPARE', "\L$2");
|
|
206 |
|
|
207 |
s/^((\$|\b)(any|all|or|and|not|to|intersect)\2)(?=\W)//i
|
|
208 |
and return ("\L$3", $1);
|
|
209 |
|
|
210 |
s/^((\$|\b)union\2(?=\W)|\|)//i and return ('UnionOp', $1);
|
|
211 |
|
|
212 |
s/^(;;?)// and return ('SeqOp', $1);
|
|
213 |
|
|
214 |
if (not $Restricted)
|
|
215 |
{
|
|
216 |
s/^(=~|!~)// and return ('MATCH', $1);
|
|
217 |
s/^\$((no_)?match)\$//i
|
|
218 |
and return ('MATCH', "\L$1");
|
|
219 |
s/^\$($ReXQLName)\$//o and return ('COMPARE', $1);
|
|
220 |
}
|
|
221 |
|
|
222 |
s/^(=|!=|<|<=|>|>=)// and return ('COMPARE', $1);
|
|
223 |
|
|
224 |
s!^(//|/|\(|\)|\.\.?|@|\!|\[|\]|\*|:|,)!!
|
|
225 |
and return ($1, $1);
|
|
226 |
|
|
227 |
s/^($ReXQLName)\s*\(//o
|
|
228 |
and return ('XQLName_Paren', $1);
|
|
229 |
|
|
230 |
s/^($XML::RegExp::Name)//o and return ('NCName', $1);
|
|
231 |
}
|
|
232 |
}
|
|
233 |
|
|
234 |
#------ end Parser related stuff ----------------------------------------------
|
|
235 |
|
|
236 |
# Converts result from a Disjunction to a 0 or 1.
|
|
237 |
# If it's a XML::XQL::Boolean, its value is returned.
|
|
238 |
# If it's an empty list it returns 0.
|
|
239 |
# If it's a node or a Text or Number, it returns 1.
|
|
240 |
# If it's a list with 1 or more elements, it returns 1 if at least one
|
|
241 |
# element evaluates to 1 (with toBoolean)
|
|
242 |
sub toBoolean # static method
|
|
243 |
{
|
|
244 |
my $arg = shift;
|
|
245 |
|
|
246 |
my $type = ref ($arg);
|
|
247 |
if ($type eq "ARRAY")
|
|
248 |
{
|
|
249 |
for my $n (@$arg)
|
|
250 |
{
|
|
251 |
return 1 if toBoolean ($n);
|
|
252 |
}
|
|
253 |
return 0;
|
|
254 |
}
|
|
255 |
return $arg->xql_toBoolean;
|
|
256 |
}
|
|
257 |
|
|
258 |
sub listContains
|
|
259 |
{
|
|
260 |
my ($list, $x) = @_;
|
|
261 |
|
|
262 |
#?? $n should be a PrimitiveType or an XML Node
|
|
263 |
for my $y (@$list)
|
|
264 |
{
|
|
265 |
#?? return 1 if $x == $y;
|
|
266 |
|
|
267 |
if (ref($x) eq ref($y)) # same object class
|
|
268 |
{
|
|
269 |
my ($src1, $src2) = ($x->xql_sourceNode, $y->xql_sourceNode);
|
|
270 |
next if ((defined $src1 or defined $src2) and $src1 != $src2);
|
|
271 |
|
|
272 |
return ($x == $y) if (UNIVERSAL::isa ($x, 'XML::XQL::Node'));
|
|
273 |
|
|
274 |
return 1 if $x->xql_eq ($y);
|
|
275 |
}
|
|
276 |
}
|
|
277 |
0;
|
|
278 |
}
|
|
279 |
|
|
280 |
sub toList
|
|
281 |
{
|
|
282 |
my $r = shift;
|
|
283 |
(ref ($r) eq "ARRAY") ? $r : [ $r ];
|
|
284 |
}
|
|
285 |
|
|
286 |
# Prepare right hand side for a comparison, i.e.
|
|
287 |
# turn it into a single value.
|
|
288 |
# If it is a list with 2 or more values, it croaks.
|
|
289 |
sub prepareRvalue
|
|
290 |
{
|
|
291 |
my $r = shift;
|
|
292 |
|
|
293 |
if (ref ($r) eq "ARRAY")
|
|
294 |
{
|
|
295 |
# more than 1 value gives a runtime error (as per Joe Lapp)
|
|
296 |
croak "bad rvalue $r" if @$r > 1;
|
|
297 |
$r = $r->[0];
|
|
298 |
}
|
|
299 |
|
|
300 |
if (ref ($r) and $r->isa ('XML::XQL::Node'))
|
|
301 |
{
|
|
302 |
$r = $r->xql_value;
|
|
303 |
}
|
|
304 |
$r;
|
|
305 |
}
|
|
306 |
|
|
307 |
sub trimSpace
|
|
308 |
{
|
|
309 |
$_[0] =~ s/^\s+//;
|
|
310 |
$_[0] =~ s/\s+$//;
|
|
311 |
$_[0];
|
|
312 |
}
|
|
313 |
|
|
314 |
# Assumption: max. 32768 (2**15 = 2**($BITS-1)) children (or attributes) per node
|
|
315 |
# Use setMaxChildren() to support larger offspring.
|
|
316 |
my $BITS = 16;
|
|
317 |
$LAST_SORT_KEY = (2 ** $BITS) - 1;
|
|
318 |
|
|
319 |
# Call with values: $max = 128 * (256**N), where N=0, 1, 2, ...
|
|
320 |
sub setMaxChildren
|
|
321 |
{
|
|
322 |
my $max = shift;
|
|
323 |
my $m = 128;
|
|
324 |
$BITS = 8;
|
|
325 |
while ($max > $m)
|
|
326 |
{
|
|
327 |
$m = $m * 256;
|
|
328 |
$BITS += 8;
|
|
329 |
}
|
|
330 |
$LAST_SORT_KEY = (2 ** $BITS) - 1;
|
|
331 |
}
|
|
332 |
|
|
333 |
sub createSortKey
|
|
334 |
{
|
|
335 |
# $_[0] = parent sort key, $_[1] = child index,
|
|
336 |
# $_[2] = 0 for attribute nodes, 1 for other node types
|
|
337 |
my $vec = "";
|
|
338 |
vec ($vec, 0, $BITS) = $_[1];
|
|
339 |
vec ($vec, 7, 1) = $_[2] if $_[2]; # set leftmost bit (for non-attributes)
|
|
340 |
$_[0] . $vec;
|
|
341 |
}
|
|
342 |
|
|
343 |
#--------------- Sorting source nodes ----------------------------------------
|
|
344 |
|
|
345 |
# Sort the list by 'document order' (as per the XQL spec.)
|
|
346 |
# Values with an associated source node are sorted by the position of their
|
|
347 |
# source node in the XML document.
|
|
348 |
# Values without a source node are placed at the end of the resulting list.
|
|
349 |
# The source node of an Attribute node, is its (parent) Element node
|
|
350 |
# (per definition.) The source node of the other types of XML nodes, is itself.
|
|
351 |
# The order for values with the same source node is undefined.
|
|
352 |
|
|
353 |
sub sortDocOrder
|
|
354 |
{
|
|
355 |
#?? or should I just use: sort { $a->xql_sortKey cmp $b->xql_sortKey }
|
|
356 |
|
|
357 |
my $list = shift;
|
|
358 |
|
|
359 |
#print "before---\n";
|
|
360 |
#for (@$list)
|
|
361 |
#{
|
|
362 |
# print "key=" . keyStr($_->xql_sortKey) . " node=" . $_->getTagName . " id=" . $_->getAttribute('id') . "\n";
|
|
363 |
#}
|
|
364 |
|
|
365 |
@$list = map { $_->[1] } # 3) extract nodes
|
|
366 |
sort { $a->[0] cmp $b->[0] } # 2) sort by sortKey
|
|
367 |
map { [$_->xql_sortKey, $_] } # 1) make [sortKey,node] records
|
|
368 |
@$list;
|
|
369 |
|
|
370 |
#print "after---\n";
|
|
371 |
#for (@$list)
|
|
372 |
#{
|
|
373 |
# print "key=" . keyStr($_->xql_sortKey) . " node=" . $_->getTagName . " id=" . $_->getAttribute('id') . "\n";
|
|
374 |
#}
|
|
375 |
|
|
376 |
$list;
|
|
377 |
}
|
|
378 |
|
|
379 |
# Converts sort key from createSortKey in human readable form
|
|
380 |
# For debugging only.
|
|
381 |
sub keyStr
|
|
382 |
{
|
|
383 |
my $key = shift;
|
|
384 |
my $n = $BITS / 8;
|
|
385 |
my $bitn = 2 ** ($BITS - 1);
|
|
386 |
my $str;
|
|
387 |
for (my $i = 0; $i < length $key; $i += $n)
|
|
388 |
{
|
|
389 |
my $dig = substr ($key, $i, $n);
|
|
390 |
my $v = vec ($dig, 0, $BITS);
|
|
391 |
my $elem = 0;
|
|
392 |
if ($v >= $bitn)
|
|
393 |
{
|
|
394 |
$v -= $bitn;
|
|
395 |
$elem = 1;
|
|
396 |
}
|
|
397 |
$str .= "/" if defined $str;
|
|
398 |
$str .= "@" unless $elem;
|
|
399 |
$str .= $v;
|
|
400 |
}
|
|
401 |
$str;
|
|
402 |
}
|
|
403 |
|
|
404 |
sub isEmptyList
|
|
405 |
{
|
|
406 |
my $list = shift;
|
|
407 |
(ref ($list) eq "ARRAY") && (@$list == 0);
|
|
408 |
}
|
|
409 |
|
|
410 |
# Used by Element and Attribute nodes
|
|
411 |
sub buildNameSpaceExpr
|
|
412 |
{
|
|
413 |
my ($nameSpace, $name) = @_;
|
|
414 |
$name = ".*" if $name eq "*";
|
|
415 |
if (defined $nameSpace)
|
|
416 |
{
|
|
417 |
$nameSpace = ".*" if $nameSpace eq "*";
|
|
418 |
"^$nameSpace:$name\$";
|
|
419 |
}
|
|
420 |
else
|
|
421 |
{
|
|
422 |
"^$name\$";
|
|
423 |
}
|
|
424 |
}
|
|
425 |
|
|
426 |
sub prepareForCompare
|
|
427 |
{
|
|
428 |
my ($left, $right) = @_;
|
|
429 |
my $leftType = $left->xql_primType;
|
|
430 |
if ($leftType == 0) # Node
|
|
431 |
{
|
|
432 |
$left = $left->xql_value;
|
|
433 |
$leftType = $left->xql_primType;
|
|
434 |
}
|
|
435 |
my $rightType = $right->xql_primType;
|
|
436 |
if ($rightType == 0) # Node
|
|
437 |
{
|
|
438 |
$right = $right->xql_value;
|
|
439 |
$rightType = $right->xql_primType;
|
|
440 |
}
|
|
441 |
# Note: reverse the order if $leftType < $rightType
|
|
442 |
($leftType < $rightType, $left, $right);
|
|
443 |
}
|
|
444 |
|
|
445 |
sub xql_eq
|
|
446 |
{
|
|
447 |
my ($left, $right, $ignoreCase) = @_;
|
|
448 |
my $reverse;
|
|
449 |
($reverse, $left, $right) = prepareForCompare ($left, $right);
|
|
450 |
$reverse ? $right->xql_eq ($left, $ignoreCase)
|
|
451 |
: $left->xql_eq ($right, $ignoreCase);
|
|
452 |
}
|
|
453 |
|
|
454 |
sub xql_ne
|
|
455 |
{
|
|
456 |
my ($left, $right, $ignoreCase) = @_;
|
|
457 |
my $reverse;
|
|
458 |
($reverse, $left, $right) = prepareForCompare ($left, $right);
|
|
459 |
$reverse ? $right->xql_ne ($left, $ignoreCase)
|
|
460 |
: $left->xql_ne ($right, $ignoreCase);
|
|
461 |
}
|
|
462 |
|
|
463 |
sub xql_lt
|
|
464 |
{
|
|
465 |
my ($left, $right, $ignoreCase) = @_;
|
|
466 |
my $reverse;
|
|
467 |
($reverse, $left, $right) = prepareForCompare ($left, $right);
|
|
468 |
$reverse ? $right->xql_ge ($left, $ignoreCase)
|
|
469 |
: $left->xql_lt ($right, $ignoreCase);
|
|
470 |
}
|
|
471 |
|
|
472 |
sub xql_le
|
|
473 |
{
|
|
474 |
my ($left, $right, $ignoreCase) = @_;
|
|
475 |
my $reverse;
|
|
476 |
($reverse, $left, $right) = prepareForCompare ($left, $right);
|
|
477 |
$reverse ? $right->xql_gt ($left, $ignoreCase)
|
|
478 |
: $left->xql_le ($right, $ignoreCase);
|
|
479 |
}
|
|
480 |
|
|
481 |
sub xql_gt
|
|
482 |
{
|
|
483 |
my ($left, $right, $ignoreCase) = @_;
|
|
484 |
my $reverse;
|
|
485 |
($reverse, $left, $right) = prepareForCompare ($left, $right);
|
|
486 |
$reverse ? $right->xql_le ($left, $ignoreCase)
|
|
487 |
: $left->xql_gt ($right, $ignoreCase);
|
|
488 |
}
|
|
489 |
|
|
490 |
sub xql_ge
|
|
491 |
{
|
|
492 |
my ($left, $right, $ignoreCase) = @_;
|
|
493 |
my $reverse;
|
|
494 |
($reverse, $left, $right) = prepareForCompare ($left, $right);
|
|
495 |
$reverse ? $right->xql_lt ($left, $ignoreCase)
|
|
496 |
: $left->xql_ge ($right, $ignoreCase);
|
|
497 |
}
|
|
498 |
|
|
499 |
sub xql_ieq { xql_eq (@_, 1); }
|
|
500 |
sub xql_ine { xql_ne (@_, 1); }
|
|
501 |
sub xql_ilt { xql_lt (@_, 1); }
|
|
502 |
sub xql_igt { xql_gt (@_, 1); }
|
|
503 |
sub xql_ige { xql_ge (@_, 1); }
|
|
504 |
sub xql_ile { xql_le (@_, 1); }
|
|
505 |
|
|
506 |
sub tput
|
|
507 |
{
|
|
508 |
# Let me know if I need to add other systems for which 'tput' is not
|
|
509 |
# available.
|
|
510 |
if ($^O =~ /Win|MacOS/)
|
|
511 |
{
|
|
512 |
return undef;
|
|
513 |
}
|
|
514 |
else
|
|
515 |
{
|
|
516 |
my $c = shift;
|
|
517 |
|
|
518 |
# tput is only available on Unix systems.
|
|
519 |
# Calling `tput ...` on Windows generates warning messages
|
|
520 |
# that can not be suppressed.
|
|
521 |
return `tput $c`;
|
|
522 |
}
|
|
523 |
}
|
|
524 |
|
|
525 |
# Underline the query subexpression that fails (if tput exists)
|
|
526 |
$ContextStart = tput ('smul') || ">>"; # smul: underline on
|
|
527 |
$ContextEnd = tput ('rmul') || "<<"; # rmul: underline off
|
|
528 |
# Used for making the significant keyword of a subexpression bold, e.g. "$and$"
|
|
529 |
$BoldOn = tput ('bold') || "";
|
|
530 |
$BoldOff = tput ('rmul') . tput ('smul') || "";
|
|
531 |
# rmul reverts the string back to normal text, smul makes it underlined again,
|
|
532 |
# so the rest of the subexpresion will be underlined.
|
|
533 |
|
|
534 |
sub setErrorContextDelimiters
|
|
535 |
{
|
|
536 |
($ContextStart, $ContextEnd, $BoldOn, $BoldOff) = @_;
|
|
537 |
}
|
|
538 |
|
|
539 |
sub delim
|
|
540 |
{
|
|
541 |
my ($str, $node, $contextNode) = @_;
|
|
542 |
if ($node == $contextNode)
|
|
543 |
{
|
|
544 |
$str =~ s/\016([^\017]*)\017/$BoldOn$1$BoldOff/g;
|
|
545 |
"$ContextStart$str$ContextEnd";
|
|
546 |
}
|
|
547 |
else
|
|
548 |
{
|
|
549 |
$str =~ s/\016([^\017]*)\017/$1/g;
|
|
550 |
$str;
|
|
551 |
}
|
|
552 |
}
|
|
553 |
|
|
554 |
sub bold
|
|
555 |
{
|
|
556 |
my $x = shift;
|
|
557 |
"\016$x\017"; # arbitrary ASCII codes
|
|
558 |
}
|
|
559 |
|
|
560 |
sub parseError
|
|
561 |
{
|
|
562 |
my ($msg) = @_;
|
|
563 |
print STDERR $msg . "\n";
|
|
564 |
croak $msg;
|
|
565 |
}
|
|
566 |
|
|
567 |
# Builtin XQL functions (may not appear after Bang "!")
|
|
568 |
%Func =
|
|
569 |
(
|
|
570 |
ancestor => \&XML::XQL::Func::ancestor,
|
|
571 |
attribute => \&XML::XQL::Func::attribute,
|
|
572 |
comment => \&XML::XQL::Func::comment,
|
|
573 |
element => \&XML::XQL::Func::element,
|
|
574 |
id => \&XML::XQL::Func::id,
|
|
575 |
node => \&XML::XQL::Func::node,
|
|
576 |
pi => \&XML::XQL::Func::pi,
|
|
577 |
textNode => \&XML::XQL::Func::textNode,
|
|
578 |
true => \&XML::XQL::Func::true,
|
|
579 |
false => \&XML::XQL::Func::false,
|
|
580 |
|
|
581 |
# NOTE: date() is added with: use XML::XQL::Date;
|
|
582 |
);
|
|
583 |
|
|
584 |
# Builtin XQL methods (may appear after Bang "!")
|
|
585 |
%Method =
|
|
586 |
(
|
|
587 |
baseName => \&XML::XQL::Func::baseName,
|
|
588 |
count => \&XML::XQL::Func::count,
|
|
589 |
end => \&XML::XQL::Func::end,
|
|
590 |
'index' => \&XML::XQL::Func::xql_index,
|
|
591 |
namespace => \&XML::XQL::Func::namespace,
|
|
592 |
nodeName => \&XML::XQL::Func::nodeName,
|
|
593 |
nodeType => \&XML::XQL::Func::nodeType,
|
|
594 |
nodeTypeString => \&XML::XQL::Func::nodeTypeString,
|
|
595 |
prefix => \&XML::XQL::Func::prefix,
|
|
596 |
text => \&XML::XQL::Func::text,
|
|
597 |
rawText => \&XML::XQL::Func::rawText,
|
|
598 |
value => \&XML::XQL::Func::value,
|
|
599 |
);
|
|
600 |
|
|
601 |
# Number of arguments for builtin XQL functions:
|
|
602 |
# Value is either an integer or a range. Value is 0 if not specified.
|
|
603 |
# Range syntax:
|
|
604 |
#
|
|
605 |
# range ::= '[' start ',' end [ ',' start ',' end ]* ']'
|
|
606 |
# start ::= INTEGER
|
|
607 |
# end ::= INTEGER | '-1' ('-1' means: "or more")
|
|
608 |
#
|
|
609 |
# Example: [2, 4, 7, 7, 10, -1] means (2,3,4,7,10,11,...)
|
|
610 |
|
|
611 |
%FuncArgCount =
|
|
612 |
(
|
|
613 |
ancestor => 1,
|
|
614 |
attribute => [0,1],
|
|
615 |
count => [0,1],
|
|
616 |
# date => 1,
|
|
617 |
element => [0,1],
|
|
618 |
id => 1,
|
|
619 |
text => [0,1],
|
|
620 |
rawText => [0,1],
|
|
621 |
);
|
|
622 |
|
|
623 |
%AllowedOutsideSubquery =
|
|
624 |
(
|
|
625 |
ancestor => 1,
|
|
626 |
attribute => 1,
|
|
627 |
comment => 1,
|
|
628 |
element => 1,
|
|
629 |
id => 1,
|
|
630 |
node => 1,
|
|
631 |
pi => 1,
|
|
632 |
textNode => 1,
|
|
633 |
|
|
634 |
#?? what about subst etc.
|
|
635 |
);
|
|
636 |
|
|
637 |
# Functions that always return the same thing if their arguments are constant
|
|
638 |
%ConstFunc =
|
|
639 |
(
|
|
640 |
true => 1,
|
|
641 |
false => 1,
|
|
642 |
# date => 1,
|
|
643 |
);
|
|
644 |
|
|
645 |
%ExpandedType =
|
|
646 |
(
|
|
647 |
"boolean" => "XML::XQL::Boolean",
|
|
648 |
"text" => "XML::XQL::Text",
|
|
649 |
"number" => "XML::XQL::Number",
|
|
650 |
"date" => "XML::XQL::Date",
|
|
651 |
"node" => "XML::XQL::Node",
|
|
652 |
);
|
|
653 |
|
|
654 |
sub expandType
|
|
655 |
{
|
|
656 |
my ($type) = @_;
|
|
657 |
# Expand "number" to "XML::XQL::Number" etc.
|
|
658 |
my $expanded = $ExpandedType{"\L$type"};
|
|
659 |
defined $expanded ? $expanded : $type;
|
|
660 |
}
|
|
661 |
|
|
662 |
sub defineExpandedTypes
|
|
663 |
{
|
|
664 |
my (%args) = @_;
|
|
665 |
while (my ($key, $val) = each %args)
|
|
666 |
{
|
|
667 |
# Convert keys to lowercase
|
|
668 |
$ExpandedType{"\L$key"} = $val;
|
|
669 |
}
|
|
670 |
}
|
|
671 |
|
|
672 |
sub generateFunction
|
|
673 |
{
|
|
674 |
my ($name, $funcName, $returnType, $argCount, $allowedOutsideSubquery,
|
|
675 |
$const, $queryArg) = @_;
|
|
676 |
$argCount = 0 unless defined $argCount;
|
|
677 |
$allowedOutsideSubquery = 1 unless defined $allowedOutsideSubquery;
|
|
678 |
$const = 0 unless defined $const;
|
|
679 |
$queryArg = 0 unless defined $queryArg;
|
|
680 |
|
|
681 |
$returnType = expandType ($returnType);
|
|
682 |
my $wrapperName = "xql_wrap_$name";
|
|
683 |
$wrapperName =~ s/\W/_/g; # replace colons etc.
|
|
684 |
|
|
685 |
my $func;
|
|
686 |
my $code = <<END_CODE;
|
|
687 |
sub $wrapperName {
|
|
688 |
my (\$context, \$list, \@arg) = \@_;
|
|
689 |
for my \$i (0 .. \$#arg)
|
|
690 |
{
|
|
691 |
if (\$i == $queryArg)
|
|
692 |
{
|
|
693 |
\$arg[\$i] = XML::XQL::toList (\$arg[\$i]->solve (\$context, \$list));
|
|
694 |
}
|
|
695 |
else
|
|
696 |
{
|
|
697 |
\$arg[\$i] = XML::XQL::prepareRvalue (\$arg[\$i]->solve (\$context, \$list));
|
|
698 |
return [] if XML::XQL::isEmptyList (\$arg[\$i]);
|
|
699 |
\$arg[\$i] = \$arg[\$i]->xql_toString;
|
|
700 |
}
|
|
701 |
}
|
|
702 |
END_CODE
|
|
703 |
|
|
704 |
if (ref ($argCount) eq "ARRAY" && @$argCount == 2 &&
|
|
705 |
$argCount->[0] == $argCount->[1])
|
|
706 |
{
|
|
707 |
$argCount = $argCount->[0];
|
|
708 |
}
|
|
709 |
|
|
710 |
if ($queryArg != -1)
|
|
711 |
{
|
|
712 |
$code .=<<END_CODE;
|
|
713 |
my \@result = ();
|
|
714 |
my \@qp = \@{\$arg[$queryArg]};
|
|
715 |
for (my \$k = 0; \$k < \@qp; \$k++)
|
|
716 |
{
|
|
717 |
\$arg[$queryArg] = \$qp[\$k]->xql_toString;
|
|
718 |
END_CODE
|
|
719 |
}
|
|
720 |
|
|
721 |
if (ref ($argCount) ne "ARRAY")
|
|
722 |
{
|
|
723 |
$code .= " my \$result = $funcName (";
|
|
724 |
for my $i (0 .. $argCount-1)
|
|
725 |
{
|
|
726 |
$code .= ", " if $i;
|
|
727 |
$code .= "\$arg[$i]";
|
|
728 |
}
|
|
729 |
$code .= ");\n";
|
|
730 |
}
|
|
731 |
elsif (@$argCount == 2)
|
|
732 |
{
|
|
733 |
my ($start, $end) = ($argCount->[0], $argCount->[1]);
|
|
734 |
if ($end == -1)
|
|
735 |
{
|
|
736 |
$code .= " my \$result = $funcName (";
|
|
737 |
for my $i (0 .. ($start - 1))
|
|
738 |
{
|
|
739 |
$code .= ", " if $i;
|
|
740 |
$code .= "\$arg[$i]";
|
|
741 |
}
|
|
742 |
$code .= ", \@arg[" . $start . " .. \$#arg]);\n";
|
|
743 |
}
|
|
744 |
else
|
|
745 |
{
|
|
746 |
$code .= " my \$n = \@arg;\n my \$result;\n ";
|
|
747 |
for my $j ($argCount->[0] .. $argCount->[1])
|
|
748 |
{
|
|
749 |
$code .= " els" unless $j == $argCount->[0];
|
|
750 |
$code .= ($j == $argCount->[1] ? "e\n" :
|
|
751 |
"if (\$n == $j)\n");
|
|
752 |
$code .= " {\n \$result = $funcName (";
|
|
753 |
for my $i (0 .. $j-1)
|
|
754 |
{
|
|
755 |
$code .= ", " if $i;
|
|
756 |
$code .= "\$arg[$i]";
|
|
757 |
}
|
|
758 |
$code .= ");\n }\n";
|
|
759 |
}
|
|
760 |
}
|
|
761 |
}
|
|
762 |
else #?? what now...
|
|
763 |
{
|
|
764 |
$code .= " my \$result = $funcName (\@arg);\n";
|
|
765 |
}
|
|
766 |
|
|
767 |
if ($returnType eq "*") # return result as is
|
|
768 |
{
|
|
769 |
$code .= " \$result = [] unless defined \$result;\n";
|
|
770 |
}
|
|
771 |
else
|
|
772 |
{
|
|
773 |
$code .= " \$result = defined \$result ? new $returnType (\$result) : [];\n";
|
|
774 |
}
|
|
775 |
|
|
776 |
if ($queryArg == -1)
|
|
777 |
{
|
|
778 |
$code .= " \$result;\n}\n";
|
|
779 |
}
|
|
780 |
else
|
|
781 |
{
|
|
782 |
$code .= " push \@result, \$result;\n }\n \\\@result;\n}\n";
|
|
783 |
}
|
|
784 |
$code .= "\$func = \\\&$wrapperName;";
|
|
785 |
|
|
786 |
#print "CODE=$code\n";
|
|
787 |
|
|
788 |
eval "$code";
|
|
789 |
if ($@) { croak "generateFunction failed for $funcName: $@\n"; }
|
|
790 |
|
|
791 |
defineFunction ($name, $func, $argCount,
|
|
792 |
$allowedOutsideSubquery, $const);
|
|
793 |
}
|
|
794 |
|
|
795 |
sub defineFunction
|
|
796 |
{
|
|
797 |
my ($name, $func, $argCount, $allowedOutside, $const) = @_;
|
|
798 |
$Func{$name} = $func;
|
|
799 |
$FuncArgCount{$name} = $argCount;
|
|
800 |
$AllowedOutsideSubquery{$name} = 1 if $allowedOutside;
|
|
801 |
$ConstFunc{$name} = $const;
|
|
802 |
}
|
|
803 |
|
|
804 |
sub defineMethod
|
|
805 |
{
|
|
806 |
my ($name, $func, $argCount, $allowedOutside) = @_;
|
|
807 |
$Method{$name} = $func;
|
|
808 |
$FuncArgCount{$name} = $argCount;
|
|
809 |
$AllowedOutsideSubquery{$name} = 1 if $allowedOutside;
|
|
810 |
}
|
|
811 |
|
|
812 |
%CompareOper =
|
|
813 |
(
|
|
814 |
'eq' => \&XML::XQL::xql_eq,
|
|
815 |
'ne' => \&XML::XQL::xql_ne,
|
|
816 |
'le' => \&XML::XQL::xql_le,
|
|
817 |
'ge' => \&XML::XQL::xql_ge,
|
|
818 |
'gt' => \&XML::XQL::xql_gt,
|
|
819 |
'lt' => \&XML::XQL::xql_lt,
|
|
820 |
|
|
821 |
'ieq' => \&XML::XQL::xql_ieq,
|
|
822 |
'ine' => \&XML::XQL::xql_ine,
|
|
823 |
'ile' => \&XML::XQL::xql_ile,
|
|
824 |
'ige' => \&XML::XQL::xql_ige,
|
|
825 |
'igt' => \&XML::XQL::xql_igt,
|
|
826 |
'ilt' => \&XML::XQL::xql_ilt,
|
|
827 |
|
|
828 |
'=' => \&XML::XQL::xql_eq,
|
|
829 |
'!=' => \&XML::XQL::xql_ne,
|
|
830 |
'>' => \&XML::XQL::xql_gt,
|
|
831 |
'>=' => \&XML::XQL::xql_ge,
|
|
832 |
'<' => \&XML::XQL::xql_lt,
|
|
833 |
'<=' => \&XML::XQL::xql_le,
|
|
834 |
);
|
|
835 |
|
|
836 |
sub defineComparisonOperators
|
|
837 |
{
|
|
838 |
my (%args) = @_;
|
|
839 |
%CompareOper = (%CompareOper, %args);
|
|
840 |
}
|
|
841 |
|
|
842 |
sub defineTokenQ
|
|
843 |
{
|
|
844 |
$Token_q = $_[0];
|
|
845 |
}
|
|
846 |
|
|
847 |
sub defineTokenQQ
|
|
848 |
{
|
|
849 |
$Token_qq = $_[0];
|
|
850 |
}
|
|
851 |
|
|
852 |
my %ElementValueType = ();
|
|
853 |
my $ElementValueTypeCount = 0;
|
|
854 |
|
|
855 |
sub elementValue
|
|
856 |
{
|
|
857 |
my ($elem) = @_;
|
|
858 |
|
|
859 |
#?? raw text/recursive ?
|
|
860 |
|
|
861 |
return new XML::XQL::Text ($elem->xql_text, $elem)
|
|
862 |
if $ElementValueTypeCount == 0; # user hasn't defined any types
|
|
863 |
|
|
864 |
my $tagName = $elem->xql_nodeName;
|
|
865 |
my $func = $ElementValueType{$tagName};
|
|
866 |
return new XML::XQL::Text ($elem->xql_text, $elem) unless defined $func;
|
|
867 |
|
|
868 |
&$func ($elem, $tagName);
|
|
869 |
}
|
|
870 |
|
|
871 |
sub defineElementValueConvertor
|
|
872 |
{
|
|
873 |
my ($elemTagName, $func) = @_;
|
|
874 |
my $prev = defined $ElementValueType{$elemTagName};
|
|
875 |
$ElementValueType{$elemTagName} = $func;
|
|
876 |
if (defined $func != $prev)
|
|
877 |
{
|
|
878 |
defined $func ? $ElementValueTypeCount++ : $ElementValueTypeCount--;
|
|
879 |
}
|
|
880 |
}
|
|
881 |
|
|
882 |
my %AttrValueType = ();
|
|
883 |
my $AttrValueTypeCount = 0;
|
|
884 |
|
|
885 |
sub attrValue
|
|
886 |
{
|
|
887 |
my ($attr) = @_;
|
|
888 |
|
|
889 |
#?? raw text/recursive ?
|
|
890 |
return new XML::XQL::Text ($attr->xql_text, $attr)
|
|
891 |
if $AttrValueTypeCount == 0; # user hasn't defined any types
|
|
892 |
|
|
893 |
my $elem = $attr->xql_parent->xql_nodeName;
|
|
894 |
my $attrName = $attr->xql_nodeName;
|
|
895 |
my $func = $AttrValueType{"$elem $attrName"};
|
|
896 |
|
|
897 |
if (not defined $func)
|
|
898 |
{
|
|
899 |
$elem = "*";
|
|
900 |
$func = $AttrValueType{"$elem $attrName"};
|
|
901 |
}
|
|
902 |
return new XML::XQL::Text ($attr->xql_text, $attr) unless defined $func;
|
|
903 |
|
|
904 |
&$func ($attr, $attrName, $elem);
|
|
905 |
}
|
|
906 |
|
|
907 |
sub defineAttrValueConvertor
|
|
908 |
{
|
|
909 |
my ($elemTagName, $attrName, $type) = @_;
|
|
910 |
my $both = "$elemTagName $attrName";
|
|
911 |
|
|
912 |
my $prev = defined $AttrValueType{$both};
|
|
913 |
$AttrValueType{$both} = $type;
|
|
914 |
if (defined $type != $prev)
|
|
915 |
{
|
|
916 |
defined $type ? $AttrValueTypeCount++ : $AttrValueTypeCount--;
|
|
917 |
}
|
|
918 |
}
|
|
919 |
|
|
920 |
#=== debug
|
|
921 |
|
|
922 |
sub exception
|
|
923 |
{
|
|
924 |
my ($ex) = @_;
|
|
925 |
print "Exception: $ex\n" if $ex;
|
|
926 |
$ex;
|
|
927 |
}
|
|
928 |
|
|
929 |
sub d
|
|
930 |
{
|
|
931 |
my $n = shift;
|
|
932 |
my $type = ref $n;
|
|
933 |
|
|
934 |
if ($type eq "ARRAY")
|
|
935 |
{
|
|
936 |
my $str = "";
|
|
937 |
for my $i (@$n)
|
|
938 |
{
|
|
939 |
$str .= ", " unless $str eq "";
|
|
940 |
$str .= d ($i);
|
|
941 |
}
|
|
942 |
return "[$str]";
|
|
943 |
}
|
|
944 |
elsif ($type eq "HASH")
|
|
945 |
{
|
|
946 |
my $str = "";
|
|
947 |
while (my ($key, $val) = %$n)
|
|
948 |
{
|
|
949 |
$str .= ", " unless $str eq "";
|
|
950 |
$str .= $key . " => " . d ($val);
|
|
951 |
}
|
|
952 |
return "{$str}";
|
|
953 |
}
|
|
954 |
elsif ($type)
|
|
955 |
{
|
|
956 |
return $n->xql_contextString if ($n->isa ('XML::XQL::Operator'));
|
|
957 |
return "${type}\[" . $n->xql_toString . "]" if $n->isa ('XML::XQL::PrimitiveType');
|
|
958 |
# return "${type}\[" . $n->toString . "]" if $n->isa ('XML::DOM::Element');
|
|
959 |
}
|
|
960 |
$n;
|
|
961 |
}
|
|
962 |
|
|
963 |
|
|
964 |
package XML::XQL::Query;
|
|
965 |
|
|
966 |
use Carp;
|
|
967 |
use XML::XQL::Parser;
|
|
968 |
|
|
969 |
use vars qw( %Func %FuncArgCount );
|
|
970 |
|
|
971 |
my $parser = new XML::XQL::Parser;
|
|
972 |
|
|
973 |
# This is passed as 'yyerror' to YYParse
|
|
974 |
sub Error
|
|
975 |
{
|
|
976 |
my($parser) = shift;
|
|
977 |
|
|
978 |
print STDERR "Error in Query Expression near: " . $parser->YYData->{INPUT} . "\n";
|
|
979 |
}
|
|
980 |
|
|
981 |
sub defineFunction
|
|
982 |
{
|
|
983 |
my ($self, $name, $func, $argCount, $allowedOutside, $const) = @_;
|
|
984 |
$self->{Func}->{$name} = $func;
|
|
985 |
$self->{FuncArgCount}->{$name} = $argCount;
|
|
986 |
$self->{AllowedOutsideSubquery}->{$name} = 1 if $allowedOutside;
|
|
987 |
$self->{ConstFunc} = $const;
|
|
988 |
}
|
|
989 |
|
|
990 |
sub defineMethod
|
|
991 |
{
|
|
992 |
my ($self, $name, $func, $argCount, $allowedOutside) = @_;
|
|
993 |
$self->{Method}->{$name} = $func;
|
|
994 |
$self->{FuncArgCount}->{$name} = $argCount;
|
|
995 |
$self->{AllowedOutsideSubquery}->{$name} = 1 if $allowedOutside;
|
|
996 |
}
|
|
997 |
|
|
998 |
sub defineComparisonOperators
|
|
999 |
{
|
|
1000 |
my ($self, %args) = @_;
|
|
1001 |
$self->{CompareOper} = \%args;
|
|
1002 |
}
|
|
1003 |
|
|
1004 |
sub defineTokenQ
|
|
1005 |
{
|
|
1006 |
$_[0]->{'q'} = $_[1];
|
|
1007 |
}
|
|
1008 |
|
|
1009 |
sub defineTokenQQ
|
|
1010 |
{
|
|
1011 |
$_[0]->{'qq'} = $_[1];
|
|
1012 |
}
|
|
1013 |
|
|
1014 |
sub new
|
|
1015 |
{
|
|
1016 |
my ($class, %args) = @_;
|
|
1017 |
|
|
1018 |
croak "no Expr specified" unless defined $args{Expr};
|
|
1019 |
|
|
1020 |
my $self = bless \%args, $class;
|
|
1021 |
|
|
1022 |
my $error = $self->{'Error'} || \&XML::XQL::Query::Error;
|
|
1023 |
my $debug = defined ($self->{Debug}) ? $self->{Debug} : 0; # 0x17;
|
|
1024 |
|
|
1025 |
$self->{'q'} = $XML::XQL::Token_q unless exists $self->{'q'};
|
|
1026 |
$self->{'qq'} = $XML::XQL::Token_qq unless exists $self->{'qq'};
|
|
1027 |
|
|
1028 |
# Invoke the query expression parser
|
|
1029 |
$parser->YYData->{INPUT} = $self->{Expr};
|
|
1030 |
$parser->{Query} = $self;
|
|
1031 |
$self->{Tree} = $parser->YYParse (yylex => \&XML::XQL::Lexer,
|
|
1032 |
yyerror => $error,
|
|
1033 |
yydebug => $debug);
|
|
1034 |
|
|
1035 |
# Nothing but whitespace should be left over
|
|
1036 |
if ($parser->YYData->{INPUT} !~ /^\s*$/)
|
|
1037 |
{
|
|
1038 |
XML::XQL::parseError ("Error when parsing expression. Unexpected characters at end of expression [" . $parser->YYData->{INPUT} . "]")
|
|
1039 |
}
|
|
1040 |
|
|
1041 |
XML::XQL::parseError ("Error when parsing expression")
|
|
1042 |
unless defined $self->{Tree};
|
|
1043 |
|
|
1044 |
$self->{Tree}->{Query} = $self;
|
|
1045 |
$self->{Tree}->xql_check (0, 0); # inSubQuery=0, inParam=0
|
|
1046 |
|
|
1047 |
print "Expression parsed successfully\n" if $debug;
|
|
1048 |
|
|
1049 |
$self;
|
|
1050 |
}
|
|
1051 |
|
|
1052 |
sub dispose
|
|
1053 |
{
|
|
1054 |
my $self = shift;
|
|
1055 |
|
|
1056 |
undef $self->{Tree}->{Query};
|
|
1057 |
|
|
1058 |
$self->{Tree}->dispose;
|
|
1059 |
delete $self->{Tree};
|
|
1060 |
}
|
|
1061 |
|
|
1062 |
sub isNodeQuery
|
|
1063 |
{
|
|
1064 |
$_[0]->{NodeQuery};
|
|
1065 |
}
|
|
1066 |
|
|
1067 |
sub solve
|
|
1068 |
{
|
|
1069 |
my ($self, @list) = @_;
|
|
1070 |
my $context = undef;
|
|
1071 |
|
|
1072 |
# clear cached "once" values
|
|
1073 |
$self->{Tree}->xql_prepCache;
|
|
1074 |
my $result = $self->{Tree}->solve ($context, \@list);
|
|
1075 |
ref ($result) eq "ARRAY" ? @$result : ($result);
|
|
1076 |
}
|
|
1077 |
|
|
1078 |
sub toString
|
|
1079 |
{
|
|
1080 |
$_[0]->{Expr};
|
|
1081 |
}
|
|
1082 |
|
|
1083 |
sub toDOM
|
|
1084 |
{
|
|
1085 |
my ($self, $doc) = @_;
|
|
1086 |
my $root = $doc->createElement ("XQL");
|
|
1087 |
$doc->appendChild ($root);
|
|
1088 |
$root->appendChild ($self->{Tree}->xql_toDOM ($doc));
|
|
1089 |
$doc;
|
|
1090 |
}
|
|
1091 |
|
|
1092 |
sub findComparisonOperator
|
|
1093 |
{
|
|
1094 |
my ($self, $name) = @_;
|
|
1095 |
my $cmp;
|
|
1096 |
if (exists $self->{CompareOper}->{$name})
|
|
1097 |
{
|
|
1098 |
$cmp = $self->{CompareOper}->{$name};
|
|
1099 |
}
|
|
1100 |
else
|
|
1101 |
{
|
|
1102 |
$cmp = $XML::XQL::CompareOper{$name};
|
|
1103 |
}
|
|
1104 |
if (not defined $cmp)
|
|
1105 |
{
|
|
1106 |
XML::XQL::parseError ("undefined comparison operator '$name'");
|
|
1107 |
}
|
|
1108 |
$cmp;
|
|
1109 |
}
|
|
1110 |
|
|
1111 |
# Return function pointer. Croak if wrong number of arguments.
|
|
1112 |
sub findFunctionOrMethod
|
|
1113 |
{
|
|
1114 |
my ($self, $name, $args) = @_;
|
|
1115 |
|
|
1116 |
my $func;
|
|
1117 |
my $type = "function";
|
|
1118 |
if (exists $self->{Func}->{$name})
|
|
1119 |
{
|
|
1120 |
$func = $self->{Func}->{$name};
|
|
1121 |
}
|
|
1122 |
elsif (exists $self->{Method}->{$name})
|
|
1123 |
{
|
|
1124 |
$func = $self->{Method}->{$name};
|
|
1125 |
$type = "method";
|
|
1126 |
}
|
|
1127 |
elsif (defined $XML::XQL::Func{$name})
|
|
1128 |
{
|
|
1129 |
$func = $XML::XQL::Func{$name};
|
|
1130 |
}
|
|
1131 |
elsif (defined $XML::XQL::Method{$name})
|
|
1132 |
{
|
|
1133 |
$func = $XML::XQL::Method{$name};
|
|
1134 |
$type = "method";
|
|
1135 |
}
|
|
1136 |
elsif (not $XML::XQL::Restricted)
|
|
1137 |
{
|
|
1138 |
$func = XML::XQL::generatePerlWrapper ($name);
|
|
1139 |
}
|
|
1140 |
|
|
1141 |
XML::XQL::parseError ("undefined function/method '$name' in query '" .
|
|
1142 |
$self->toString . "'")
|
|
1143 |
unless defined &$func;
|
|
1144 |
|
|
1145 |
my $funcArgCount = $self->{FuncArgCount}->{$name}
|
|
1146 |
|| $XML::XQL::FuncArgCount{$name} || 0;
|
|
1147 |
|
|
1148 |
# Check number of args
|
|
1149 |
my $nargs = @$args;
|
|
1150 |
|
|
1151 |
#print "$args " . XML::XQL::d($args) . "\n";
|
|
1152 |
|
|
1153 |
my $ok = 0;
|
|
1154 |
if (ref ($funcArgCount) eq "ARRAY")
|
|
1155 |
{
|
|
1156 |
my $i = 0;
|
|
1157 |
my $n = @$funcArgCount;
|
|
1158 |
while ($i < $n)
|
|
1159 |
{
|
|
1160 |
my $s = $funcArgCount->[$i++];
|
|
1161 |
my $e = $funcArgCount->[$i++] || $s; # same as $s if odd #args
|
|
1162 |
if ($nargs >= $s && ($e == -1 || $nargs <= $e))
|
|
1163 |
{
|
|
1164 |
$ok = 1; # found it
|
|
1165 |
last;
|
|
1166 |
}
|
|
1167 |
}
|
|
1168 |
}
|
|
1169 |
else
|
|
1170 |
{
|
|
1171 |
$ok = ($nargs eq $funcArgCount);
|
|
1172 |
}
|
|
1173 |
|
|
1174 |
XML::XQL::parseError ("wrong number of args ($nargs) for $type $name in query '" .
|
|
1175 |
$self->toString . "', it should be " . XML::XQL::d($funcArgCount))
|
|
1176 |
if not $ok;
|
|
1177 |
|
|
1178 |
return ($func, $type);
|
|
1179 |
}
|
|
1180 |
|
|
1181 |
sub isAllowedOutsideSubquery
|
|
1182 |
{
|
|
1183 |
my ($self, $funcName) = @_;
|
|
1184 |
my ($ok) = $self->{AllowedOutsideSubquery}->{$funcName};
|
|
1185 |
return $ok if defined $ok;
|
|
1186 |
$XML::XQL::AllowedOutsideSubquery{$funcName};
|
|
1187 |
}
|
|
1188 |
|
|
1189 |
package XML::XQL::Operator;
|
|
1190 |
use fields qw{ Left Right Parent };
|
|
1191 |
|
|
1192 |
sub new
|
|
1193 |
{
|
|
1194 |
my ($class, %attr) = @_;
|
|
1195 |
my $self = bless \%attr, $class;
|
|
1196 |
|
|
1197 |
$self->{Left}->setParent ($self) if defined $self->{Left};
|
|
1198 |
$self->{Right}->setParent ($self) if defined $self->{Right};
|
|
1199 |
|
|
1200 |
$self;
|
|
1201 |
}
|
|
1202 |
|
|
1203 |
sub dispose
|
|
1204 |
{
|
|
1205 |
my $self = shift;
|
|
1206 |
if (defined ($self->{Left}))
|
|
1207 |
{
|
|
1208 |
$self->{Left}->dispose;
|
|
1209 |
undef $self->{Left};
|
|
1210 |
}
|
|
1211 |
if (defined ($self->{Right}))
|
|
1212 |
{
|
|
1213 |
$self->{Right}->dispose;
|
|
1214 |
undef $self->{Right};
|
|
1215 |
}
|
|
1216 |
|
|
1217 |
undef $self->{Parent};
|
|
1218 |
}
|
|
1219 |
|
|
1220 |
sub xql_check
|
|
1221 |
{
|
|
1222 |
my ($self, $inSubQuery, $inParam) = @_;
|
|
1223 |
$self->{Left}->xql_check ($inSubQuery, $inParam);
|
|
1224 |
$self->{Right}->xql_check ($inSubQuery, $inParam) if defined $self->{Right};
|
|
1225 |
}
|
|
1226 |
|
|
1227 |
sub xql_prepCache
|
|
1228 |
{
|
|
1229 |
my ($self) = @_;
|
|
1230 |
$self->{Left}->xql_prepCache;
|
|
1231 |
$self->{Right}->xql_prepCache if defined $self->{Right};
|
|
1232 |
}
|
|
1233 |
|
|
1234 |
sub xql_toDOM
|
|
1235 |
{
|
|
1236 |
my ($self, $doc) = @_;
|
|
1237 |
my $name = ref $self;
|
|
1238 |
$name =~ s/.*:://;
|
|
1239 |
my $elem = $doc->createElement ($name);
|
|
1240 |
if (defined $self->{Left})
|
|
1241 |
{
|
|
1242 |
my $left = $doc->createElement ("left");
|
|
1243 |
$elem->appendChild ($left);
|
|
1244 |
$left->appendChild ($self->{Left}->xql_toDOM ($doc));
|
|
1245 |
}
|
|
1246 |
if (defined $self->{Right})
|
|
1247 |
{
|
|
1248 |
my $right = $doc->createElement ("right");
|
|
1249 |
$elem->appendChild ($right);
|
|
1250 |
$right->appendChild ($self->{Right}->xql_toDOM ($doc));
|
|
1251 |
}
|
|
1252 |
$elem;
|
|
1253 |
}
|
|
1254 |
|
|
1255 |
sub isConstant
|
|
1256 |
{
|
|
1257 |
0;
|
|
1258 |
}
|
|
1259 |
|
|
1260 |
# Overriden by Union and Path operators
|
|
1261 |
sub mustSort
|
|
1262 |
{
|
|
1263 |
0;
|
|
1264 |
}
|
|
1265 |
|
|
1266 |
sub setParent
|
|
1267 |
{
|
|
1268 |
$_[0]->{Parent} = $_[1];
|
|
1269 |
}
|
|
1270 |
|
|
1271 |
sub warning
|
|
1272 |
{
|
|
1273 |
my ($self, $msg) = @_;
|
|
1274 |
print STDERR "WARNING: $msg";
|
|
1275 |
print STDERR " Context: " . $self->toContextString . "\n";
|
|
1276 |
}
|
|
1277 |
|
|
1278 |
sub root
|
|
1279 |
{
|
|
1280 |
my ($self) = @_;
|
|
1281 |
my $top = $self;
|
|
1282 |
|
|
1283 |
while (defined ($top->{Parent}))
|
|
1284 |
{
|
|
1285 |
$top = $top->{Parent};
|
|
1286 |
}
|
|
1287 |
$top;
|
|
1288 |
}
|
|
1289 |
|
|
1290 |
sub query
|
|
1291 |
{
|
|
1292 |
$_[0]->root->{Query};
|
|
1293 |
}
|
|
1294 |
|
|
1295 |
sub toContextString
|
|
1296 |
{
|
|
1297 |
my ($self) = @_;
|
|
1298 |
$self->root->xql_contextString ($self);
|
|
1299 |
}
|
|
1300 |
|
|
1301 |
sub debugString
|
|
1302 |
{
|
|
1303 |
my ($self) = @_;
|
|
1304 |
my $str = "[" . ref($self);
|
|
1305 |
while (my ($key, $val) = each %$self)
|
|
1306 |
{
|
|
1307 |
$str .= "$key=>" . XML::XQL::d($val);
|
|
1308 |
}
|
|
1309 |
$str . "]";
|
|
1310 |
}
|
|
1311 |
|
|
1312 |
sub verbose
|
|
1313 |
{
|
|
1314 |
my ($self, $str, $list) = @_;
|
|
1315 |
# print STDERR "$self - $str: " . XML::XQL::d($list) . "\n";
|
|
1316 |
$list;
|
|
1317 |
}
|
|
1318 |
|
|
1319 |
package XML::XQL::Root; # "/" at start of XQL expression
|
|
1320 |
use base 'XML::XQL::Operator'; # L -> L
|
|
1321 |
|
|
1322 |
sub solve
|
|
1323 |
{
|
|
1324 |
my ($self, $context, $list) = @_;
|
|
1325 |
return [] if (@$list < 1);
|
|
1326 |
|
|
1327 |
#?? what if first value is not a XML::XQL::Node? should we try the second one?
|
|
1328 |
[$list->[0]->xql_document];
|
|
1329 |
}
|
|
1330 |
#?? add isOnce here?
|
|
1331 |
|
|
1332 |
sub xql_check
|
|
1333 |
{
|
|
1334 |
}
|
|
1335 |
|
|
1336 |
sub xql_prepCache
|
|
1337 |
{
|
|
1338 |
}
|
|
1339 |
|
|
1340 |
sub xql_contextString
|
|
1341 |
{
|
|
1342 |
XML::XQL::delim ("/", @_);
|
|
1343 |
}
|
|
1344 |
|
|
1345 |
package XML::XQL::Path;
|
|
1346 |
use base 'XML::XQL::Operator'; # L -> L
|
|
1347 |
use fields qw{ PathOp };
|
|
1348 |
|
|
1349 |
sub new
|
|
1350 |
{
|
|
1351 |
my ($class, %arg) = @_;
|
|
1352 |
my $self = bless \%arg, $class;
|
|
1353 |
|
|
1354 |
$self->{Left} ||= new XML::XQL::Root;
|
|
1355 |
|
|
1356 |
$self->{Left}->setParent ($self);
|
|
1357 |
$self->{Right}->setParent ($self);
|
|
1358 |
|
|
1359 |
$self;
|
|
1360 |
}
|
|
1361 |
|
|
1362 |
sub solve
|
|
1363 |
{
|
|
1364 |
my ($self, $context, $list) = @_;
|
|
1365 |
$list = $self->{Left}->solve ($context, $list);
|
|
1366 |
$self->verbose ("left", $list);
|
|
1367 |
|
|
1368 |
return $list if @$list < 1;
|
|
1369 |
|
|
1370 |
if ($self->{PathOp} eq '/')
|
|
1371 |
{
|
|
1372 |
$self->verbose ("result", $self->{Right}->solve ($context, $list));
|
|
1373 |
}
|
|
1374 |
else # recurse "//"
|
|
1375 |
{
|
|
1376 |
my $new_list = [];
|
|
1377 |
my $n = @$list;
|
|
1378 |
NODE: for (my $i = 0; $i < $n; $i++)
|
|
1379 |
{
|
|
1380 |
my $node = $list->[$i];
|
|
1381 |
# Node must be an Element or must be allowed to contain Elements
|
|
1382 |
# i.e. must be an Element or a Document
|
|
1383 |
# (DocumentFragment is not expected here)
|
|
1384 |
my $nodeType = $node->xql_nodeType;
|
|
1385 |
next NODE unless ($nodeType == 1 || $nodeType == 9);
|
|
1386 |
|
|
1387 |
# Skip the node if one of its ancestors is part of the input $list
|
|
1388 |
# (and therefore already processed)
|
|
1389 |
my $parent = $node->xql_parent;
|
|
1390 |
while (defined $parent)
|
|
1391 |
{
|
|
1392 |
for (my $j = $i - 1; $j >= 0; $j--)
|
|
1393 |
{
|
|
1394 |
next NODE if ($parent == $list->[$j]);
|
|
1395 |
}
|
|
1396 |
$parent = $parent->xql_parent;
|
|
1397 |
}
|
|
1398 |
recurse ($node, $new_list);
|
|
1399 |
}
|
|
1400 |
|
|
1401 |
my $results = $self->{Right}->solve ($context, $new_list);
|
|
1402 |
|
|
1403 |
# Sort the result list unless the parent Operator will sort
|
|
1404 |
my $parent = $self->{Parent};
|
|
1405 |
XML::XQL::sortDocOrder ($results)
|
|
1406 |
unless defined ($parent) and $parent->mustSort;
|
|
1407 |
|
|
1408 |
$self->verbose ("result //", $results);
|
|
1409 |
}
|
|
1410 |
}
|
|
1411 |
|
|
1412 |
sub mustSort
|
|
1413 |
{
|
|
1414 |
$_[0]->{PathOp} eq '//';
|
|
1415 |
}
|
|
1416 |
|
|
1417 |
sub recurse
|
|
1418 |
{
|
|
1419 |
my ($node, $list) = @_;
|
|
1420 |
push @$list, $node;
|
|
1421 |
for my $kid (@{$node->xql_element})
|
|
1422 |
{
|
|
1423 |
recurse ($kid, $list);
|
|
1424 |
}
|
|
1425 |
}
|
|
1426 |
|
|
1427 |
sub xql_contextString
|
|
1428 |
{
|
|
1429 |
my $self = shift;
|
|
1430 |
|
|
1431 |
my $str = $self->{Left}->isa ('XML::XQL::Root') ?
|
|
1432 |
"" : $self->{Left}->xql_contextString (@_);
|
|
1433 |
|
|
1434 |
XML::XQL::delim ($str . XML::XQL::bold($self->{PathOp}) .
|
|
1435 |
$self->{Right}->xql_contextString (@_), $self, @_);
|
|
1436 |
}
|
|
1437 |
|
|
1438 |
sub xql_toDOM
|
|
1439 |
{
|
|
1440 |
my ($self, $doc) = @_;
|
|
1441 |
my $elem = $self->SUPER::xql_toDOM ($doc);
|
|
1442 |
$elem->setAttribute ("pathOp", $self->{PathOp});
|
|
1443 |
$elem;
|
|
1444 |
}
|
|
1445 |
|
|
1446 |
package XML::XQL::Sequence; # "elem;elem" or "elem;;elem"
|
|
1447 |
use base 'XML::XQL::Operator'; # L -> L
|
|
1448 |
use fields qw{ Oper };
|
|
1449 |
|
|
1450 |
# See "The Design of XQL" by Jonathan Robie
|
|
1451 |
# <URL:http://www.texcel.no/whitepapers/xql-design.html>
|
|
1452 |
# for definition of Sequence operators.
|
|
1453 |
|
|
1454 |
# Note that the "naive" implementation slows things down quite a bit here...
|
|
1455 |
sub solve
|
|
1456 |
{
|
|
1457 |
my ($self, $context, $list) = @_;
|
|
1458 |
my $left = $self->{Left}->solve ($context, $list);
|
|
1459 |
$self->verbose ("left", $left);
|
|
1460 |
return [] unless @$left;
|
|
1461 |
|
|
1462 |
my $right = $self->{Right}->solve ($context, $list);
|
|
1463 |
$self->verbose ("right", $right);
|
|
1464 |
return [] unless @$right;
|
|
1465 |
|
|
1466 |
my @result;
|
|
1467 |
if ($self->{Oper} eq ';') # immediately precedes
|
|
1468 |
{
|
|
1469 |
my %hleft; @hleft{@$left} = (); # initialize all values to undef
|
|
1470 |
my %pushed;
|
|
1471 |
|
|
1472 |
for my $r (@$right)
|
|
1473 |
{
|
|
1474 |
# Find previous sibling that is not a text node that has only
|
|
1475 |
# whitespace that can be ignored (because xml:space=preserve)
|
|
1476 |
my $prev = $r->xql_prevNonWS;
|
|
1477 |
# $prev must be defined and must exist in $left
|
|
1478 |
next unless $prev and exists $hleft{$prev};
|
|
1479 |
|
|
1480 |
# Filter duplicates (no need to sort afterwards)
|
|
1481 |
push @result, $prev unless $pushed{$prev}++;
|
|
1482 |
push @result, $r unless $pushed{$r}++;
|
|
1483 |
}
|
|
1484 |
}
|
|
1485 |
else # oper eq ';;' (i.e. precedes)
|
|
1486 |
{
|
|
1487 |
my %pushed;
|
|
1488 |
|
|
1489 |
for my $r (@$right)
|
|
1490 |
{
|
|
1491 |
for my $l (@$left)
|
|
1492 |
{
|
|
1493 |
# If left node precedes right node, add them
|
|
1494 |
if ($l->xql_sortKey lt $r->xql_sortKey)
|
|
1495 |
{
|
|
1496 |
# Filter duplicates
|
|
1497 |
push @result, $l unless $pushed{$l}++;
|
|
1498 |
push @result, $r unless $pushed{$r}++;
|
|
1499 |
}
|
|
1500 |
}
|
|
1501 |
|
|
1502 |
#?? optimize - left & right are already sorted...
|
|
1503 |
# sort in document order
|
|
1504 |
XML::XQL::sortDocOrder (\@result) if @result;
|
|
1505 |
}
|
|
1506 |
}
|
|
1507 |
\@result;
|
|
1508 |
}
|
|
1509 |
|
|
1510 |
sub xql_contextString
|
|
1511 |
{
|
|
1512 |
my $self = shift;
|
|
1513 |
XML::XQL::delim ($self->{Left}->xql_contextString (@_) .
|
|
1514 |
XML::XQL::bold($self->{Oper}) .
|
|
1515 |
$self->{Right}->xql_contextString (@_), $self, @_);
|
|
1516 |
}
|
|
1517 |
|
|
1518 |
package XML::XQL::Current; # "."
|
|
1519 |
use base 'XML::XQL::Operator'; # L -> L
|
|
1520 |
|
|
1521 |
sub xql_check
|
|
1522 |
{
|
|
1523 |
}
|
|
1524 |
|
|
1525 |
sub xql_prepCache
|
|
1526 |
{
|
|
1527 |
}
|
|
1528 |
|
|
1529 |
sub solve
|
|
1530 |
{
|
|
1531 |
my ($self, $context, $list) = @_;
|
|
1532 |
$list;
|
|
1533 |
}
|
|
1534 |
|
|
1535 |
sub xql_contextString
|
|
1536 |
{
|
|
1537 |
XML::XQL::delim (".", @_);
|
|
1538 |
}
|
|
1539 |
|
|
1540 |
package XML::XQL::Parent; # ".."
|
|
1541 |
use base 'XML::XQL::Operator';
|
|
1542 |
|
|
1543 |
sub xql_check
|
|
1544 |
{
|
|
1545 |
}
|
|
1546 |
|
|
1547 |
sub xql_prepCache
|
|
1548 |
{
|
|
1549 |
}
|
|
1550 |
|
|
1551 |
sub solve
|
|
1552 |
{
|
|
1553 |
my ($self, $context, $list) = @_;
|
|
1554 |
my @result = ();
|
|
1555 |
for my $node (@$list)
|
|
1556 |
{
|
|
1557 |
push @result, $node->xql_parent;
|
|
1558 |
}
|
|
1559 |
\@result;
|
|
1560 |
}
|
|
1561 |
|
|
1562 |
sub xql_contextString
|
|
1563 |
{
|
|
1564 |
XML::XQL::delim ("..", @_);
|
|
1565 |
}
|
|
1566 |
|
|
1567 |
package XML::XQL::Element; # "elem"
|
|
1568 |
use base 'XML::XQL::Operator'; # L -> L
|
|
1569 |
use fields qw{ Name NameSpace Expr };
|
|
1570 |
|
|
1571 |
sub new
|
|
1572 |
{
|
|
1573 |
my ($class, %args) = @_;
|
|
1574 |
if (not defined ($args{NameSpace}))
|
|
1575 |
{
|
|
1576 |
if ($args{Name} eq "*")
|
|
1577 |
{
|
|
1578 |
return bless \%args, 'XML::XQL::AllElements';
|
|
1579 |
}
|
|
1580 |
else
|
|
1581 |
{
|
|
1582 |
return bless \%args, 'XML::XQL::SimpleElement';
|
|
1583 |
}
|
|
1584 |
}
|
|
1585 |
|
|
1586 |
$args{Expr} = XML::XQL::buildNameSpaceExpr ($args{NameSpace},
|
|
1587 |
$args{Name});
|
|
1588 |
bless \%args, $class;
|
|
1589 |
}
|
|
1590 |
|
|
1591 |
sub xql_check
|
|
1592 |
{
|
|
1593 |
}
|
|
1594 |
|
|
1595 |
sub xql_prepCache
|
|
1596 |
{
|
|
1597 |
}
|
|
1598 |
|
|
1599 |
sub solve
|
|
1600 |
{
|
|
1601 |
my ($self, $context, $list) = @_;
|
|
1602 |
my @result = ();
|
|
1603 |
|
|
1604 |
my $expr = $self->{Expr};
|
|
1605 |
for my $node (@$list)
|
|
1606 |
{
|
|
1607 |
for my $kid (@{$node->xql_element})
|
|
1608 |
{
|
|
1609 |
push @result, $kid if $kid->xql_nodeName =~ /$expr/;
|
|
1610 |
}
|
|
1611 |
}
|
|
1612 |
\@result;
|
|
1613 |
}
|
|
1614 |
|
|
1615 |
sub xql_contextString
|
|
1616 |
{
|
|
1617 |
my $self = shift;
|
|
1618 |
my $name = $self->{Name};
|
|
1619 |
my $space = $self->{NameSpace};
|
|
1620 |
|
|
1621 |
my $str = defined($space) ? "$space:$name" : $name;
|
|
1622 |
|
|
1623 |
XML::XQL::delim ($str, $self, @_);
|
|
1624 |
}
|
|
1625 |
|
|
1626 |
sub xql_toDOM
|
|
1627 |
{
|
|
1628 |
my ($self, $doc) = @_;
|
|
1629 |
my $elem = $self->SUPER::xql_toDOM ($doc);
|
|
1630 |
|
|
1631 |
my $name = $self->{Name};
|
|
1632 |
my $space = $self->{NameSpace};
|
|
1633 |
my $str = defined($space) ? "$space:$name" : $name;
|
|
1634 |
|
|
1635 |
$elem->setAttribute ("name", $str);
|
|
1636 |
$elem;
|
|
1637 |
}
|
|
1638 |
|
|
1639 |
package XML::XQL::SimpleElement; # "elem"
|
|
1640 |
use base 'XML::XQL::Element'; # L -> L
|
|
1641 |
|
|
1642 |
sub solve
|
|
1643 |
{
|
|
1644 |
my ($self, $context, $list) = @_;
|
|
1645 |
my @result = ();
|
|
1646 |
my $name = $self->{Name};
|
|
1647 |
|
|
1648 |
for my $node (@$list)
|
|
1649 |
{
|
|
1650 |
push @result, @{ $node->xql_element ($name) };
|
|
1651 |
}
|
|
1652 |
\@result;
|
|
1653 |
}
|
|
1654 |
|
|
1655 |
package XML::XQL::AllElements; # "*"
|
|
1656 |
use base 'XML::XQL::Element'; # L -> L
|
|
1657 |
|
|
1658 |
sub solve
|
|
1659 |
{
|
|
1660 |
my ($self, $context, $list) = @_;
|
|
1661 |
my @result = ();
|
|
1662 |
|
|
1663 |
for my $node (@$list)
|
|
1664 |
{
|
|
1665 |
push @result, @{$node->xql_element};
|
|
1666 |
}
|
|
1667 |
\@result;
|
|
1668 |
}
|
|
1669 |
|
|
1670 |
package XML::XQL::Attribute; # "@attr"
|
|
1671 |
use base 'XML::XQL::Operator'; # L -> L of Attributes
|
|
1672 |
use fields qw{ Name NameSpace Expr };
|
|
1673 |
|
|
1674 |
sub new
|
|
1675 |
{
|
|
1676 |
my ($class, %args) = @_;
|
|
1677 |
|
|
1678 |
if (not defined ($args{NameSpace}))
|
|
1679 |
{
|
|
1680 |
if ($args{Name} eq "*")
|
|
1681 |
{
|
|
1682 |
return bless \%args, 'XML::XQL::AllAttr';
|
|
1683 |
}
|
|
1684 |
else
|
|
1685 |
{
|
|
1686 |
return bless \%args, 'XML::XQL::SimpleAttr';
|
|
1687 |
}
|
|
1688 |
}
|
|
1689 |
|
|
1690 |
$args{Expr} = XML::XQL::buildNameSpaceExpr ($args{NameSpace},
|
|
1691 |
$args{Name});
|
|
1692 |
bless \%args, $class;
|
|
1693 |
}
|
|
1694 |
|
|
1695 |
sub xql_check
|
|
1696 |
{
|
|
1697 |
}
|
|
1698 |
|
|
1699 |
sub xql_prepCache
|
|
1700 |
{
|
|
1701 |
}
|
|
1702 |
|
|
1703 |
sub solve
|
|
1704 |
{
|
|
1705 |
my ($self, $context, $list) = @_;
|
|
1706 |
my @result = ();
|
|
1707 |
|
|
1708 |
my $expr = $self->{Expr};
|
|
1709 |
for my $node (@$list)
|
|
1710 |
{
|
|
1711 |
for my $kid (@{$node->xql_attribute})
|
|
1712 |
{
|
|
1713 |
push @result, $kid if $kid->xql_nodeName =~ /$expr/;
|
|
1714 |
}
|
|
1715 |
}
|
|
1716 |
}
|
|
1717 |
|
|
1718 |
sub xql_contextString
|
|
1719 |
{
|
|
1720 |
my $self = shift;
|
|
1721 |
my $name = $self->{Name};
|
|
1722 |
my $space = $self->{NameSpace};
|
|
1723 |
|
|
1724 |
my $str = defined($space) ? "\@$space:$name" : ('@' . $name);
|
|
1725 |
|
|
1726 |
XML::XQL::delim ($str, $self, @_);
|
|
1727 |
}
|
|
1728 |
|
|
1729 |
package XML::XQL::SimpleAttr; # "@attr"
|
|
1730 |
use base 'XML::XQL::Attribute'; # L -> L
|
|
1731 |
|
|
1732 |
sub solve
|
|
1733 |
{
|
|
1734 |
my ($self, $context, $list) = @_;
|
|
1735 |
my @result = ();
|
|
1736 |
my $name = $self->{Name};
|
|
1737 |
|
|
1738 |
for my $node (@$list)
|
|
1739 |
{
|
|
1740 |
push @result, @{ $node->xql_attribute ($name) };
|
|
1741 |
}
|
|
1742 |
\@result;
|
|
1743 |
}
|
|
1744 |
|
|
1745 |
package XML::XQL::AllAttr; # "@*"
|
|
1746 |
use base 'XML::XQL::Attribute'; # L -> L
|
|
1747 |
|
|
1748 |
sub solve
|
|
1749 |
{
|
|
1750 |
my ($self, $context, $list) = @_;
|
|
1751 |
my @result = ();
|
|
1752 |
|
|
1753 |
for my $node (@$list)
|
|
1754 |
{
|
|
1755 |
push @result, @{$node->xql_attribute};
|
|
1756 |
}
|
|
1757 |
\@result;
|
|
1758 |
}
|
|
1759 |
|
|
1760 |
package XML::XQL::Subscript; # "[3, 5 $to$ 7, -1]"
|
|
1761 |
use base 'XML::XQL::Operator'; # L -> L
|
|
1762 |
use fields qw{ IndexList };
|
|
1763 |
|
|
1764 |
#?? optimize for simple subscripts
|
|
1765 |
sub solve
|
|
1766 |
{
|
|
1767 |
my ($self, $context, $inlist) = @_;
|
|
1768 |
my @result = ();
|
|
1769 |
|
|
1770 |
for my $node (@$inlist)
|
|
1771 |
{
|
|
1772 |
|
|
1773 |
my $list = $self->{Left}->solve ($context, [$node]);
|
|
1774 |
$self->verbose("Left", $list);
|
|
1775 |
|
|
1776 |
my $n = int (@$list);
|
|
1777 |
next if ($n == 0);
|
|
1778 |
|
|
1779 |
# build ordered index list
|
|
1780 |
my @indexFlags = ();
|
|
1781 |
$#indexFlags = $n - 1;
|
|
1782 |
|
|
1783 |
my $index = $self->{IndexList};
|
|
1784 |
my $len = @$index;
|
|
1785 |
|
|
1786 |
#?? this is done a lot - optimize....
|
|
1787 |
my $i = 0;
|
|
1788 |
while ($i < $len)
|
|
1789 |
{
|
|
1790 |
my $start = $index->[$i++];
|
|
1791 |
$start += $n if ($start < 0);
|
|
1792 |
my $end = $index->[$i++];
|
|
1793 |
$end += $n if ($end < 0);
|
|
1794 |
|
|
1795 |
next unless $start <= $end && $end >=0 && $start < $n;
|
|
1796 |
$start = 0 if ($start < 0);
|
|
1797 |
$end = $n-1 if ($end >= $n);
|
|
1798 |
|
|
1799 |
for my $j ($start .. $end)
|
|
1800 |
{
|
|
1801 |
$indexFlags[$j] = 1;
|
|
1802 |
}
|
|
1803 |
}
|
|
1804 |
for $i (0 .. $n-1)
|
|
1805 |
{
|
|
1806 |
push @result, $list->[$i] if $indexFlags[$i];
|
|
1807 |
}
|
|
1808 |
}
|
|
1809 |
\@result;
|
|
1810 |
}
|
|
1811 |
|
|
1812 |
sub xql_contextString
|
|
1813 |
{
|
|
1814 |
my $self = shift;
|
|
1815 |
|
|
1816 |
my $index = $self->{IndexList};
|
|
1817 |
my $str = XML::XQL::bold("[");
|
|
1818 |
for (my $i = 0; $i < @$index; $i++)
|
|
1819 |
{
|
|
1820 |
$str .= ", " if $i > 0;
|
|
1821 |
|
|
1822 |
my $s = $index->[$i++];
|
|
1823 |
my $e = $index->[$i];
|
|
1824 |
$str = ($s == $e) ? $s : "$s \$to\$ $e";
|
|
1825 |
}
|
|
1826 |
$str .= XML::XQL::bold("]");
|
|
1827 |
|
|
1828 |
XML::XQL::delim ($self->{Left}->xql_contextString (@_) . $str, $self, @_);
|
|
1829 |
}
|
|
1830 |
|
|
1831 |
sub xql_toDOM
|
|
1832 |
{
|
|
1833 |
my ($self, $doc) = @_;
|
|
1834 |
my $elem = $self->SUPER::xql_toDOM ($doc);
|
|
1835 |
|
|
1836 |
my $index = $self->{IndexList};
|
|
1837 |
my $str = "";
|
|
1838 |
for (my $i = 0; $i < @$index; $i++)
|
|
1839 |
{
|
|
1840 |
$str .= ", " if $i > 0;
|
|
1841 |
|
|
1842 |
my $s = $index->[$i++];
|
|
1843 |
my $e = $index->[$i];
|
|
1844 |
$str .= ($s == $e) ? $s : "$s \$to\$ $e";
|
|
1845 |
}
|
|
1846 |
|
|
1847 |
my $ie = $doc->createElement ("index");
|
|
1848 |
$ie->setAttribute ("list", $str);
|
|
1849 |
$elem->appendChild ($ie);
|
|
1850 |
$elem;
|
|
1851 |
}
|
|
1852 |
|
|
1853 |
package XML::XQL::Union; # "book $union$ magazine", also "|"
|
|
1854 |
use base 'XML::XQL::Operator'; # L x L -> L
|
|
1855 |
|
|
1856 |
sub solve
|
|
1857 |
{
|
|
1858 |
my ($self, $context, $list) = @_;
|
|
1859 |
my $left = XML::XQL::toList ($self->{Left}->solve ($context, $list));
|
|
1860 |
my $right = XML::XQL::toList ($self->{Right}->solve ($context, $list));
|
|
1861 |
|
|
1862 |
return $right if (@$left < 1);
|
|
1863 |
return $left if (@$right < 1);
|
|
1864 |
|
|
1865 |
my @result = @$left;
|
|
1866 |
for my $node (@$right)
|
|
1867 |
{
|
|
1868 |
push @result, $node unless XML::XQL::listContains ($left, $node);
|
|
1869 |
}
|
|
1870 |
|
|
1871 |
my $parent = $self->{Parent};
|
|
1872 |
|
|
1873 |
# Don't sort if parent is a Union or //, because the parent will do the sort
|
|
1874 |
unless (defined $parent and $parent->mustSort)
|
|
1875 |
{
|
|
1876 |
XML::XQL::sortDocOrder (\@result)
|
|
1877 |
}
|
|
1878 |
# $self->verbose ("Union result", \@result);
|
|
1879 |
|
|
1880 |
\@result;
|
|
1881 |
}
|
|
1882 |
|
|
1883 |
sub mustSort
|
|
1884 |
{
|
|
1885 |
1;
|
|
1886 |
}
|
|
1887 |
|
|
1888 |
sub xql_contextString
|
|
1889 |
{
|
|
1890 |
my $self = shift;
|
|
1891 |
XML::XQL::delim ($self->{Left}->xql_contextString (@_) .
|
|
1892 |
XML::XQL::bold (" \$union\$ ") .
|
|
1893 |
$self->{Right}->xql_contextString (@_), $self, @_);
|
|
1894 |
}
|
|
1895 |
|
|
1896 |
package XML::XQL::Intersect; # "book $intersect$ magazine"
|
|
1897 |
use base 'XML::XQL::Operator'; # L x L -> L
|
|
1898 |
|
|
1899 |
sub solve
|
|
1900 |
{
|
|
1901 |
my ($self, $context, $list) = @_;
|
|
1902 |
my $left = XML::XQL::toList ($self->{Left}->solve ($context, $list));
|
|
1903 |
return [] if @$left < 1;
|
|
1904 |
|
|
1905 |
my $right = XML::XQL::toList ($self->{Right}->solve ($context, $list));
|
|
1906 |
return [] if @$right < 1;
|
|
1907 |
|
|
1908 |
# Assumption: $left and $right don't have duplicates themselves
|
|
1909 |
my @result = ();
|
|
1910 |
for my $node (@$left)
|
|
1911 |
{
|
|
1912 |
#? reimplement with hash - faster!
|
|
1913 |
push @result, $node if XML::XQL::listContains ($right, $node);
|
|
1914 |
}
|
|
1915 |
\@result;
|
|
1916 |
}
|
|
1917 |
|
|
1918 |
sub xql_contextString
|
|
1919 |
{
|
|
1920 |
my $self = shift;
|
|
1921 |
XML::XQL::delim ($self->{Left}->xql_contextString (@_) .
|
|
1922 |
XML::XQL::bold (" \$intersect\$ ") .
|
|
1923 |
$self->{Right}->xql_contextString (@_), $self, @_);
|
|
1924 |
}
|
|
1925 |
|
|
1926 |
package XML::XQL::Filter; # "elem[expr]"
|
|
1927 |
use base 'XML::XQL::Operator'; # L -> L
|
|
1928 |
|
|
1929 |
sub solve
|
|
1930 |
{
|
|
1931 |
my ($self, $context, $inlist) = @_;
|
|
1932 |
my @result = ();
|
|
1933 |
|
|
1934 |
for my $node (@$inlist)
|
|
1935 |
{
|
|
1936 |
|
|
1937 |
my $list = $self->{Left}->solve ($context, [$node]);
|
|
1938 |
next if @$list == 0;
|
|
1939 |
|
|
1940 |
my $subQuery = $self->{Right};
|
|
1941 |
|
|
1942 |
$context = [0, scalar (@$list)];
|
|
1943 |
for my $node (@$list)
|
|
1944 |
{
|
|
1945 |
#?? optimize? only need the first one to succeed
|
|
1946 |
my $r = $subQuery->solve ($context, [ $node ]);
|
|
1947 |
push @result, $node if XML::XQL::toBoolean ($r);
|
|
1948 |
$context->[0]++; # increase the index for the index() method
|
|
1949 |
}
|
|
1950 |
}
|
|
1951 |
\@result;
|
|
1952 |
}
|
|
1953 |
|
|
1954 |
sub xql_check
|
|
1955 |
{
|
|
1956 |
my ($self, $inSubQuery, $inParam) = @_;
|
|
1957 |
$self->{Left}->xql_check ($inSubQuery, $inParam);
|
|
1958 |
$self->{Right}->xql_check (1, $inParam);
|
|
1959 |
}
|
|
1960 |
|
|
1961 |
sub xql_contextString
|
|
1962 |
{
|
|
1963 |
my $self = shift;
|
|
1964 |
XML::XQL::delim ($self->{Left}->xql_contextString (@_) .
|
|
1965 |
XML::XQL::bold ("[") .
|
|
1966 |
$self->{Right}->xql_contextString (@_) .
|
|
1967 |
XML::XQL::bold ("]"), $self, @_);
|
|
1968 |
}
|
|
1969 |
|
|
1970 |
package XML::XQL::BooleanOp;
|
|
1971 |
use base 'XML::XQL::Operator';
|
|
1972 |
|
|
1973 |
package XML::XQL::Or;
|
|
1974 |
use base 'XML::XQL::BooleanOp';
|
|
1975 |
|
|
1976 |
sub solve
|
|
1977 |
{
|
|
1978 |
my ($self, $context, $list) = @_;
|
|
1979 |
my $left = $self->{Left}->solve ($context, $list);
|
|
1980 |
return $XML::XQL::Boolean::TRUE if XML::XQL::toBoolean ($left);
|
|
1981 |
return $self->{Right}->solve ($context, $list);
|
|
1982 |
}
|
|
1983 |
|
|
1984 |
sub xql_contextString
|
|
1985 |
{
|
|
1986 |
my $self = shift;
|
|
1987 |
XML::XQL::delim ($self->{Left}->xql_contextString (@_) .
|
|
1988 |
XML::XQL::bold (" \$or\$ ") .
|
|
1989 |
$self->{Right}->xql_contextString (@_), $self, @_);
|
|
1990 |
}
|
|
1991 |
|
|
1992 |
package XML::XQL::And;
|
|
1993 |
use base 'XML::XQL::BooleanOp';
|
|
1994 |
|
|
1995 |
sub solve
|
|
1996 |
{
|
|
1997 |
my ($self, $context, $list) = @_;
|
|
1998 |
my $left = $self->{Left}->solve ($context, $list);
|
|
1999 |
return $XML::XQL::Boolean::FALSE unless XML::XQL::toBoolean ($left);
|
|
2000 |
return $self->{Right}->solve ($context, $list);
|
|
2001 |
}
|
|
2002 |
|
|
2003 |
sub xql_contextString
|
|
2004 |
{
|
|
2005 |
my $self = shift;
|
|
2006 |
XML::XQL::delim ($self->{Left}->xql_contextString (@_) .
|
|
2007 |
XML::XQL::bold (" \$and\$ ") .
|
|
2008 |
$self->{Right}->xql_contextString (@_), $self, @_);
|
|
2009 |
}
|
|
2010 |
|
|
2011 |
package XML::XQL::Not;
|
|
2012 |
use base 'XML::XQL::BooleanOp';
|
|
2013 |
|
|
2014 |
sub solve
|
|
2015 |
{
|
|
2016 |
my ($self, $context, $list) = @_;
|
|
2017 |
my $left = $self->{Left}->solve ($context, $list);
|
|
2018 |
return XML::XQL::toBoolean ($left) ? $XML::XQL::Boolean::FALSE : $XML::XQL::Boolean::TRUE;
|
|
2019 |
}
|
|
2020 |
|
|
2021 |
sub xql_contextString
|
|
2022 |
{
|
|
2023 |
my $self = shift;
|
|
2024 |
XML::XQL::delim (XML::XQL::bold ("\$not\$ ") .
|
|
2025 |
$self->{Left}->xql_contextString (@_), $self, @_);
|
|
2026 |
}
|
|
2027 |
|
|
2028 |
package XML::XQL::Compare;
|
|
2029 |
use base 'XML::XQL::Operator';
|
|
2030 |
use fields qw{ Func All };
|
|
2031 |
|
|
2032 |
use Carp;
|
|
2033 |
|
|
2034 |
sub solve
|
|
2035 |
{
|
|
2036 |
my ($self, $context, $list) = @_;
|
|
2037 |
|
|
2038 |
my $type;
|
|
2039 |
my $cmpFunc = $self->{Func};
|
|
2040 |
|
|
2041 |
my $left = $self->verbose ("left", XML::XQL::toList ($self->{Left}->solve ($context, $list)));
|
|
2042 |
return [] if @$left < 1;
|
|
2043 |
|
|
2044 |
my $right;
|
|
2045 |
eval {
|
|
2046 |
$right = $self->verbose ("right", XML::XQL::prepareRvalue ($self->{Right}->solve ($context, $list)));
|
|
2047 |
};
|
|
2048 |
return [] if XML::XQL::exception ($@);
|
|
2049 |
|
|
2050 |
if ($self->{All})
|
|
2051 |
{
|
|
2052 |
for my $node (@$left)
|
|
2053 |
{
|
|
2054 |
eval {
|
|
2055 |
# Stop if any of the comparisons fails
|
|
2056 |
return [] unless &$cmpFunc ($node, $right);
|
|
2057 |
};
|
|
2058 |
return [] if XML::XQL::exception ($@);
|
|
2059 |
}
|
|
2060 |
return $left;
|
|
2061 |
}
|
|
2062 |
else # $any$
|
|
2063 |
{
|
|
2064 |
my @result = ();
|
|
2065 |
for my $node (@$left)
|
|
2066 |
{
|
|
2067 |
eval {
|
|
2068 |
push (@result, $node)
|
|
2069 |
if &$cmpFunc ($node, $right);
|
|
2070 |
};
|
|
2071 |
return [] if XML::XQL::exception ($@);
|
|
2072 |
}
|
|
2073 |
return \@result;
|
|
2074 |
}
|
|
2075 |
}
|
|
2076 |
|
|
2077 |
sub xql_contextString
|
|
2078 |
{
|
|
2079 |
my $self = shift;
|
|
2080 |
my $all = $self->{All} ? "\$all\$ " : "";
|
|
2081 |
|
|
2082 |
XML::XQL::delim ($all . $self->{Left}->xql_contextString (@_) . " " .
|
|
2083 |
XML::XQL::bold ($self->{Oper}) . " " .
|
|
2084 |
$self->{Right}->xql_contextString (@_), $self, @_);
|
|
2085 |
}
|
|
2086 |
|
|
2087 |
package XML::XQL::Func;
|
|
2088 |
|
|
2089 |
use Carp;
|
|
2090 |
|
|
2091 |
sub count
|
|
2092 |
{
|
|
2093 |
my ($context, $list, $expr) = @_;
|
|
2094 |
|
|
2095 |
my $cnt;
|
|
2096 |
if (defined $expr)
|
|
2097 |
{
|
|
2098 |
$list = XML::XQL::toList ($expr->solve ($context, $list));
|
|
2099 |
$cnt = @$list;
|
|
2100 |
}
|
|
2101 |
else
|
|
2102 |
{
|
|
2103 |
$cnt = $context->[1];
|
|
2104 |
}
|
|
2105 |
#?? ref node?
|
|
2106 |
new XML::XQL::Number ($cnt);
|
|
2107 |
}
|
|
2108 |
|
|
2109 |
sub id
|
|
2110 |
{
|
|
2111 |
my ($context, $list, $query) = @_;
|
|
2112 |
|
|
2113 |
return [] if @$list == 0;
|
|
2114 |
|
|
2115 |
my $id = XML::XQL::prepareRvalue ($query->solve ($context, $list));
|
|
2116 |
#?? check result?
|
|
2117 |
|
|
2118 |
#?? if [0] is not a Node, I should probably try the next one
|
|
2119 |
my $doc = $list->[0]->xql_document;
|
|
2120 |
|
|
2121 |
_findId ($doc->xql_element->[0], $id);
|
|
2122 |
}
|
|
2123 |
|
|
2124 |
sub _findId # static method
|
|
2125 |
{
|
|
2126 |
my ($elem, $id) = @_;
|
|
2127 |
my $attr = $elem->xql_attribute ("id");
|
|
2128 |
return [$elem] if (@$attr == 1 && $attr->[0]->xql_nodeName eq $id);
|
|
2129 |
|
|
2130 |
for my $kid (@{$elem->xql_element})
|
|
2131 |
{
|
|
2132 |
$attr = _findId ($kid);
|
|
2133 |
return $attr if @$attr;
|
|
2134 |
}
|
|
2135 |
return [];
|
|
2136 |
}
|
|
2137 |
|
|
2138 |
sub end
|
|
2139 |
{
|
|
2140 |
my ($context, $list) = @_;
|
|
2141 |
|
|
2142 |
return [] if @$list == 0;
|
|
2143 |
new XML::XQL::Boolean ($context->[0] == $context->[1] - 1);
|
|
2144 |
}
|
|
2145 |
|
|
2146 |
sub xql_index
|
|
2147 |
{
|
|
2148 |
my ($context, $list) = @_;
|
|
2149 |
|
|
2150 |
# print "index: " . XML::XQL::d($context) . "\n";
|
|
2151 |
#?? wrong!
|
|
2152 |
return [] if @$list == 0;
|
|
2153 |
new XML::XQL::Number ($context->[0]);
|
|
2154 |
}
|
|
2155 |
|
|
2156 |
sub ancestor
|
|
2157 |
{
|
|
2158 |
my ($context, $list, $query) = @_;
|
|
2159 |
|
|
2160 |
return [] if @$list == 0;
|
|
2161 |
|
|
2162 |
my @anc = ();
|
|
2163 |
#?? fix for @$list > 1
|
|
2164 |
my $parent = $list->[0]->xql_parent;
|
|
2165 |
|
|
2166 |
while (defined $parent)
|
|
2167 |
{
|
|
2168 |
# keep list of ancestors so far
|
|
2169 |
unshift @anc, $parent;
|
|
2170 |
|
|
2171 |
# solve the query for the ancestor
|
|
2172 |
my $result = $query->solve ($context, [$parent]);
|
|
2173 |
for my $node (@{$result})
|
|
2174 |
{
|
|
2175 |
for my $anc (@anc)
|
|
2176 |
{
|
|
2177 |
return [$node] if $node == $anc;
|
|
2178 |
}
|
|
2179 |
}
|
|
2180 |
$parent = $parent->xql_parent;
|
|
2181 |
}
|
|
2182 |
return [];
|
|
2183 |
}
|
|
2184 |
|
|
2185 |
sub node
|
|
2186 |
{
|
|
2187 |
my ($context, $list) = @_;
|
|
2188 |
|
|
2189 |
return [] if @$list == 0;
|
|
2190 |
return $list->[0]->xql_node if @$list == 1;
|
|
2191 |
|
|
2192 |
my @result;
|
|
2193 |
for my $node (@$list)
|
|
2194 |
{
|
|
2195 |
push @result, @{ $node->xql_node };
|
|
2196 |
}
|
|
2197 |
XML::XQL::sortDocOrder (\@result);
|
|
2198 |
}
|
|
2199 |
|
|
2200 |
sub _nodesByType
|
|
2201 |
{
|
|
2202 |
my ($list, $type) = @_;
|
|
2203 |
|
|
2204 |
return [] if @$list == 0;
|
|
2205 |
|
|
2206 |
my @result;
|
|
2207 |
for my $node (@$list)
|
|
2208 |
{
|
|
2209 |
for my $kid (@{ $node->xql_node })
|
|
2210 |
{
|
|
2211 |
push @result, $kid if $kid->xql_nodeType == $type;
|
|
2212 |
}
|
|
2213 |
}
|
|
2214 |
@$list > 1 ? XML::XQL::sortDocOrder (\@result) : \@result;
|
|
2215 |
}
|
|
2216 |
|
|
2217 |
sub pi
|
|
2218 |
{
|
|
2219 |
my ($context, $list, $pi_name) = @_;
|
|
2220 |
if (defined $pi_name)
|
|
2221 |
{
|
|
2222 |
return [] if @$list == 0;
|
|
2223 |
|
|
2224 |
$pi_name = $pi_name->solve ($context, $list)->xql_toString;
|
|
2225 |
|
|
2226 |
my @result;
|
|
2227 |
for my $node (@$list)
|
|
2228 |
{
|
|
2229 |
for my $kid (@{ $node->xql_node })
|
|
2230 |
{
|
|
2231 |
push @result, $kid
|
|
2232 |
if $kid->xql_nodeType == 7 && $kid->getTarget eq $pi_name;
|
|
2233 |
}
|
|
2234 |
}
|
|
2235 |
return @$list > 1 ? XML::XQL::sortDocOrder (\@result) : \@result;
|
|
2236 |
}
|
|
2237 |
|
|
2238 |
return _nodesByType ($_[1], 7);
|
|
2239 |
}
|
|
2240 |
|
|
2241 |
sub comment
|
|
2242 |
{
|
|
2243 |
_nodesByType ($_[1], 8);
|
|
2244 |
}
|
|
2245 |
|
|
2246 |
sub textNode
|
|
2247 |
{
|
|
2248 |
_nodesByType ($_[1], 3);
|
|
2249 |
}
|
|
2250 |
|
|
2251 |
sub nodeName
|
|
2252 |
{
|
|
2253 |
my ($context, $list) = @_;
|
|
2254 |
|
|
2255 |
return [] if @$list == 0;
|
|
2256 |
|
|
2257 |
my @result;
|
|
2258 |
for my $node (@$list)
|
|
2259 |
{
|
|
2260 |
push @result, new XML::XQL::Text ($node->xql_nodeName, $node);
|
|
2261 |
}
|
|
2262 |
\@result;
|
|
2263 |
}
|
|
2264 |
|
|
2265 |
sub namespace
|
|
2266 |
{
|
|
2267 |
my ($context, $list) = @_;
|
|
2268 |
|
|
2269 |
return [] if @$list == 0;
|
|
2270 |
|
|
2271 |
my @result;
|
|
2272 |
for my $node (@$list)
|
|
2273 |
{
|
|
2274 |
my $namespace = $node->xql_namespace;
|
|
2275 |
next unless defined $namespace;
|
|
2276 |
push @result, new XML::XQL::Text ($namespace, $node);
|
|
2277 |
}
|
|
2278 |
\@result;
|
|
2279 |
}
|
|
2280 |
|
|
2281 |
sub prefix
|
|
2282 |
{
|
|
2283 |
my ($context, $list) = @_;
|
|
2284 |
|
|
2285 |
return [] if @$list == 0;
|
|
2286 |
|
|
2287 |
my @result;
|
|
2288 |
for my $node (@$list)
|
|
2289 |
{
|
|
2290 |
my $prefix = $node->xql_prefix;
|
|
2291 |
next unless defined $prefix;
|
|
2292 |
push @result, new XML::XQL::Text ($prefix, $node);
|
|
2293 |
}
|
|
2294 |
\@result;
|
|
2295 |
}
|
|
2296 |
|
|
2297 |
sub baseName
|
|
2298 |
{
|
|
2299 |
my ($context, $list) = @_;
|
|
2300 |
|
|
2301 |
return [] if @$list == 0;
|
|
2302 |
|
|
2303 |
my @result;
|
|
2304 |
for my $node (@$list)
|
|
2305 |
{
|
|
2306 |
my $basename = $node->xql_baseName;
|
|
2307 |
next unless defined $basename;
|
|
2308 |
push @result, new XML::XQL::Text ($basename, $node);
|
|
2309 |
}
|
|
2310 |
\@result;
|
|
2311 |
}
|
|
2312 |
|
|
2313 |
sub nodeType
|
|
2314 |
{
|
|
2315 |
my ($context, $list) = @_;
|
|
2316 |
|
|
2317 |
return [] if @$list == 0;
|
|
2318 |
|
|
2319 |
my @result;
|
|
2320 |
for my $node (@$list)
|
|
2321 |
{
|
|
2322 |
push @result, new XML::XQL::Number ($node->xql_nodeType, $node);
|
|
2323 |
}
|
|
2324 |
\@result;
|
|
2325 |
}
|
|
2326 |
|
|
2327 |
sub nodeTypeString
|
|
2328 |
{
|
|
2329 |
my ($context, $list) = @_;
|
|
2330 |
|
|
2331 |
return [] if @$list == 0;
|
|
2332 |
|
|
2333 |
my @result;
|
|
2334 |
for my $node (@$list)
|
|
2335 |
{
|
|
2336 |
push @result, new XML::XQL::Text ($node->xql_nodeTypeString, $node);
|
|
2337 |
}
|
|
2338 |
@result;
|
|
2339 |
}
|
|
2340 |
|
|
2341 |
sub value
|
|
2342 |
{
|
|
2343 |
my ($context, $list) = @_;
|
|
2344 |
|
|
2345 |
return [] if @$list == 0;
|
|
2346 |
|
|
2347 |
my @result;
|
|
2348 |
for my $node (@$list)
|
|
2349 |
{
|
|
2350 |
push @result, $node->xql_value; # value always returns an object
|
|
2351 |
}
|
|
2352 |
\@result;
|
|
2353 |
}
|
|
2354 |
|
|
2355 |
sub text
|
|
2356 |
{
|
|
2357 |
my ($context, $list, $recurse) = @_;
|
|
2358 |
|
|
2359 |
return [] if @$list == 0;
|
|
2360 |
|
|
2361 |
if (defined $recurse)
|
|
2362 |
{
|
|
2363 |
$recurse = $recurse->solve ($context, $list)->xql_toString;
|
|
2364 |
}
|
|
2365 |
else
|
|
2366 |
{
|
|
2367 |
$recurse = 1; # default
|
|
2368 |
}
|
|
2369 |
|
|
2370 |
my @result;
|
|
2371 |
for my $node (@$list)
|
|
2372 |
{
|
|
2373 |
my $text = $node->xql_text ($recurse);
|
|
2374 |
next unless defined $text;
|
|
2375 |
|
|
2376 |
push @result, new XML::XQL::Text ($text, $node);
|
|
2377 |
}
|
|
2378 |
\@result;
|
|
2379 |
}
|
|
2380 |
|
|
2381 |
sub rawText
|
|
2382 |
{
|
|
2383 |
my ($context, $list, $recurse) = @_;
|
|
2384 |
|
|
2385 |
return [] if @$list == 0;
|
|
2386 |
|
|
2387 |
if (defined $recurse)
|
|
2388 |
{
|
|
2389 |
$recurse = $recurse->solve ($context, $list)->xql_toString;
|
|
2390 |
}
|
|
2391 |
else
|
|
2392 |
{
|
|
2393 |
$recurse = 1; # default
|
|
2394 |
}
|
|
2395 |
|
|
2396 |
my @result;
|
|
2397 |
for my $node (@$list)
|
|
2398 |
{
|
|
2399 |
my $text = $node->xql_rawText ($recurse);
|
|
2400 |
next unless defined $text;
|
|
2401 |
|
|
2402 |
push @result, new XML::XQL::Text ($text, $node);
|
|
2403 |
}
|
|
2404 |
\@result;
|
|
2405 |
}
|
|
2406 |
|
|
2407 |
sub true
|
|
2408 |
{
|
|
2409 |
return $XML::XQL::Boolean::TRUE;
|
|
2410 |
}
|
|
2411 |
|
|
2412 |
sub false
|
|
2413 |
{
|
|
2414 |
return $XML::XQL::Boolean::FALSE;
|
|
2415 |
}
|
|
2416 |
|
|
2417 |
#sub date() is in XQL::XML::Date
|
|
2418 |
|
|
2419 |
sub element
|
|
2420 |
{
|
|
2421 |
my ($context, $list, $text) = @_;
|
|
2422 |
|
|
2423 |
return [] if @$list == 0;
|
|
2424 |
|
|
2425 |
my @result;
|
|
2426 |
if (defined $text)
|
|
2427 |
{
|
|
2428 |
$text = XML::XQL::prepareRvalue ($text->solve ($context, $list))->xql_toString;
|
|
2429 |
for my $node (@$list)
|
|
2430 |
{
|
|
2431 |
push @result, @{$node->xql_element ($text)};
|
|
2432 |
}
|
|
2433 |
}
|
|
2434 |
else
|
|
2435 |
{
|
|
2436 |
for my $node (@$list)
|
|
2437 |
{
|
|
2438 |
push @result, @{$node->xql_element};
|
|
2439 |
}
|
|
2440 |
}
|
|
2441 |
@$list > 1 ? XML::XQL::sortDocOrder (\@result) : \@result;
|
|
2442 |
}
|
|
2443 |
|
|
2444 |
sub attribute
|
|
2445 |
{
|
|
2446 |
my ($context, $list, $text) = @_;
|
|
2447 |
|
|
2448 |
return [] if @$list == 0;
|
|
2449 |
|
|
2450 |
my @result;
|
|
2451 |
if (defined $text)
|
|
2452 |
{
|
|
2453 |
$text = XML::XQL::prepareRvalue ($text->solve ($context, $list))->xql_toString;
|
|
2454 |
for my $node (@$list)
|
|
2455 |
{
|
|
2456 |
push @result, @{ $node->xql_attribute ($text) };
|
|
2457 |
}
|
|
2458 |
}
|
|
2459 |
else
|
|
2460 |
{
|
|
2461 |
for my $node (@$list)
|
|
2462 |
{
|
|
2463 |
push @result, @{ $node->xql_attribute };
|
|
2464 |
}
|
|
2465 |
}
|
|
2466 |
\@result;
|
|
2467 |
}
|
|
2468 |
|
|
2469 |
package XML::XQL::Bang;
|
|
2470 |
use base 'XML::XQL::Operator';
|
|
2471 |
|
|
2472 |
sub solve
|
|
2473 |
{
|
|
2474 |
my ($self, $context, $list) = @_;
|
|
2475 |
$list = $self->{Left}->solve ($context, $list);
|
|
2476 |
$self->{Right}->solve ($context, $list);
|
|
2477 |
}
|
|
2478 |
|
|
2479 |
sub xql_contextString
|
|
2480 |
{
|
|
2481 |
my $self = shift;
|
|
2482 |
XML::XQL::delim ($self->{Left}->xql_contextString (@_) .
|
|
2483 |
XML::XQL::bold ("!") .
|
|
2484 |
$self->{Right}->xql_contextString (@_), $self, @_);
|
|
2485 |
}
|
|
2486 |
|
|
2487 |
package XML::XQL::Invocation;
|
|
2488 |
use base 'XML::XQL::Operator';
|
|
2489 |
use fields qw{ Args Name Type Once ConstVal };
|
|
2490 |
|
|
2491 |
use Carp;
|
|
2492 |
|
|
2493 |
sub new
|
|
2494 |
{
|
|
2495 |
my ($class, %args) = @_;
|
|
2496 |
|
|
2497 |
my $self = bless \%args, $class;
|
|
2498 |
for my $par (@{$self->{Args}})
|
|
2499 |
{
|
|
2500 |
$par->setParent ($self);
|
|
2501 |
}
|
|
2502 |
$self;
|
|
2503 |
}
|
|
2504 |
|
|
2505 |
sub dispose
|
|
2506 |
{
|
|
2507 |
my $self = shift;
|
|
2508 |
for (@{ $self->{Args} })
|
|
2509 |
{
|
|
2510 |
$_->dispose;
|
|
2511 |
}
|
|
2512 |
undef $self->{Args};
|
|
2513 |
|
|
2514 |
undef $self->{Parent};
|
|
2515 |
}
|
|
2516 |
|
|
2517 |
sub isConstant
|
|
2518 |
{
|
|
2519 |
my ($self) = @_;
|
|
2520 |
|
|
2521 |
# An Invocation is constant, if all it's arguments are constant
|
|
2522 |
# and it's a "constant" function
|
|
2523 |
my $name = $self->{Name};
|
|
2524 |
my $cf = $self->query->{ConstFunc};
|
|
2525 |
my $const = exists ($cf->{$name}) ?
|
|
2526 |
$cf->{name} : $XML::XQL::ConstFunc{$name};
|
|
2527 |
return 0 unless $const;
|
|
2528 |
|
|
2529 |
for my $par (@{$self->{Args}})
|
|
2530 |
{
|
|
2531 |
return 0 unless $par->isConstant;
|
|
2532 |
}
|
|
2533 |
1;
|
|
2534 |
}
|
|
2535 |
|
|
2536 |
sub xql_check
|
|
2537 |
{
|
|
2538 |
my ($self, $inSubQuery, $inParam) = @_;
|
|
2539 |
|
|
2540 |
# Syntactic Constraint 7:
|
|
2541 |
# In a node query this function or method is only valid inside an instance
|
|
2542 |
# of Subquery, unless it appears within an instance of Param.
|
|
2543 |
# Functions and methods are valid anywhere in a full query.
|
|
2544 |
|
|
2545 |
my $query;
|
|
2546 |
if (not ($inSubQuery or $inParam) and ($query = $self->query)->isNodeQuery)
|
|
2547 |
{
|
|
2548 |
unless ($query->isAllowedOutsideSubquery ($self->{Name}))
|
|
2549 |
{
|
|
2550 |
XML::XQL::parseError $self->{Type} . " " . $self->{Name} .
|
|
2551 |
" is only allowed inside a Subquery or Param for 'Node Queries'." .
|
|
2552 |
" Context: " . $self->toContextString;
|
|
2553 |
}
|
|
2554 |
}
|
|
2555 |
for my $par (@{$self->{Args}})
|
|
2556 |
{
|
|
2557 |
$par->xql_check ($inSubQuery, 1); # these are Params
|
|
2558 |
}
|
|
2559 |
# once() should only be evaluated once per query
|
|
2560 |
# "constant" functions should only be evaluated once *ever*
|
|
2561 |
$self->{Once} = $self->isOnce || $self->isConstant;
|
|
2562 |
}
|
|
2563 |
|
|
2564 |
sub xql_prepCache
|
|
2565 |
{
|
|
2566 |
my ($self) = @_;
|
|
2567 |
# once() should only be evaluated once per query
|
|
2568 |
# "constant" functions should only be evaluated once *ever*
|
|
2569 |
delete $self->{ConstVal} if $self->isOnce;
|
|
2570 |
|
|
2571 |
for my $par (@{$self->{Args}})
|
|
2572 |
{
|
|
2573 |
$par->xql_prepCache;
|
|
2574 |
}
|
|
2575 |
}
|
|
2576 |
|
|
2577 |
sub isOnce
|
|
2578 |
{
|
|
2579 |
$_[0]->{Name} eq "once";
|
|
2580 |
}
|
|
2581 |
|
|
2582 |
sub isMethod
|
|
2583 |
{
|
|
2584 |
$_[0]->{Type} eq "method";
|
|
2585 |
}
|
|
2586 |
|
|
2587 |
sub solve
|
|
2588 |
{
|
|
2589 |
my ($self, $context, $list) = @_;
|
|
2590 |
|
|
2591 |
# Use the cached value if it's a "constant" function
|
|
2592 |
return $self->{ConstVal} if (exists $self->{ConstVal});
|
|
2593 |
|
|
2594 |
my $func = $self->{Func};
|
|
2595 |
|
|
2596 |
my $result;
|
|
2597 |
eval {
|
|
2598 |
$result = &$func ($context, $list, @{$self->{Args}});
|
|
2599 |
$self->{ConstVal} = $result if $self->{Once};
|
|
2600 |
};
|
|
2601 |
if ($@)
|
|
2602 |
{
|
|
2603 |
#?? or croak
|
|
2604 |
$self->warning ("invocation of '" . $self->{Name} . "' failed:\n\t$@");
|
|
2605 |
$self->{ConstVal} = [] if $self->{Once};
|
|
2606 |
return [];
|
|
2607 |
}
|
|
2608 |
$result;
|
|
2609 |
}
|
|
2610 |
|
|
2611 |
sub xql_contextString
|
|
2612 |
{
|
|
2613 |
my $self = shift;
|
|
2614 |
|
|
2615 |
my $str = XML::XQL::bold ($self->{Name}) . "(";
|
|
2616 |
for (my $i = 0; $i < @{$self->{Args}}; $i++)
|
|
2617 |
{
|
|
2618 |
$str .= ", " if $i > 0;
|
|
2619 |
$str .= $self->{Args}->[$i]->xql_contextString (@_);
|
|
2620 |
}
|
|
2621 |
$str .= ")";
|
|
2622 |
|
|
2623 |
XML::XQL::delim ($str, $self, @_);
|
|
2624 |
}
|
|
2625 |
|
|
2626 |
# Base class shared by Node and PrimitiveType
|
|
2627 |
package XML::XQL::PrimitiveTypeBase;
|
|
2628 |
|
|
2629 |
sub dispose
|
|
2630 |
{
|
|
2631 |
}
|
|
2632 |
|
|
2633 |
sub xql_check
|
|
2634 |
{
|
|
2635 |
}
|
|
2636 |
|
|
2637 |
sub xql_prepCache
|
|
2638 |
{
|
|
2639 |
}
|
|
2640 |
|
|
2641 |
sub xql_prevSibling
|
|
2642 |
{
|
|
2643 |
undef;
|
|
2644 |
}
|
|
2645 |
|
|
2646 |
# This method returns an integer that determines how values should be casted
|
|
2647 |
# for comparisons. If the left value (LHS) has a higher xql_primType, the
|
|
2648 |
# right value (RHS) is cast to the type of the LHS (otherwise, the LHS is casted
|
|
2649 |
# to the type of the LHS)
|
|
2650 |
#
|
|
2651 |
# Values for certain types:
|
|
2652 |
# Node 0 (always cast a node to a Text string first)
|
|
2653 |
# Text 1
|
|
2654 |
# Number 2
|
|
2655 |
# Boolean 3
|
|
2656 |
# Date 4 (other classes automatically use 4 by default)
|
|
2657 |
|
|
2658 |
sub xql_primType
|
|
2659 |
{
|
|
2660 |
4; # default for all classes other then Node, Text, Number, Boolean
|
|
2661 |
}
|
|
2662 |
|
|
2663 |
sub xql_toBoolean
|
|
2664 |
{
|
|
2665 |
1; # it is true if it exists
|
|
2666 |
}
|
|
2667 |
|
|
2668 |
sub xql_namespace
|
|
2669 |
{
|
|
2670 |
undef;
|
|
2671 |
}
|
|
2672 |
|
|
2673 |
sub xql_baseName
|
|
2674 |
{
|
|
2675 |
undef;
|
|
2676 |
}
|
|
2677 |
|
|
2678 |
sub xql_prefix
|
|
2679 |
{
|
|
2680 |
undef;
|
|
2681 |
}
|
|
2682 |
|
|
2683 |
sub xql_sortKey
|
|
2684 |
{
|
|
2685 |
my $src = $_[0]->xql_sourceNode;
|
|
2686 |
$src ? $src->xql_sortKey : $XML::XQL::LAST_SORT_KEY;
|
|
2687 |
}
|
|
2688 |
|
|
2689 |
sub xql_toDOM
|
|
2690 |
{
|
|
2691 |
my ($self, $doc) = @_;
|
|
2692 |
my $name = ref $self;
|
|
2693 |
$name =~ s/.*:://;
|
|
2694 |
my $elem = $doc->createElement ($name);
|
|
2695 |
$elem->setAttribute ("value", $self->xql_toString);
|
|
2696 |
$elem;
|
|
2697 |
}
|
|
2698 |
|
|
2699 |
package XML::XQL::PrimitiveType;
|
|
2700 |
use vars qw( @ISA );
|
|
2701 |
@ISA = qw( XML::XQL::PrimitiveTypeBase );
|
|
2702 |
|
|
2703 |
sub new
|
|
2704 |
{
|
|
2705 |
my ($class, $val, $srcNode) = @_;
|
|
2706 |
bless [$val, $srcNode], $class;
|
|
2707 |
}
|
|
2708 |
|
|
2709 |
sub isConstant
|
|
2710 |
{
|
|
2711 |
1;
|
|
2712 |
}
|
|
2713 |
|
|
2714 |
sub setParent
|
|
2715 |
{
|
|
2716 |
# not defined
|
|
2717 |
}
|
|
2718 |
|
|
2719 |
sub solve
|
|
2720 |
{
|
|
2721 |
$_[0]; # evaluates to itself
|
|
2722 |
}
|
|
2723 |
|
|
2724 |
#
|
|
2725 |
# Derived classes should not override this method.
|
|
2726 |
# Override xql_toString instead.
|
|
2727 |
#
|
|
2728 |
sub xql_contextString
|
|
2729 |
{
|
|
2730 |
my $self = shift;
|
|
2731 |
|
|
2732 |
XML::XQL::delim ($self->xql_toString, $self, @_);
|
|
2733 |
}
|
|
2734 |
|
|
2735 |
#
|
|
2736 |
# Return the value of the Object as a primitive Perl value, i.e. an integer,
|
|
2737 |
# a float, or a string.
|
|
2738 |
#
|
|
2739 |
sub xql_toString
|
|
2740 |
{
|
|
2741 |
$_[0]->[0];
|
|
2742 |
}
|
|
2743 |
|
|
2744 |
sub xql_sourceNode
|
|
2745 |
{
|
|
2746 |
$_[0]->[1];
|
|
2747 |
}
|
|
2748 |
|
|
2749 |
sub xql_setSourceNode
|
|
2750 |
{
|
|
2751 |
$_[0]->[1] = $_[1];
|
|
2752 |
}
|
|
2753 |
|
|
2754 |
sub xql_setValue
|
|
2755 |
{
|
|
2756 |
# This could potentially change the value of a constant in the XQL
|
|
2757 |
# query expression.
|
|
2758 |
$_[0]->[0] = $_[1];
|
|
2759 |
}
|
|
2760 |
|
|
2761 |
sub xql_nodeType
|
|
2762 |
{
|
|
2763 |
0; # it's not a Node
|
|
2764 |
}
|
|
2765 |
|
|
2766 |
sub xql_compare
|
|
2767 |
{
|
|
2768 |
# Temporarily switch off $WARNING flag, to disable messages a la:
|
|
2769 |
# Argument "1993-02-14" isn't numeric in ncmp
|
|
2770 |
local $^W = 0;
|
|
2771 |
$_[0]->[0] <=> $_[1]->xql_toString;
|
|
2772 |
}
|
|
2773 |
|
|
2774 |
sub xql_eq { my $self = shift; $self->xql_compare (@_) == 0; }
|
|
2775 |
sub xql_ne { my $self = shift; $self->xql_compare (@_) != 0; }
|
|
2776 |
sub xql_lt { my $self = shift; $self->xql_compare (@_) < 0; }
|
|
2777 |
sub xql_le { my $self = shift; $self->xql_compare (@_) <= 0; }
|
|
2778 |
sub xql_gt { my $self = shift; $self->xql_compare (@_) > 0; }
|
|
2779 |
sub xql_ge { my $self = shift; $self->xql_compare (@_) >= 0; }
|
|
2780 |
|
|
2781 |
package XML::XQL::Boolean;
|
|
2782 |
use vars qw( @ISA @EXPORT $TRUE $FALSE );
|
|
2783 |
|
|
2784 |
use Carp;
|
|
2785 |
|
|
2786 |
@ISA = qw( XML::XQL::PrimitiveType );
|
|
2787 |
@EXPORT = qw( $TRUE $FALSE );
|
|
2788 |
|
|
2789 |
$TRUE = new XML::XQL::Boolean (1);
|
|
2790 |
$FALSE = new XML::XQL::Boolean (0);
|
|
2791 |
|
|
2792 |
sub xql_primType
|
|
2793 |
{
|
|
2794 |
3;
|
|
2795 |
}
|
|
2796 |
|
|
2797 |
sub xql_toBoolean
|
|
2798 |
{
|
|
2799 |
$_[0]->[0]; # evaluate it to its value
|
|
2800 |
}
|
|
2801 |
|
|
2802 |
sub xql_negate
|
|
2803 |
{
|
|
2804 |
#?? do we need to keep track of a source node here?
|
|
2805 |
$_[0]->[0] ? $FALSE : $TRUE;
|
|
2806 |
}
|
|
2807 |
|
|
2808 |
sub xql_compare
|
|
2809 |
{
|
|
2810 |
#?? how do we convert string to boolean value
|
|
2811 |
$_[0]->[0] <=> ($_[1]->xql_toString ? 1 : 0);
|
|
2812 |
}
|
|
2813 |
|
|
2814 |
sub xql_lt { badComparisonError (@_); }
|
|
2815 |
sub xql_gt { badComparisonError (@_); }
|
|
2816 |
sub xql_le { badComparisonError (@_); }
|
|
2817 |
sub xql_ge { badComparisonError (@_); }
|
|
2818 |
|
|
2819 |
sub badComparisonError
|
|
2820 |
{
|
|
2821 |
croak 'comparison operator (other than =, !=, $ieq$, $ine$) not defined for type Boolean';
|
|
2822 |
}
|
|
2823 |
|
|
2824 |
package XML::XQL::Number;
|
|
2825 |
use vars qw( @ISA );
|
|
2826 |
@ISA = qw( XML::XQL::PrimitiveType );
|
|
2827 |
|
|
2828 |
#use overload
|
|
2829 |
# 'fallback' => 1, # use default operators, if not specified
|
|
2830 |
# '""' => \&debug;
|
|
2831 |
|
|
2832 |
sub debug
|
|
2833 |
{
|
|
2834 |
"Number[" . $_[0]->[0] . "]";
|
|
2835 |
}
|
|
2836 |
|
|
2837 |
sub xql_primType
|
|
2838 |
{
|
|
2839 |
2;
|
|
2840 |
}
|
|
2841 |
|
|
2842 |
package XML::XQL::Text;
|
|
2843 |
use vars qw( @ISA );
|
|
2844 |
@ISA = qw( XML::XQL::PrimitiveType );
|
|
2845 |
|
|
2846 |
#use overload
|
|
2847 |
# 'fallback' => 1, # use default operators, if not specified
|
|
2848 |
# '""' => \&debug;
|
|
2849 |
|
|
2850 |
sub debug
|
|
2851 |
{
|
|
2852 |
"Text[" . $_[0]->[0] . "]";
|
|
2853 |
}
|
|
2854 |
|
|
2855 |
sub xql_primType
|
|
2856 |
{
|
|
2857 |
1;
|
|
2858 |
}
|
|
2859 |
|
|
2860 |
sub xql_compare
|
|
2861 |
{
|
|
2862 |
my ($self, $other, $ignoreCase) = @_;
|
|
2863 |
if ($ignoreCase)
|
|
2864 |
{
|
|
2865 |
my $lhs = $self->[0];
|
|
2866 |
my $rhs = $other->xql_toString;
|
|
2867 |
"\U$lhs" cmp "\U$rhs";
|
|
2868 |
}
|
|
2869 |
else
|
|
2870 |
{
|
|
2871 |
$self->[0] cmp $other->xql_toString;
|
|
2872 |
}
|
|
2873 |
}
|
|
2874 |
|
|
2875 |
# Declare package XML::XQL::Node so that XML implementations can say
|
|
2876 |
# that their nodes derive from it:
|
|
2877 |
#
|
|
2878 |
# This worked for me when I added XQL support for XML::DOM:
|
|
2879 |
#
|
|
2880 |
# BEGIN
|
|
2881 |
# {
|
|
2882 |
# push @XML::DOM::Node::ISA, 'XML::XQL::Node';
|
|
2883 |
# }
|
|
2884 |
#
|
|
2885 |
|
|
2886 |
package XML::XQL::Node;
|
|
2887 |
|
|
2888 |
use vars qw( @ISA );
|
|
2889 |
@ISA = qw( XML::XQL::PrimitiveTypeBase );
|
|
2890 |
|
|
2891 |
use Carp;
|
|
2892 |
|
|
2893 |
sub xql_primType
|
|
2894 |
{
|
|
2895 |
0;
|
|
2896 |
}
|
|
2897 |
|
|
2898 |
sub xql_toBoolean
|
|
2899 |
{
|
|
2900 |
1; # it is true if it exists
|
|
2901 |
}
|
|
2902 |
|
|
2903 |
sub xql_attribute
|
|
2904 |
{
|
|
2905 |
[];
|
|
2906 |
}
|
|
2907 |
|
|
2908 |
sub xql_sourceNode
|
|
2909 |
{
|
|
2910 |
$_[0];
|
|
2911 |
}
|
|
2912 |
|
|
2913 |
# Default implementation - override this for speed
|
|
2914 |
sub xql_element
|
|
2915 |
{
|
|
2916 |
my ($node, $elem) = @_;
|
|
2917 |
|
|
2918 |
my @list = ();
|
|
2919 |
if (defined $elem)
|
|
2920 |
{
|
|
2921 |
for my $kid (@{$_[0]->xql_node})
|
|
2922 |
{
|
|
2923 |
# 1: element
|
|
2924 |
push @list, $kid
|
|
2925 |
if $kid->xql_nodeType == 1 && $kid->xql_nodeName eq $elem;
|
|
2926 |
}
|
|
2927 |
}
|
|
2928 |
else
|
|
2929 |
{
|
|
2930 |
for my $kid (@{$_[0]->xql_node})
|
|
2931 |
{
|
|
2932 |
push @list, $kid if $kid->xql_nodeType == 1; # 1: element
|
|
2933 |
}
|
|
2934 |
}
|
|
2935 |
\@list;
|
|
2936 |
}
|
|
2937 |
|
|
2938 |
sub xql_text
|
|
2939 |
{
|
|
2940 |
undef;
|
|
2941 |
}
|
|
2942 |
|
|
2943 |
sub xql_rawText
|
|
2944 |
{
|
|
2945 |
undef;
|
|
2946 |
}
|
|
2947 |
|
|
2948 |
sub xql_rawTextBlocks
|
|
2949 |
{
|
|
2950 |
undef;
|
|
2951 |
}
|
|
2952 |
|
|
2953 |
sub xql_value
|
|
2954 |
{
|
|
2955 |
new XML::XQL::Text ($_[0]->xql_text ($_[1]), $_[0]);
|
|
2956 |
}
|
|
2957 |
|
|
2958 |
# Convert xql_value to Perl string (or undef if xql_value is undefined)
|
|
2959 |
sub xql_toString
|
|
2960 |
{
|
|
2961 |
my $val = $_[0]->xql_value;
|
|
2962 |
return undef if XML::XQL::isEmptyList ($val);
|
|
2963 |
|
|
2964 |
$val->xql_toString;
|
|
2965 |
}
|
|
2966 |
|
|
2967 |
sub xql_setValue
|
|
2968 |
{
|
|
2969 |
# Not implemented for most node types
|
|
2970 |
}
|
|
2971 |
|
|
2972 |
sub xql_data
|
|
2973 |
{
|
|
2974 |
"";
|
|
2975 |
}
|
|
2976 |
|
|
2977 |
sub xql_nodeType
|
|
2978 |
{
|
|
2979 |
0;
|
|
2980 |
}
|
|
2981 |
|
|
2982 |
sub xql_nodeName
|
|
2983 |
{
|
|
2984 |
[];
|
|
2985 |
}
|
|
2986 |
|
|
2987 |
# Java code from "XML:: Namespaces in 20 lines" by James Clark:
|
|
2988 |
# see: http://www.oasis-open.org/cover/clarkNS-980804.html
|
|
2989 |
#
|
|
2990 |
# String expandName(String name, Element element, boolean isAttribute) {
|
|
2991 |
# // The index of the colon character in the name.
|
|
2992 |
# int colonIndex = name.indexOf(':');
|
|
2993 |
# // The name of the attribute that declares the namespace prefix.
|
|
2994 |
# String declAttName;
|
|
2995 |
# if (colonIndex == -1) {
|
|
2996 |
# // Default namespace applies only to element type names.
|
|
2997 |
# if (isAttribute)
|
|
2998 |
# return name;
|
|
2999 |
# declAttName = "xmlns";
|
|
3000 |
# }
|
|
3001 |
# else {
|
|
3002 |
# String prefix = name.substring(0, colonIndex);
|
|
3003 |
# // "xml:" is special
|
|
3004 |
# if (prefix.equals("xml"))
|
|
3005 |
# return name;
|
|
3006 |
# declAttName = "xmlns:" + prefix;
|
|
3007 |
# }
|
|
3008 |
# for (; element != null; element = element.getParent()) {
|
|
3009 |
# String ns = element.getAttributeValue(declAttName);
|
|
3010 |
# if (ns != null) {
|
|
3011 |
# // Handle special meaning of xmlns=""
|
|
3012 |
# if (ns.length() == 0 && colonIndex == -1)
|
|
3013 |
# return name;
|
|
3014 |
# return ns + '+' + name.substring(colonIndex + 1);
|
|
3015 |
# }
|
|
3016 |
# }
|
|
3017 |
# return null;
|
|
3018 |
# }
|
|
3019 |
|
|
3020 |
# From "Namespaces in XML"
|
|
3021 |
# at http://www.w3.org/TR/1998/WD-xml-names-19980916
|
|
3022 |
#
|
|
3023 |
# The prefix xml is by definition bound to the namespace name
|
|
3024 |
# urn:Connolly:input:required. The prefix xmlns is used only for
|
|
3025 |
# namespace bindings and is not itself bound to any namespace name.
|
|
3026 |
|
|
3027 |
my $DEFAULT_NAMESPACE = undef;
|
|
3028 |
my $XML_NAMESPACE = "urn:Connolly:input:required";
|
|
3029 |
#?? default namespace
|
|
3030 |
|
|
3031 |
sub xql_namespace
|
|
3032 |
{
|
|
3033 |
my ($self) = @_;
|
|
3034 |
my $nodeType = $self->xql_nodeType;
|
|
3035 |
my $element = $self;
|
|
3036 |
|
|
3037 |
if ($nodeType == 2) # 2: Attr
|
|
3038 |
{
|
|
3039 |
$element = $self->xql_parent;
|
|
3040 |
}
|
|
3041 |
elsif ($nodeType != 1) # 1: Element
|
|
3042 |
{
|
|
3043 |
return undef;
|
|
3044 |
}
|
|
3045 |
my $name = $self->xql_nodeName;
|
|
3046 |
my $declAttName;
|
|
3047 |
|
|
3048 |
if ($name =~ /([^:]+):([^:]+)/)
|
|
3049 |
{
|
|
3050 |
my ($prefix, $basename) = ($1, $2);
|
|
3051 |
|
|
3052 |
# "xml:" is special
|
|
3053 |
return $XML_NAMESPACE if $prefix eq "xml";
|
|
3054 |
|
|
3055 |
$declAttName = "xmlns:$prefix";
|
|
3056 |
}
|
|
3057 |
else
|
|
3058 |
{
|
|
3059 |
# Default namespace applies only to element type names.
|
|
3060 |
return $DEFAULT_NAMESPACE if $nodeType == 2; # 2: Attr
|
|
3061 |
#?? default namespace?
|
|
3062 |
$declAttName = "xmlns";
|
|
3063 |
}
|
|
3064 |
|
|
3065 |
do
|
|
3066 |
{
|
|
3067 |
my $ns = $element->xql_attribute ($declAttName);
|
|
3068 |
next unless defined $ns;
|
|
3069 |
return $ns->xql_rawText;
|
|
3070 |
|
|
3071 |
$element = $element->xql_parent;
|
|
3072 |
}
|
|
3073 |
while (defined ($element) and $element->xql_nodeType == 1);
|
|
3074 |
|
|
3075 |
# namespace not found
|
|
3076 |
undef;
|
|
3077 |
}
|
|
3078 |
|
|
3079 |
sub xql_basename
|
|
3080 |
{
|
|
3081 |
my ($self) = @_;
|
|
3082 |
my $nodeType = $self->xql_nodeType;
|
|
3083 |
return undef unless $nodeType == 1 || $nodeType == 2;
|
|
3084 |
|
|
3085 |
my $name = $self->xql_nodeName;
|
|
3086 |
$name =~ s/^[^:]://; # strip prefix
|
|
3087 |
$name;
|
|
3088 |
}
|
|
3089 |
|
|
3090 |
sub xql_prefix
|
|
3091 |
{
|
|
3092 |
my ($self) = @_;
|
|
3093 |
my $nodeType = $self->xql_nodeType;
|
|
3094 |
return undef unless $nodeType == 1 || $nodeType == 2;
|
|
3095 |
|
|
3096 |
$self->xql_nodeName =~ /^([^:]+):/;
|
|
3097 |
$1;
|
|
3098 |
}
|
|
3099 |
|
|
3100 |
# Used by ancestor()
|
|
3101 |
sub xql_parent
|
|
3102 |
{
|
|
3103 |
undef;
|
|
3104 |
}
|
|
3105 |
|
|
3106 |
my @NodeTypeString =
|
|
3107 |
(
|
|
3108 |
"", "element", "attribute", "text", "", "", "", "processing_instruction",
|
|
3109 |
"comment", "document"
|
|
3110 |
);
|
|
3111 |
|
|
3112 |
sub xql_nodeTypeString
|
|
3113 |
{
|
|
3114 |
my $i = $_[0]->xql_nodeType;
|
|
3115 |
return $NodeTypeString[$i] if ($i >= 1 && $i <= 3 || $i >= 7 && $i <= 9);
|
|
3116 |
|
|
3117 |
#?? what should this return?
|
|
3118 |
"<unknown xql_nodeType $i>";
|
|
3119 |
}
|
|
3120 |
|
|
3121 |
if (not $XML::XQL::Restricted)
|
|
3122 |
{
|
|
3123 |
require XML::XQL::Plus;
|
|
3124 |
}
|
|
3125 |
|
|
3126 |
# All nodes should implement:
|
|
3127 |
|
|
3128 |
#?? this section must be updated!!
|
|
3129 |
|
|
3130 |
# - xql_document
|
|
3131 |
# - xql_node: return an unblessed list reference with childNodes (not
|
|
3132 |
# attributes)
|
|
3133 |
# - xql_nodeType (default implementation for XML::XQL::Node returns 0):
|
|
3134 |
# Element: 1
|
|
3135 |
# Element Attribute: 2
|
|
3136 |
# Markup-Delimited Region of Text (Text and CDATASection): 3
|
|
3137 |
# Processing Instruction: 7
|
|
3138 |
# Comment: 8
|
|
3139 |
# Document (Entity): 9
|
|
3140 |
# - xql_text
|
|
3141 |
# - xql_value (default implementation is xql_text)
|
|
3142 |
# - xql_parent: return parent node or undef (Document, DocumentFragment)
|
|
3143 |
#
|
|
3144 |
# Element should define/override the following:
|
|
3145 |
# - xql_nodeName: return the element name
|
|
3146 |
# - xql_attribute("attributeName"): return an unblessed reference to a list
|
|
3147 |
# with the attribute, or [] if no such attribute
|
|
3148 |
# - xql_attribute(): return an unblessed reference to a list with
|
|
3149 |
# all attribute nodes
|
|
3150 |
# - xql_baseName, xql_prefix
|
|
3151 |
#
|
|
3152 |
# Attribute:
|
|
3153 |
# - xql_nodeName: return the attribute name
|
|
3154 |
# - xql_baseName, xql_prefix
|
|
3155 |
#
|
|
3156 |
# EntityReference:
|
|
3157 |
# - xql_data: return expanded text value
|
|
3158 |
#
|
|
3159 |
# Text, CDATASection:
|
|
3160 |
# - xql_data: return expanded text value
|
|
3161 |
#
|
|
3162 |
# -xql_element could be overriden to speed up performance
|
|
3163 |
#
|
|
3164 |
|
|
3165 |
1;
|
|
3166 |
|
|
3167 |
__END__
|
|
3168 |
|
|
3169 |
=head1 NAME
|
|
3170 |
|
|
3171 |
XML::XQL - A perl module for querying XML tree structures with XQL
|
|
3172 |
|
|
3173 |
=head1 SYNOPSIS
|
|
3174 |
|
|
3175 |
use XML::XQL;
|
|
3176 |
use XML::XQL::DOM;
|
|
3177 |
|
|
3178 |
$parser = new XML::DOM::Parser;
|
|
3179 |
$doc = $parser->parsefile ("file.xml");
|
|
3180 |
|
|
3181 |
# Return all elements with tagName='title' under the root element 'book'
|
|
3182 |
$query = new XML::XQL::Query (Expr => "book/title");
|
|
3183 |
@result = $query->solve ($doc);
|
|
3184 |
$query->dispose; # Avoid memory leaks - Remove circular references
|
|
3185 |
|
|
3186 |
# Or (to save some typing)
|
|
3187 |
@result = XML::XQL::solve ("book/title", $doc);
|
|
3188 |
|
|
3189 |
# Or (to save even more typing)
|
|
3190 |
@result = $doc->xql ("book/title");
|
|
3191 |
|
|
3192 |
=head1 DESCRIPTION
|
|
3193 |
|
|
3194 |
The XML::XQL module implements the XQL (XML Query Language) proposal
|
|
3195 |
submitted to the XSL Working Group in September 1998.
|
|
3196 |
The spec can be found at: L<http://www.w3.org/TandS/QL/QL98/pp/xql.html>
|
|
3197 |
Most of the contents related to the XQL syntax can also be found in the
|
|
3198 |
L<XML::XQL::Tutorial> that comes with this distribution.
|
|
3199 |
Note that XQL is not the same as XML-QL!
|
|
3200 |
|
|
3201 |
The current implementation only works with the L<XML::DOM> module, but once the
|
|
3202 |
design is stable and the major bugs are flushed out, other extensions might
|
|
3203 |
follow, e.g. for XML::Grove.
|
|
3204 |
|
|
3205 |
XQL was designed to be extensible and this implementation tries to stick to that.
|
|
3206 |
Users can add their own functions, methods, comparison operators and data types.
|
|
3207 |
Plugging in a new XML tree structure (like XML::Grove) should be a piece of cake.
|
|
3208 |
|
|
3209 |
To use the XQL module, either
|
|
3210 |
|
|
3211 |
use XML::XQL;
|
|
3212 |
|
|
3213 |
or
|
|
3214 |
|
|
3215 |
use XML::XQL::Strict;
|
|
3216 |
|
|
3217 |
The Strict module only provides the core XQL functionality as found in the
|
|
3218 |
XQL spec. By default (i.e. by using XML::XQL) you get 'XQL+', which has
|
|
3219 |
some additional features.
|
|
3220 |
|
|
3221 |
See the section L<Additional Features in XQL+> for the differences.
|
|
3222 |
|
|
3223 |
This module is still in development. See the To-do list in XQL.pm for what
|
|
3224 |
still needs to be done. Any suggestions are welcome, the sooner these
|
|
3225 |
implementation issues are resolved, the faster we can all use this module.
|
|
3226 |
|
|
3227 |
If you find a bug, you would do me great favor by sending it to me in the
|
|
3228 |
form of a test case. See the file t/xql_template.t that comes with this distribution.
|
|
3229 |
|
|
3230 |
If you have written a cool comparison operator, function, method or XQL data
|
|
3231 |
type that you would like to share, send it to enno@att.com and I will
|
|
3232 |
add it to this module.
|
|
3233 |
|
|
3234 |
=head1 XML::XQL global functions
|
|
3235 |
|
|
3236 |
=over 4
|
|
3237 |
|
|
3238 |
=item solve (QUERY_STRING, INPUT_LIST...)
|
|
3239 |
|
|
3240 |
@result = XML::XQL::solve ("doc//book", $doc);
|
|
3241 |
|
|
3242 |
This is provided as a shortcut for:
|
|
3243 |
|
|
3244 |
$query = new XML::XQL::Query (Expr => "doc//book");
|
|
3245 |
@result = $query->solve ($doc);
|
|
3246 |
$query->dispose;
|
|
3247 |
|
|
3248 |
Note that with L<XML::XQL::DOM>, you can also write (see L<XML::DOM::Node>
|
|
3249 |
for details):
|
|
3250 |
|
|
3251 |
@result = $doc->xql ("doc//book");
|
|
3252 |
|
|
3253 |
=item setDocParser (PARSER)
|
|
3254 |
|
|
3255 |
Sets the XML::DOM::Parser that is used by the new XQL+ document() method.
|
|
3256 |
By default it uses an XML::DOM::Parser that was created without any arguments,
|
|
3257 |
i.e.
|
|
3258 |
|
|
3259 |
$PARSER = new XML::DOM::Parser;
|
|
3260 |
|
|
3261 |
=item defineFunction (NAME, FUNCREF, ARGCOUNT [, ALLOWED_OUTSIDE [, CONST, [QUERY_ARG]]])
|
|
3262 |
|
|
3263 |
Defines the XQL function (at the global level, i.e. for all newly created
|
|
3264 |
queries) with the specified NAME. The ARGCOUNT parameter can either be a single
|
|
3265 |
number or a reference to a list with numbers.
|
|
3266 |
A single number expands to [ARGCOUNT, ARGCOUNT]. The list contains pairs of
|
|
3267 |
numbers, indicating the number of arguments that the function allows. The value
|
|
3268 |
-1 means infinity. E.g. [2, 5, 7, 9, 12, -1] means that the function can have
|
|
3269 |
2, 3, 4, 5, 7, 8, 9, 12 or more arguments.
|
|
3270 |
The number of arguments is checked when parsing the XQL query string.
|
|
3271 |
|
|
3272 |
The second parameter must be a reference to a Perl function or an anonymous
|
|
3273 |
sub. E.g. '\&my_func' or 'sub { ... code ... }'
|
|
3274 |
|
|
3275 |
If ALLOWED_OUTSIDE (default is 0) is set to 1, the function or method may
|
|
3276 |
also be used outside subqueries in I<node queries>.
|
|
3277 |
(See NodeQuery parameter in Query constructor)
|
|
3278 |
|
|
3279 |
If CONST (default is 0) is set to 1, the function is considered to be
|
|
3280 |
"constant". See L<Constant Function Invocations> for details.
|
|
3281 |
|
|
3282 |
If QUERY_ARG (default is 0) is not -1, the argument with that index is
|
|
3283 |
considered to be a 'query parameter'. If the query parameter is a subquery,
|
|
3284 |
that returns multiple values, the result list of the function invocation will
|
|
3285 |
contain one result value for each value of the subquery.
|
|
3286 |
E.g. 'length(book/author)' will return a list of Numbers, denoting the string
|
|
3287 |
lengths of all the author elements returned by 'book/author'.
|
|
3288 |
|
|
3289 |
Note that only methods (not functions) may appear after a Bang "!" operator.
|
|
3290 |
This is checked when parsing the XQL query string.
|
|
3291 |
|
|
3292 |
See also: defineMethod
|
|
3293 |
|
|
3294 |
=item generateFunction (NAME, FUNCNAME, RETURN_TYPE [, ARGCOUNT [, ALLOWED_OUTSIDE [, CONST [, QUERY_ARG]]]])
|
|
3295 |
|
|
3296 |
Generates and defines an XQL function wrapper for the Perl function with the
|
|
3297 |
name FUNCNAME. The function name will be NAME in XQL query expressions.
|
|
3298 |
The return type should be one of the builtin XQL Data Types or a class derived
|
|
3299 |
from XML::XQL::PrimitiveType (see L<Adding Data Types>.)
|
|
3300 |
See defineFunction for the meaning of ARGCOUNT, ALLOWED_OUTSIDE, CONST and
|
|
3301 |
QUERY_ARG.
|
|
3302 |
|
|
3303 |
Function values are always converted to Perl strings with xql_toString before
|
|
3304 |
they are passed to the Perl function implementation. The function return value
|
|
3305 |
is cast to an object of type RETURN_TYPE, or to the empty list [] if the
|
|
3306 |
result is undef. It uses expandType to expand XQL primitive type names.
|
|
3307 |
If RETURN_TYPE is "*", it returns the function
|
|
3308 |
result as is, unless the function result is undef, in which case it returns [].
|
|
3309 |
|
|
3310 |
=item defineMethod (NAME, FUNCREF, ARGCOUNT [, ALLOWED_OUTSIDE])
|
|
3311 |
|
|
3312 |
Defines the XQL method (at the global level, i.e. for all newly created
|
|
3313 |
queries) with the specified NAME. The ARGCOUNT parameter can either be a single
|
|
3314 |
number or a reference to a list with numbers.
|
|
3315 |
A single number expands to [ARGCOUNT, ARGCOUNT]. The list contains pairs of
|
|
3316 |
numbers, indicating the number of arguments that the method allows. The value
|
|
3317 |
-1 means infinity. E.g. [2, 5, 7, 9, 12, -1] means that the method can have
|
|
3318 |
2, 3, 4, 5, 7, 8, 9, 12 or more arguments.
|
|
3319 |
The number of arguments is checked when parsing the XQL query string.
|
|
3320 |
|
|
3321 |
The second parameter must be a reference to a Perl function or an anonymous
|
|
3322 |
sub. E.g. '\&my_func' or 'sub { ... code ... }'
|
|
3323 |
|
|
3324 |
If ALLOWED_OUTSIDE (default is 0) is set to 1, the function or method may
|
|
3325 |
also be used outside subqueries in I<node queries>.
|
|
3326 |
(See NodeQuery parameter in Query constructor)
|
|
3327 |
|
|
3328 |
Note that only methods (not functions) may appear after a Bang "!" operator.
|
|
3329 |
This is checked when parsing the XQL query string.
|
|
3330 |
|
|
3331 |
See also: defineFunction
|
|
3332 |
|
|
3333 |
=item defineComparisonOperators (NAME => FUNCREF [, NAME => FUNCREF]*)
|
|
3334 |
|
|
3335 |
Defines XQL comparison operators at the global level.
|
|
3336 |
The FUNCREF parameters must be a references to a Perl function or an anonymous
|
|
3337 |
sub. E.g. '\&my_func' or 'sub { ... code ... }'
|
|
3338 |
|
|
3339 |
E.g. define the operators $my_op$ and $my_op2$:
|
|
3340 |
|
|
3341 |
defineComparisonOperators ('my_op' => \&my_op,
|
|
3342 |
'my_op2' => sub { ... insert code here ... });
|
|
3343 |
|
|
3344 |
=item defineElementValueConvertor (TAG_NAME, FUNCREF)
|
|
3345 |
|
|
3346 |
Defines that the result of the value() call for Elements with the specified
|
|
3347 |
TAG_NAME uses the specified function. The function will receive
|
|
3348 |
two parameters. The second one is the TAG_NAME of the Element node
|
|
3349 |
and the first parameter is the Element node itself.
|
|
3350 |
FUNCREF should be a reference to a Perl function, e.g. \&my_sub, or
|
|
3351 |
an anonymous sub.
|
|
3352 |
|
|
3353 |
E.g. to define that all Elements with tag name 'date-of-birth' should return
|
|
3354 |
XML::XQL::Date objects:
|
|
3355 |
|
|
3356 |
defineElementValueConvertor ('date-of-birth', sub {
|
|
3357 |
my $elem = shift;
|
|
3358 |
# Always pass in the node as the second parameter. This is
|
|
3359 |
# the reference node for the object, which is used when
|
|
3360 |
# sorting values in document order.
|
|
3361 |
new XML::XQL::Date ($elem->xql_text, $elem);
|
|
3362 |
});
|
|
3363 |
|
|
3364 |
These convertors can only be specified at a global level, not on a per query
|
|
3365 |
basis. To undefine a convertor, simply pass a FUNCREF of undef.
|
|
3366 |
|
|
3367 |
=item defineAttrValueConvertor (ELEM_TAG_NAME, ATTR_NAME, FUNCREF)
|
|
3368 |
|
|
3369 |
Defines that the result of the value() call for Attributes with the specified
|
|
3370 |
ATTR_NAME and a parent Element with the specified ELEM_TAG_NAME
|
|
3371 |
uses the specified function. An ELEM_TAG_NAME of "*" will match regardless of
|
|
3372 |
the tag name of the parent Element. The function will receive
|
|
3373 |
3 parameters. The third one is the tag name of the parent Element (even if
|
|
3374 |
ELEM_TAG_NAME was "*"), the second is the ATTR_NAME and the first is the
|
|
3375 |
Attribute node itself.
|
|
3376 |
FUNCREF should be a reference to a Perl function, e.g. \&my_sub, or
|
|
3377 |
an anonymous sub.
|
|
3378 |
|
|
3379 |
These convertors can only be specified at a global level, not on a per query
|
|
3380 |
basis. To undefine a convertor, simply pass a FUNCREF of undef.
|
|
3381 |
|
|
3382 |
=item defineTokenQ (Q)
|
|
3383 |
|
|
3384 |
Defines the token for the q// string delimiters at a global level.
|
|
3385 |
The default value for XQL+ is 'q', for XML::XQL::Strict it is undef.
|
|
3386 |
A value of undef will deactivate this feature.
|
|
3387 |
|
|
3388 |
=item defineTokenQQ (QQ)
|
|
3389 |
|
|
3390 |
Defines the token for the qq// string delimiters at a global level.
|
|
3391 |
The default value for XQL+ is 'qq', for XML::XQL::Strict it is undef.
|
|
3392 |
A value of undef will deactivate this feature.
|
|
3393 |
|
|
3394 |
=item expandType (TYPE)
|
|
3395 |
|
|
3396 |
Used internally to expand type names of XQL primitive types.
|
|
3397 |
E.g. it expands "Number" to "XML::XQL::Number" and is not case-sensitive, so
|
|
3398 |
"number" and "NuMbEr" will both expand correctly.
|
|
3399 |
|
|
3400 |
=item defineExpandedTypes (ALIAS, FULL_NAME [, ...])
|
|
3401 |
|
|
3402 |
For each pair of arguments it allows the class name FULL_NAME to be abbreviated
|
|
3403 |
with ALIAS. The definitions are used by expandType().
|
|
3404 |
(ALIAS is always converted to lowercase internally, because expandType
|
|
3405 |
is case-insensitive.)
|
|
3406 |
|
|
3407 |
Overriding the ALIAS for "date", also affects the object type returned by the
|
|
3408 |
date() function.
|
|
3409 |
|
|
3410 |
=item setErrorContextDelimiters (START, END, BOLD_ON, BOLD_OFF)
|
|
3411 |
|
|
3412 |
Sets the delimiters used when printing error messages during query evaluation.
|
|
3413 |
The default delimiters on Unix are `tput smul` (underline on) and `tput rmal`
|
|
3414 |
(underline off). On other systems (that don't have tput), the delimiters are
|
|
3415 |
">>" and "<<" resp.
|
|
3416 |
|
|
3417 |
When printing the error message, the subexpression that caused the error will
|
|
3418 |
be enclosed by the delimiters, i.e. underlined on Unix.
|
|
3419 |
|
|
3420 |
For certain subexpressions the significant keyword, e.g. "$and$" is enclosed in
|
|
3421 |
the bold delimiters BOLD_ON (default: `tput bold` on Unix, "" elsewhere) and
|
|
3422 |
BOLD_OFF (default: (`tput rmul` . `tput smul`) on Unix, "" elsewhere,
|
|
3423 |
see $BoldOff in XML::XQL::XQL.pm for details.)
|
|
3424 |
|
|
3425 |
=item isEmptyList (VAR)
|
|
3426 |
|
|
3427 |
Returns 1 if VAR is [], else 0. Can be used in user defined functions.
|
|
3428 |
|
|
3429 |
=back
|
|
3430 |
|
|
3431 |
=head1 Additional Features in XQL+
|
|
3432 |
|
|
3433 |
=over 4
|
|
3434 |
|
|
3435 |
=item Parent operator '..'
|
|
3436 |
|
|
3437 |
The '..' operator returns the parent of the current node, where '.' would
|
|
3438 |
return the current node. This is not part of any XQL standard, because you
|
|
3439 |
would normally use return operators, which are not implemented here.
|
|
3440 |
|
|
3441 |
=item Sequence operators ';' and ';;'
|
|
3442 |
|
|
3443 |
The sequence operators ';' (precedes) and ';;' (immediately precedes) are
|
|
3444 |
not in the XQL spec, but are described in 'The Design of XQL' by Jonathan Robie
|
|
3445 |
who is one of the designers of XQL. It can be found at
|
|
3446 |
L<http://www.texcel.no/whitepapers/xql-design.html>
|
|
3447 |
See also the XQL Tutorial for a description of what they mean.
|
|
3448 |
|
|
3449 |
=item q// and qq// String Tokens
|
|
3450 |
|
|
3451 |
String tokens a la q// and qq// are allowed. q// evaluates like Perl's single
|
|
3452 |
quotes and qq// like Perl's double quotes. Note that the default XQL strings do
|
|
3453 |
not allow escaping etc., so it's not possible to define a string with both
|
|
3454 |
single and double quotes. If 'q' and 'qq' are not to your liking, you may
|
|
3455 |
redefine them to something else or undefine them altogether, by assigning undef
|
|
3456 |
to them. E.g:
|
|
3457 |
|
|
3458 |
# at a global level - shared by all queries (that don't (re)define 'q')
|
|
3459 |
XML::XQL::defineTokenQ ('k');
|
|
3460 |
XML::XQL::defineTokenQQ (undef);
|
|
3461 |
|
|
3462 |
# at a query level - only defined for this query
|
|
3463 |
$query = new XML::XQL::Query (Expr => "book/title", q => 'k', qq => undef);
|
|
3464 |
|
|
3465 |
From now on k// works like q// did and qq// doesn't work at all anymore.
|
|
3466 |
|
|
3467 |
=item Query strings can have embedded Comments
|
|
3468 |
|
|
3469 |
For example:
|
|
3470 |
|
|
3471 |
$queryExpr = "book/title # this comment is inside the query string
|
|
3472 |
[. = 'Moby Dick']"; # this comment is outside
|
|
3473 |
|
|
3474 |
=item Optional dollar delimiters and case-insensitive XQL keywords
|
|
3475 |
|
|
3476 |
The following XQL keywords are case-insensitive and the dollar sign delimiters
|
|
3477 |
may be omitted: $and$, $or$, $not$, $union$, $intersect$, $to$, $any$, $all$,
|
|
3478 |
$eq$, $ne$, $lt$, $gt$, $ge$, $le$, $ieq$, $ine$, $ilt$, $igt$, $ige$, $ile$.
|
|
3479 |
|
|
3480 |
E.g. $AND$, $And$, $aNd$, and, And, aNd are all valid replacements for $and$.
|
|
3481 |
|
|
3482 |
Note that XQL+ comparison operators ($match$, $no_match$, $isa$, $can$) still
|
|
3483 |
require dollar delimiters and are case-sensitive.
|
|
3484 |
|
|
3485 |
=item Comparison operator: $match$ or '=~'
|
|
3486 |
|
|
3487 |
E.g. "book/title =~ '/(Moby|Dick)/']" will return all book titles containing
|
|
3488 |
Moby or Dick. Note that the match expression needs to be quoted and should
|
|
3489 |
contain the // or m// delimiters for Perl.
|
|
3490 |
|
|
3491 |
When casting the values to be matched, both are converted to Text.
|
|
3492 |
|
|
3493 |
=item Comparison operator: $no_match$ or '!~'
|
|
3494 |
|
|
3495 |
E.g. "book/title !~ '/(Moby|Dick)/']" will return all book titles that don't
|
|
3496 |
contain Moby or Dick. Note that the match expression needs to be quoted and
|
|
3497 |
should contain the // or m// delimiters for Perl.
|
|
3498 |
|
|
3499 |
When casting the values to be matched, both are converted to Text.
|
|
3500 |
|
|
3501 |
=item Comparison operator: $isa$
|
|
3502 |
|
|
3503 |
E.g. '//. $isa$ "XML::XQL::Date"' returns all elements for which the value()
|
|
3504 |
function returns an XML::XQL::Date object. (Note that the value() function can
|
|
3505 |
be overridden to return a specific object type for certain elements and
|
|
3506 |
attributes.) It uses expandType to expand XQL primitive type names.
|
|
3507 |
|
|
3508 |
=item Comparison operator: $can$
|
|
3509 |
|
|
3510 |
E.g. '//. $can$ "swim"' returns all elements for which the value()
|
|
3511 |
function returns an object that implements the (Perl) swim() method.
|
|
3512 |
(Note that the value() function can be overridden to return a specific object
|
|
3513 |
type for certain elements and attributes.)
|
|
3514 |
|
|
3515 |
=item Function: once (QUERY)
|
|
3516 |
|
|
3517 |
E.g. 'once(id("foo"))' will evaluate the QUERY expression only once per query.
|
|
3518 |
Certain query results (like the above example) will always return the same
|
|
3519 |
value within a query. Using once() will cache the QUERY result for the
|
|
3520 |
rest of the query.
|
|
3521 |
|
|
3522 |
Note that "constant" function invocations are always cached.
|
|
3523 |
See also L<Constant Function Invocations>
|
|
3524 |
|
|
3525 |
=item Function: subst (QUERY, EXPR, EXPR [,MODIFIERS, [MODE]])
|
|
3526 |
|
|
3527 |
E.g. 'subst(book/title, "[M|m]oby", "Dick", "g")' will replace Moby or moby
|
|
3528 |
with Dick globally ("g") in all book title elements. Underneath it uses Perl's
|
|
3529 |
substitute operator s///. Don't worry about which delimiters are used underneath.
|
|
3530 |
The function returns all the book/titles for which a substitution occurred.
|
|
3531 |
The default MODIFIERS string is "" (empty.) The function name may be abbreviated
|
|
3532 |
to "s".
|
|
3533 |
|
|
3534 |
For most Node types, it converts the value() to a string (with xql_toString)
|
|
3535 |
to match the string and xql_setValue to set the new value in case it matched.
|
|
3536 |
For XQL primitives (Boolean, Number, Text) and other data types (e.g. Date) it
|
|
3537 |
uses xql_toString to match the String and xql_setValue to set the result.
|
|
3538 |
Beware that performing a substitution on a primitive that was found in the
|
|
3539 |
original XQL query expression, changes the value of that constant.
|
|
3540 |
|
|
3541 |
If MODE is 0 (default), it treats Element nodes differently by matching and
|
|
3542 |
replacing I<text blocks> occurring in the Element node. A text block is defined
|
|
3543 |
as the concatenation of the raw text of subsequent Text, CDATASection and
|
|
3544 |
EntityReference nodes. In this mode it skips embedded Element nodes.
|
|
3545 |
If a text block matches, it is replaced by a single Text node, regardless
|
|
3546 |
of the original node type(s).
|
|
3547 |
|
|
3548 |
If MODE is 1, it treats Element nodes like the other nodes, i.e. it converts
|
|
3549 |
the value() to a string etc. Note that the default implementation of value()
|
|
3550 |
calls text(), which normalizes whitespace and includes embedded Element
|
|
3551 |
descendants (recursively.) This is probably not what you want to use in most
|
|
3552 |
cases, but since I'm not a professional psychic... :-)
|
|
3553 |
|
|
3554 |
=item Function: map (QUERY, CODE)
|
|
3555 |
|
|
3556 |
E.g. 'map(book/title, "s/[M|m]oby/Dick/g; $_")' will replace Moby or moby
|
|
3557 |
with Dick globally ("g") in all book title elements. Underneath it uses Perl's
|
|
3558 |
map operator. The function returns all the book/titles for which a
|
|
3559 |
change occurred.
|
|
3560 |
|
|
3561 |
??? add more specifics
|
|
3562 |
|
|
3563 |
=item Function: eval (EXPR [,TYPE])
|
|
3564 |
|
|
3565 |
Evaluates the Perl expression EXPR and returns an object of the specified TYPE.
|
|
3566 |
It uses expandType to expand XQL primitive type names.
|
|
3567 |
If the result of the eval was undef, the empty list [] is returned.
|
|
3568 |
|
|
3569 |
E.g. 'eval("2 + 5", "Number")' returns a Number object with the value 7, and
|
|
3570 |
'eval("%ENV{USER}")' returns a Text object with the user name.
|
|
3571 |
|
|
3572 |
Consider using once() to cache the return value, when the invocation will
|
|
3573 |
return the same result for each invocation within a query.
|
|
3574 |
|
|
3575 |
??? add more specifics
|
|
3576 |
|
|
3577 |
=item Function: new (TYPE [, QUERY [, PAR] *])
|
|
3578 |
|
|
3579 |
Creates a new object of the specified object TYPE. The constructor may have any
|
|
3580 |
number of arguments. The first argument of the constructor (the 2nd argument
|
|
3581 |
of the new() function) is considered to be a 'query parameter'.
|
|
3582 |
See defineFunction for a definition of I<query parameter>.
|
|
3583 |
It uses expandType to expand XQL primitive type names.
|
|
3584 |
|
|
3585 |
=item Function: document (QUERY) or doc (QUERY)
|
|
3586 |
|
|
3587 |
The document() function creates a new L<XML::XML::Document> for each result
|
|
3588 |
of QUERY (QUERY may be a simple string expression, like "/usr/enno/file.xml".
|
|
3589 |
See t/xql_document.t or below for an example with a more complex QUERY.)
|
|
3590 |
|
|
3591 |
document() may be abbreviated to doc().
|
|
3592 |
|
|
3593 |
document() uses an XML::DOM::Parser underneath, which can be set with
|
|
3594 |
XML::XQL::setDocParser(). By default it uses a parser that was created without
|
|
3595 |
any arguments, i.e.
|
|
3596 |
|
|
3597 |
$PARSER = new XML::DOM::Parser;
|
|
3598 |
|
|
3599 |
Let's try a more complex example, assuming $doc contains:
|
|
3600 |
|
|
3601 |
<doc>
|
|
3602 |
<file name="file1.xml"/>
|
|
3603 |
<file name="file2.xml"/>
|
|
3604 |
</doc>
|
|
3605 |
|
|
3606 |
Then the following query will return two L<XML::XML::Document>s,
|
|
3607 |
one for file1.xml and one for file2.xml:
|
|
3608 |
|
|
3609 |
@result = XML::XQL::solve ("document(doc/file/@name)", $doc);
|
|
3610 |
|
|
3611 |
The resulting documents can be used as input for following queries, e.g.
|
|
3612 |
|
|
3613 |
@result = XML::XQL::solve ("document(doc/file/@name)/root/bla", $doc);
|
|
3614 |
|
|
3615 |
will return all /root/bla elements from the documents returned by document().
|
|
3616 |
|
|
3617 |
=item Method: DOM_nodeType ()
|
|
3618 |
|
|
3619 |
Returns the DOM node type. Note that these are mostly the same as nodeType(),
|
|
3620 |
except for CDATASection and EntityReference nodes. DOM_nodeType() returns
|
|
3621 |
4 and 5 respectively, whereas nodeType() returns 3, because they are
|
|
3622 |
considered text nodes.
|
|
3623 |
|
|
3624 |
=item Function wrappers for Perl builtin functions
|
|
3625 |
|
|
3626 |
XQL function wrappers have been provided for most Perl builtin functions.
|
|
3627 |
When using a Perl builtin function like "substr" in an XQL+ querry, an
|
|
3628 |
XQL function wrapper will be generated on the fly. The arguments to these
|
|
3629 |
functions may be regular XQL+ subqueries (that return one or more values) for
|
|
3630 |
a I<query parameter> (see generateFunction for a definition.)
|
|
3631 |
Most wrappers of Perl builtin functions have argument 0 for a query parameter,
|
|
3632 |
except for: chmod (parameter 1 is the query parameter), chown (2) and utime (2).
|
|
3633 |
The following functions have no query parameter, which means that all parameters
|
|
3634 |
should be a single value: atan2, rand, srand, sprintf, rename, unlink, system.
|
|
3635 |
|
|
3636 |
The function result is casted to the appropriate XQL primitive type (Number,
|
|
3637 |
Text or Boolean), or to an empty list if the result was undef.
|
|
3638 |
|
|
3639 |
=back
|
|
3640 |
|
|
3641 |
=head2 XPath functions and methods
|
|
3642 |
|
|
3643 |
The following functions were found in the XPath specification:
|
|
3644 |
|
|
3645 |
=over 4
|
|
3646 |
|
|
3647 |
=item Function: concat (STRING, STRING, STRING*)
|
|
3648 |
|
|
3649 |
The concat function returns the concatenation of its arguments.
|
|
3650 |
|
|
3651 |
=item Function: starts-with (STRING, STRING)
|
|
3652 |
|
|
3653 |
The starts-with function returns true if the first argument string starts with
|
|
3654 |
the second argument string, and otherwise returns false.
|
|
3655 |
|
|
3656 |
=item Function: contains (STRING, STRING)
|
|
3657 |
|
|
3658 |
The contains function returns true if the first argument string contains the
|
|
3659 |
second argument string, and otherwise returns false.
|
|
3660 |
|
|
3661 |
=item Function: substring-before (STRING, STRING)
|
|
3662 |
|
|
3663 |
The substring-before function returns the substring of the first argument
|
|
3664 |
string that precedes the first occurrence of the second argument string
|
|
3665 |
in the first argument string, or the empty string if the first argument
|
|
3666 |
string does not contain the second argument string. For example,
|
|
3667 |
|
|
3668 |
substring-before("1999/04/01","/") returns 1999.
|
|
3669 |
|
|
3670 |
=item Function: substring-after (STRING, STRING)
|
|
3671 |
|
|
3672 |
The substring-after function returns the substring of the first argument string
|
|
3673 |
that follows the first occurrence of the second argument string in
|
|
3674 |
the first argument string, or the empty string if the first argument string does
|
|
3675 |
not contain the second argument string. For example,
|
|
3676 |
|
|
3677 |
substring-after("1999/04/01","/") returns 04/01,
|
|
3678 |
|
|
3679 |
and
|
|
3680 |
|
|
3681 |
substring-after("1999/04/01","19") returns 99/04/01.
|
|
3682 |
|
|
3683 |
=item Function: substring (STRING, NUMBER [, NUMBER] )
|
|
3684 |
|
|
3685 |
The substring function returns the substring of the first argument starting at
|
|
3686 |
the position specified in the second argument with length specified in
|
|
3687 |
the third argument. For example,
|
|
3688 |
|
|
3689 |
substring("12345",2,3) returns "234".
|
|
3690 |
|
|
3691 |
If the third argument is not specified, it returns the substring
|
|
3692 |
starting at the position specified in the second argument and continuing to
|
|
3693 |
the end of the string. For example,
|
|
3694 |
|
|
3695 |
substring("12345",2) returns "2345".
|
|
3696 |
|
|
3697 |
More precisely, each character in the string is considered
|
|
3698 |
to have a numeric position: the position of the first character is 1,
|
|
3699 |
the position of the second character is 2 and so on.
|
|
3700 |
|
|
3701 |
NOTE: This differs from the B<substr> method , in which the
|
|
3702 |
method treats the position of the first character as 0.
|
|
3703 |
|
|
3704 |
The XPath spec says this about rounding, but that is not true in this
|
|
3705 |
implementation:
|
|
3706 |
I<The returned substring contains those characters for which the position of the
|
|
3707 |
character is greater than or equal to the rounded value of the
|
|
3708 |
second argument and, if the third argument is specified, less than the
|
|
3709 |
sum of the rounded value of the second argument and the rounded value of
|
|
3710 |
the third argument; the comparisons and addition used for the above
|
|
3711 |
follow the standard IEEE 754 rules; rounding is done as if by a call to the
|
|
3712 |
round function.>
|
|
3713 |
|
|
3714 |
=item Method: string-length ( [ QUERY ] )
|
|
3715 |
|
|
3716 |
The string-length returns the number of characters in the string.
|
|
3717 |
If the argument is omitted, it defaults to the context node
|
|
3718 |
converted to a string, in other words the string-value of the context node.
|
|
3719 |
|
|
3720 |
Note that the generated XQL wrapper for the Perl built-in B<substr> does not
|
|
3721 |
allow the argument to be omitted.
|
|
3722 |
|
|
3723 |
=item Method: normalize-space ( [ QUERY ] )
|
|
3724 |
|
|
3725 |
The normalize-space function returns the argument string with whitespace
|
|
3726 |
normalized by stripping leading and trailing whitespace and replacing
|
|
3727 |
sequences of whitespace characters by a single space. Whitespace characters are
|
|
3728 |
the same as those allowed by the S production in XML. If the
|
|
3729 |
argument is omitted, it defaults to the context node converted to a string, in
|
|
3730 |
other words the string-value of the context node.
|
|
3731 |
|
|
3732 |
=item Function: translate (STRING, STRING, STRING)
|
|
3733 |
|
|
3734 |
The translate function returns the first argument string with occurrences of
|
|
3735 |
characters in the second argument string replaced by the character at
|
|
3736 |
the corresponding position in the third argument string. For example,
|
|
3737 |
|
|
3738 |
translate("bar","abc","ABC") returns the string BAr.
|
|
3739 |
|
|
3740 |
If there is a
|
|
3741 |
character in the second argument string with no character at a corresponding
|
|
3742 |
position in the third argument string (because the second argument
|
|
3743 |
string is longer than the third argument string), then occurrences of that
|
|
3744 |
character in the first argument string are removed. For example,
|
|
3745 |
|
|
3746 |
translate("--aaa--","abc-","ABC") returns "AAA".
|
|
3747 |
|
|
3748 |
If a character occurs more than once in the second argument string, then the
|
|
3749 |
first occurrence determines the replacement character. If the third argument
|
|
3750 |
string is longer than the second argument string, then excess characters
|
|
3751 |
are ignored.
|
|
3752 |
|
|
3753 |
NOTE: The translate function is not a sufficient solution for case conversion
|
|
3754 |
in all languages. A future version may
|
|
3755 |
provide additional functions for case conversion.
|
|
3756 |
|
|
3757 |
This function was implemented using tr///d.
|
|
3758 |
|
|
3759 |
=item Function: sum ( QUERY )
|
|
3760 |
|
|
3761 |
The sum function returns the sum of the QUERY results, by
|
|
3762 |
converting the string values of each result to a number.
|
|
3763 |
|
|
3764 |
=item Function: floor (NUMBER)
|
|
3765 |
|
|
3766 |
The floor function returns the largest (closest to positive infinity) number
|
|
3767 |
that is not greater than the argument and that is an integer.
|
|
3768 |
|
|
3769 |
=item Function: ceiling (NUMBER)
|
|
3770 |
|
|
3771 |
The ceiling function returns the smallest (closest to negative infinity) number
|
|
3772 |
that is not less than the argument and that is an integer.
|
|
3773 |
|
|
3774 |
=item Function: round (NUMBER)
|
|
3775 |
|
|
3776 |
The round function returns the number that is closest to the argument
|
|
3777 |
and that is an integer. If there are two such numbers, then the one that is
|
|
3778 |
closest to positive infinity is returned.
|
|
3779 |
|
|
3780 |
=back
|
|
3781 |
|
|
3782 |
=head1 Implementation Details
|
|
3783 |
|
|
3784 |
=over 4
|
|
3785 |
|
|
3786 |
=item XQL Builtin Data Types
|
|
3787 |
|
|
3788 |
The XQL engine uses the following object classes internally. Only Number,
|
|
3789 |
Boolean and Text are considered I<primitive XQL types>:
|
|
3790 |
|
|
3791 |
=over 4
|
|
3792 |
|
|
3793 |
=item * XML::XQL::Number
|
|
3794 |
|
|
3795 |
For integers and floating point numbers.
|
|
3796 |
|
|
3797 |
=item * XML::XQL::Boolean
|
|
3798 |
|
|
3799 |
For booleans, e.g returned by true() and false().
|
|
3800 |
|
|
3801 |
=item * XML::XQL::Text
|
|
3802 |
|
|
3803 |
For string values.
|
|
3804 |
|
|
3805 |
=item * XML::XQL::Date
|
|
3806 |
|
|
3807 |
For date, time and date/time values. E.g. returned by the date() function.
|
|
3808 |
|
|
3809 |
=item * XML::XQL::Node
|
|
3810 |
|
|
3811 |
Superclass of all XML node types. E.g. all subclasses of XML::DOM::Node subclass
|
|
3812 |
from this.
|
|
3813 |
|
|
3814 |
=item * Perl list reference
|
|
3815 |
|
|
3816 |
Lists of values are passed by reference (i.e. using [] delimiters).
|
|
3817 |
The empty list [] has a double meaning. It also means 'undef' in certain
|
|
3818 |
situations, e.g. when a function invocation or comparison failed.
|
|
3819 |
|
|
3820 |
=back
|
|
3821 |
|
|
3822 |
=item Type casting in comparisons
|
|
3823 |
|
|
3824 |
When two values are compared in an XML comparison (e.g. $eq$) the values are
|
|
3825 |
first casted to the same data type. Node values are first replaced by their
|
|
3826 |
value() (i.e. the XQL value() function is used, which returns a Text value by
|
|
3827 |
default, but may return any data type if the user so chooses.)
|
|
3828 |
The resulting values are then casted to the type of the object with the highest
|
|
3829 |
xql_primType() value. They are as follows: Node (0), Text (1), Number (2),
|
|
3830 |
Boolean (3), Date (4), other data types (4 by default, but this may be
|
|
3831 |
overriden by the user.)
|
|
3832 |
|
|
3833 |
E.g. if one value is a Text value and the other is a Number, the Text value is
|
|
3834 |
cast to a Number and the resulting low-level (Perl) comparison is (for $eq$):
|
|
3835 |
|
|
3836 |
$number->xql_toString == $text->xql_toString
|
|
3837 |
|
|
3838 |
If both were Text values, it would have been
|
|
3839 |
|
|
3840 |
$text1->xql_toString eq $text2->xql_toString
|
|
3841 |
|
|
3842 |
Note that the XQL spec is vague and even conflicting where it concerns type
|
|
3843 |
casting. This implementation resulted after talking to Joe Lapp, one of the
|
|
3844 |
spec writers.
|
|
3845 |
|
|
3846 |
=item Adding Data Types
|
|
3847 |
|
|
3848 |
If you want to add your own data type, make sure it derives from
|
|
3849 |
XML::XQL::PrimitiveType and implements the necessary methods.
|
|
3850 |
|
|
3851 |
I will add more stuff here to explain it all, but for now, look at the code
|
|
3852 |
for the primitive XQL types or the Date class (L<XML::XQL::Date> in Date.pm.)
|
|
3853 |
|
|
3854 |
=item Document Order
|
|
3855 |
|
|
3856 |
The XQL spec states that query results always return their values in
|
|
3857 |
I<document order>, which means the order in which they appeared in the original
|
|
3858 |
XML document. Values extracted from Nodes (e.g. with value(), text(), rawText(),
|
|
3859 |
nodeName(), etc.) always have a pointer to the reference node (i.e. the Node
|
|
3860 |
from which the value was extracted.) These pointers are acknowledged when
|
|
3861 |
(intermediate) result lists are sorted. Currently, the only place where a
|
|
3862 |
result list is sorted is in a $union$ expression, which is the only place
|
|
3863 |
where the result list can be unordered.
|
|
3864 |
(If you find that this is not true, let me know.)
|
|
3865 |
|
|
3866 |
Non-node values that have no associated reference node, always end up at the end
|
|
3867 |
of the result list in the order that they were added.
|
|
3868 |
The XQL spec states that the reference node for an XML Attribute is the Element
|
|
3869 |
to which it belongs, and that the order of values with the same reference node
|
|
3870 |
is undefined. This means that the order of an Element and its attributes would
|
|
3871 |
be undefined.
|
|
3872 |
But since the XML::DOM module keeps track of the order of the attributes, the
|
|
3873 |
XQL engine does the same, and therefore, the attributes of an Element are
|
|
3874 |
sorted and appear after their parent Element in a sorted result list.
|
|
3875 |
|
|
3876 |
=item Constant Function Invocations
|
|
3877 |
|
|
3878 |
If a function always returns the same value when given "constant" arguments,
|
|
3879 |
the function is considered to be "constant". A "constant" argument can be
|
|
3880 |
either an XQL primitive (Number, Boolean, Text) or a "constant" function
|
|
3881 |
invocation. E.g.
|
|
3882 |
|
|
3883 |
date("12-03-1998")
|
|
3884 |
true()
|
|
3885 |
sin(0.3)
|
|
3886 |
length("abc")
|
|
3887 |
date(substr("12-03-1998 is the date", 0, 10))
|
|
3888 |
|
|
3889 |
are constant, but not:
|
|
3890 |
|
|
3891 |
length(book[2])
|
|
3892 |
|
|
3893 |
Results of constant function invocations are cached and calculated only once
|
|
3894 |
for each query. See also the CONST parameter in defineFunction.
|
|
3895 |
It is not necessary to wrap constant function invocations in a once() call.
|
|
3896 |
|
|
3897 |
Constant XQL functions are: date, true, false and a lot of the XQL+
|
|
3898 |
wrappers for Perl builtin functions. Function wrappers for certain builtins
|
|
3899 |
are not made constant on purpose to force the invocation to be evaluated
|
|
3900 |
every time, e.g. 'mkdir("/user/enno/my_dir", "0644")' (although constant
|
|
3901 |
in appearance) may return different results for multiple invocations.
|
|
3902 |
See %PerlFunc in Plus.pm for details.
|
|
3903 |
|
|
3904 |
=item Function: count ([QUERY])
|
|
3905 |
|
|
3906 |
The count() function has no parameters in the XQL spec. In this implementation
|
|
3907 |
it will return the number of QUERY results when passed a QUERY parameter.
|
|
3908 |
|
|
3909 |
=item Method: text ([RECURSE])
|
|
3910 |
|
|
3911 |
When expanding an Element node, the text() method adds the expanded text() value
|
|
3912 |
of sub-Elements. When RECURSE is set to 0 (default is 1), it will not include
|
|
3913 |
sub-elements. This is useful e.g. when using the $match$ operator in a recursive
|
|
3914 |
context (using the // operator), so it won't return parent Elements when one of
|
|
3915 |
the children matches.
|
|
3916 |
|
|
3917 |
=item Method: rawText ([RECURSE])
|
|
3918 |
|
|
3919 |
See text().
|
|
3920 |
|
|
3921 |
=back
|
|
3922 |
|
|
3923 |
=head1 SEE ALSO
|
|
3924 |
|
|
3925 |
L<XML::XQL::Query>, L<XML::XQL::DOM>, L<XML::XQL::Date>
|
|
3926 |
|
|
3927 |
The Japanese version of this document can be found on-line at
|
|
3928 |
L<http://member.nifty.ne.jp/hippo2000/perltips/xml/xql.htm>
|
|
3929 |
|
|
3930 |
The L<XML::XQL::Tutorial> manual page. The Japanese version can be found at
|
|
3931 |
L<http://member.nifty.ne.jp/hippo2000/perltips/xml/xql/tutorial.htm>
|
|
3932 |
|
|
3933 |
The XQL spec at L<http://www.w3.org/TandS/QL/QL98/pp/xql.html>
|
|
3934 |
|
|
3935 |
The Design of XQL at L<http://www.texcel.no/whitepapers/xql-design.html>
|
|
3936 |
|
|
3937 |
The DOM Level 1 specification at L<http://www.w3.org/TR/REC-DOM-Level-1>
|
|
3938 |
|
|
3939 |
The XML spec (Extensible Markup Language 1.0) at L<http://www.w3.org/TR/REC-xml>
|
|
3940 |
|
|
3941 |
The L<XML::Parser> and L<XML::Parser::Expat> manual pages.
|
|
3942 |
|
|
3943 |
=head1 AUTHOR
|
|
3944 |
|
|
3945 |
Please send bugs, comments and suggestions to Enno Derksen <F<enno@att.com>>
|
|
3946 |
|
|
3947 |
=cut
|