arabica/XPath/impl/xpath_step.hpp

432 lines
15 KiB
C++
Raw Normal View History

2005-08-04 22:42:30 +02:00
#ifndef ARABICA_XPATHIC_XPATH_STEP_H
#define ARABICA_XPATHIC_XPATH_STEP_H
#include <DOM/Document.h>
#include <algorithm>
#include "xpath_object.hpp"
#include "xpath_value.hpp"
#include "xpath_axis_enumerator.hpp"
#include "xpath_node_test.hpp"
#include "xpath_ast.hpp"
#include "xpath_ast_ids.hpp"
#include "xpath_namespace_context.hpp"
#include "xpath_compile_context.hpp"
namespace Arabica
{
namespace XPath
{
namespace impl
{
2005-08-04 22:42:30 +02:00
// Abstract base for one step of a location path.
// Holds the step's predicate expressions (deleted in the destructor) and
// offers derived classes a helper that filters a node set through them.
template<class string_type, class string_adaptor>
class StepExpression : public XPathExpression<string_type, string_adaptor>
{
  typedef std::vector<XPathExpression<string_type, string_adaptor>*> PredicateList;

public:
  StepExpression() { }
  StepExpression(const std::vector<XPathExpression<string_type, string_adaptor> *>& predicates) :
    predicates_(predicates)
  {
  } // StepExpression

  virtual ~StepExpression()
  {
    // the predicate expressions belong to this step
    typename PredicateList::iterator doomed = predicates_.begin();
    while(doomed != predicates_.end())
    {
      delete *doomed;
      ++doomed;
    } // while ...
  } // ~StepExpression

  virtual XPathValuePtr<string_type> evaluate(const DOM::Node<string_type>& context, const ExecutionContext<string_type, string_adaptor>& executionContext) const = 0;
  virtual XPathValuePtr<string_type> evaluate(NodeSet<string_type>& context, const ExecutionContext<string_type, string_adaptor>& executionContext) const = 0;

  // true when at least one predicate is attached to this step
  bool has_predicates() const { return !predicates_.empty(); }

protected:
  // Runs nodes through each predicate in turn, stopping early once nothing
  // is left. Note that nodes itself is overwritten with each filtered set;
  // the final set is also returned.
  NodeSet<string_type> applyPredicates(NodeSet<string_type>& nodes, const ExecutionContext<string_type, string_adaptor>& parentContext) const
  {
    typename PredicateList::const_iterator current = predicates_.begin();
    const typename PredicateList::const_iterator last = predicates_.end();
    while((current != last) && !nodes.empty())
    {
      nodes = applyPredicate(nodes, *current, parentContext);
      ++current;
    } // while ...
    return nodes;
  } // applyPredicates

private:
  // Evaluates predicate once per node, with the context position counting
  // up from 1 in iteration order, and returns the nodes that pass.
  NodeSet<string_type> applyPredicate(NodeSet<string_type>& nodes,
                                      XPathExpression<string_type, string_adaptor>* predicate,
                                      const ExecutionContext<string_type, string_adaptor>& parentContext) const
  {
    ExecutionContext<string_type, string_adaptor> predicateContext(nodes.size(), parentContext);
    NodeSet<string_type> survivors(nodes.forward());

    unsigned int position = 0;
    for(typename NodeSet<string_type>::iterator candidate = nodes.begin(); candidate != nodes.end(); ++candidate)
    {
      ++position;
      predicateContext.setPosition(position);
      XPathValuePtr<string_type> outcome = predicate->evaluate(*candidate, predicateContext);

      // a numeric result selects by position; anything else is taken as a boolean
      const bool wrongPosition = (outcome->type() == NUMBER) && (position != outcome->asNumber());
      if(!wrongPosition && outcome->asBool())
        survivors.push_back(*candidate);
    } // for ...
    return survivors;
  } // applyPredicate

  PredicateList predicates_;
}; // StepExpression
2005-08-18 22:54:26 +02:00
// A location step consisting of an axis and a node test, optionally followed
// by predicates. The NodeTest passed to the constructor is owned by the step
// and deleted in its destructor.
template<class string_type, class string_adaptor>
class TestStepExpression : public StepExpression<string_type, string_adaptor>
{
  typedef StepExpression<string_type, string_adaptor> baseT;
public:
  TestStepExpression(Axis axis, NodeTest<string_type>* test) :
    StepExpression<string_type, string_adaptor>(),
    axis_(axis),
    test_(test)
  {
  } // TestStepExpression

  TestStepExpression(Axis axis, NodeTest<string_type>* test,
                     const std::vector<XPathExpression<string_type, string_adaptor>*>& predicates) :
    StepExpression<string_type, string_adaptor>(predicates),
    axis_(axis),
    test_(test)
  {
  } // TestStepExpression

  virtual ~TestStepExpression()
  {
    delete test_;
  } // ~TestStepExpression

  // Applies the step to a single context node and returns the selected nodes.
  virtual XPathValuePtr<string_type> evaluate(const DOM::Node<string_type>& context, const ExecutionContext<string_type, string_adaptor>& executionContext) const
  {
    NodeSet<string_type> nodes;
    enumerateOver(context, nodes, executionContext);
    return XPathValuePtr<string_type>(new NodeSetValue<string_type, string_adaptor>(nodes));
  } // evaluate

  // Applies the step to every node of context in turn, gathering all the
  // selected nodes into one node set.
  virtual XPathValuePtr<string_type> evaluate(NodeSet<string_type>& context, const ExecutionContext<string_type, string_adaptor>& executionContext) const
  {
    NodeSet<string_type> nodes;
    for(typename NodeSet<string_type>::iterator n = context.begin(); n != context.end(); ++n)
      enumerateOver(*n, nodes, executionContext);
    return XPathValuePtr<string_type>(new NodeSetValue<string_type, string_adaptor>(nodes));
  } // evaluate

private:
  // Walks axis_ from context, keeps the nodes accepted by test_, filters them
  // through the predicates (if any) and appends what is left to results.
  // results may already hold nodes selected from earlier context nodes, so it
  // must only ever be added to, never replaced.
  void enumerateOver(const DOM::Node<string_type>& context,
                     NodeSet<string_type>& results,
                     const ExecutionContext<string_type, string_adaptor>& parentContext) const
  {
    AxisEnumerator<string_type, string_adaptor> enumerator(context, axis_);
    NodeSet<string_type> intermediate(enumerator.forward());
    // without predicates there is nothing to filter, so collect straight into results
    NodeSet<string_type>& d = (!baseT::has_predicates()) ? results : intermediate;
    while(*enumerator != 0)
    {
      // if test
      DOM::Node<string_type> node = *enumerator;
      if((*test_)(node))
        d.push_back(node);
      ++enumerator;
    } // while ...

    results.forward(enumerator.forward());
    if(!baseT::has_predicates())
      return;

    // Predicates are evaluated per context node, against this node's
    // candidates only. The survivors are appended: swapping them in would
    // throw away everything gathered from previous context nodes.
    intermediate = baseT::applyPredicates(intermediate, parentContext);
    for(typename NodeSet<string_type>::iterator n = intermediate.begin(); n != intermediate.end(); ++n)
      results.push_back(*n);
  } // enumerateOver

  Axis axis_;
  NodeTest<string_type>* test_;
}; // class TestStepExpression
2005-08-18 23:41:33 +02:00
// A step whose node set comes from evaluating an arbitrary expression rather
// than from an axis and node test. Any predicates are then applied to that
// node set. The wrapped expression is owned by the step and deleted in its
// destructor; the predicates are held (and deleted) by the StepExpression base.
template<class string_type, class string_adaptor>
class ExprStepExpression : public StepExpression<string_type, string_adaptor>
{
  typedef StepExpression<string_type, string_adaptor> baseT;
public:
  ExprStepExpression(XPathExpression<string_type, string_adaptor>* expr,
                     const std::vector<XPathExpression<string_type, string_adaptor>*>& predicates) :
    StepExpression<string_type, string_adaptor>(predicates),
    expr_(expr)
  {
  } // ExprStepExpression

  virtual ~ExprStepExpression()
  {
    delete expr_;
  } // ~ExprStepExpression

  // Evaluates the wrapped expression against context. With no predicates its
  // value is returned untouched; otherwise the value is taken as a node set
  // and filtered through the predicates.
  virtual XPathValuePtr<string_type> evaluate(const DOM::Node<string_type>& context, const ExecutionContext<string_type, string_adaptor>& executionContext) const
  {
    if(!baseT::has_predicates())
      return expr_->evaluate(context, executionContext);

    NodeSet<string_type> ns = expr_->evaluate(context, executionContext)->asNodeSet();
    return XPathValuePtr<string_type>(new NodeSetValue<string_type, string_adaptor>(baseT::applyPredicates(ns, executionContext)));
  } // evaluate

  // Evaluates against the node returned by context.top() only.
  virtual XPathValuePtr<string_type> evaluate(NodeSet<string_type>& context, const ExecutionContext<string_type, string_adaptor>& executionContext) const
  {
    DOM::Node<string_type> c = context.top();
    return evaluate(c, executionContext);
  } // evaluate

private:
  XPathExpression<string_type, string_adaptor>* expr_;
  // no predicates_ member here - the base class already stores the predicates,
  // and a second vector in this class was never filled in or read
}; // class ExprStepExpression
2005-08-18 23:45:14 +02:00
template<class string_type, class string_adaptor>
2005-08-04 22:42:30 +02:00
class StepFactory
{
public:
2005-08-18 23:45:14 +02:00
static StepExpression<string_type, string_adaptor>*
2005-09-25 22:09:49 +02:00
createStep(typename types<string_adaptor>::node_iter_t& node,
typename types<string_adaptor>::node_iter_t const& end,
2005-08-18 23:45:14 +02:00
CompilationContext<string_type, string_adaptor>& context)
2005-08-04 22:42:30 +02:00
{
Axis axis = getAxis(node);
2005-08-18 23:45:14 +02:00
NodeTest<string_type>* test = getTest(node, context.namespaceContext());
XPathExpression<string_type, string_adaptor>* thing = 0;
2005-08-04 22:42:30 +02:00
if(!test)
2005-08-18 23:45:14 +02:00
thing = XPath<string_type>::compile_expression(node++, context);
2005-08-04 22:42:30 +02:00
2005-08-18 23:45:14 +02:00
std::vector<XPathExpression<string_type, string_adaptor>*> preds;
2005-08-04 22:42:30 +02:00
2005-09-25 22:09:49 +02:00
while((node != end) && (getNodeId<string_adaptor>(node) == impl::Predicate_id))
2005-08-04 22:42:30 +02:00
{
2005-09-25 22:09:49 +02:00
typename types<string_adaptor>::node_iter_t c = node->children.begin();
assert(getNodeId<string_adaptor>(c) == impl::LeftSquare_id);
2005-08-04 22:42:30 +02:00
++c;
2005-08-18 23:45:14 +02:00
preds.push_back(XPath<string_type>::compile_expression(c, context));
2005-08-04 22:42:30 +02:00
++c;
2005-09-25 22:09:49 +02:00
assert(getNodeId<string_adaptor>(c) == impl::RightSquare_id);
2005-08-04 22:42:30 +02:00
++node;
} // if ...
if(!test)
2005-08-18 23:45:14 +02:00
return new ExprStepExpression<string_type, string_adaptor>(thing, preds);
return new TestStepExpression<string_type, string_adaptor>(axis, test, preds);
2005-08-04 22:42:30 +02:00
} // createStep
2005-09-25 22:09:49 +02:00
static StepExpression<string_type, string_adaptor>* createStep(typename types<string_adaptor>::node_iter_t& node, CompilationContext<string_type, string_adaptor>& context)
2005-08-04 22:42:30 +02:00
{
Axis axis = getAxis(node);
2005-08-18 23:45:14 +02:00
NodeTest<string_type>* test = getTest(node, context.namespaceContext());
return new TestStepExpression<string_type, string_adaptor>(axis, test);
2005-08-04 22:42:30 +02:00
} // createStep
private:
2005-09-25 22:09:49 +02:00
static Axis getAxis(typename types<string_adaptor>::node_iter_t& node)
2005-08-04 22:42:30 +02:00
{
2005-09-25 22:09:49 +02:00
long id = getNodeId<string_adaptor>(node);
2005-08-04 22:42:30 +02:00
switch(id)
{
2005-08-16 19:54:20 +02:00
case impl::Slash_id:
case impl::SelfSelect_id:
2005-08-04 22:42:30 +02:00
return SELF; // don't advance node, SelfSelect is axis specifier and node test in one
2005-08-16 19:54:20 +02:00
case impl::ParentSelect_id:
2005-08-04 22:42:30 +02:00
return PARENT;
2005-08-16 19:54:20 +02:00
case impl::SlashSlash_id:
2005-08-04 22:42:30 +02:00
return DESCENDANT_OR_SELF;
2005-08-16 19:54:20 +02:00
case impl::AbbreviatedAxisSpecifier_id:
2005-08-04 22:42:30 +02:00
++node;
return ATTRIBUTE;
2005-08-16 19:54:20 +02:00
case impl::AxisSpecifier_id:
2005-08-04 22:42:30 +02:00
// skip on to the next bit
break;
default:
return CHILD;
} // switch(id)
2005-09-25 22:09:49 +02:00
typename types<string_adaptor>::node_iter_t axis_node = node->children.begin();
long axis = getNodeId<string_adaptor>(skipWhitespace<string_adaptor>(axis_node));
2005-08-04 22:42:30 +02:00
++node;
switch(axis)
{
2005-08-16 19:54:20 +02:00
case impl::AncestorOrSelf_id:
2005-08-04 22:42:30 +02:00
return ANCESTOR_OR_SELF;
2005-08-16 19:54:20 +02:00
case impl::Ancestor_id:
2005-08-04 22:42:30 +02:00
return ANCESTOR;
2005-08-16 19:54:20 +02:00
case impl::AbbreviatedAxisSpecifier_id:
case impl::Attribute_id:
2005-08-04 22:42:30 +02:00
return ATTRIBUTE;
2005-08-16 19:54:20 +02:00
case impl::Child_id:
2005-08-04 22:42:30 +02:00
return CHILD;
2005-08-16 19:54:20 +02:00
case impl::DescendantOrSelf_id:
2005-08-04 22:42:30 +02:00
return DESCENDANT_OR_SELF;
2005-08-16 19:54:20 +02:00
case impl::Descendant_id:
2005-08-04 22:42:30 +02:00
return DESCENDANT;
2005-08-16 19:54:20 +02:00
case impl::FollowingSibling_id:
2005-08-04 22:42:30 +02:00
return FOLLOWING_SIBLING;
2005-08-16 19:54:20 +02:00
case impl::Following_id:
2005-08-04 22:42:30 +02:00
return FOLLOWING;
2005-08-16 19:54:20 +02:00
case impl::Namespace_id:
2005-08-04 22:42:30 +02:00
return NAMESPACE;
2005-08-16 19:54:20 +02:00
case impl::Parent_id:
2005-08-04 22:42:30 +02:00
return PARENT;
2005-08-16 19:54:20 +02:00
case impl::PrecedingSibling_id:
2005-08-04 22:42:30 +02:00
return PRECEDING_SIBLING;
2005-08-16 19:54:20 +02:00
case impl::Preceding_id:
2005-08-04 22:42:30 +02:00
return PRECEDING;
2005-08-16 19:54:20 +02:00
case impl::Self_id:
2005-08-04 22:42:30 +02:00
return SELF;
} // switch ...
assert(false);
return CHILD;
} // getAxis
2005-09-25 22:09:49 +02:00
static NodeTest<string_type>* getTest(typename types<string_adaptor>::node_iter_t& node, const NamespaceContext<string_type, string_adaptor>& namespaceContext)
2005-08-04 22:42:30 +02:00
{
2005-09-25 22:09:49 +02:00
long id = getNodeId<string_adaptor>(skipWhitespace<string_adaptor>(node));
2005-08-04 22:42:30 +02:00
switch(id)
{
2005-08-16 19:54:20 +02:00
case impl::NodeTest_id:
2005-08-04 22:42:30 +02:00
{
2005-09-25 22:09:49 +02:00
typename types<string_adaptor>::node_iter_t c = node->children.begin();
2005-08-18 23:45:14 +02:00
NodeTest<string_type>* t = getTest(c, namespaceContext);
2005-08-04 22:42:30 +02:00
++node;
return t;
} // case NodeTest_id
2005-08-16 19:54:20 +02:00
case impl::QName_id:
2005-08-04 22:42:30 +02:00
{
2005-09-25 22:09:49 +02:00
typename types<string_adaptor>::node_iter_t c = node->children.begin();
2005-09-30 23:36:11 +02:00
string_type prefix = string_adaptor::construct(c->value.begin(), c->value.end());
2005-08-18 23:45:14 +02:00
string_type uri = namespaceContext.namespaceURI(prefix);
2005-08-04 22:42:30 +02:00
++c;
2005-09-30 23:36:11 +02:00
string_type name = string_adaptor::construct(c->value.begin(), c->value.end());
2005-08-04 22:42:30 +02:00
++node;
2005-08-18 23:45:14 +02:00
return new QNameNodeTest<string_type>(uri, name);
2005-08-04 22:42:30 +02:00
} //case QName_id
2005-08-16 19:54:20 +02:00
case impl::NCName_id:
2005-08-04 22:42:30 +02:00
{
2005-09-30 23:36:11 +02:00
string_type name = string_adaptor::construct(node->value.begin(), node->value.end());
2005-08-04 22:42:30 +02:00
++node;
return new NameNodeTest<string_type, string_adaptor>(name);
2005-08-04 22:42:30 +02:00
} // case NameNodeTest
2005-08-16 19:54:20 +02:00
case impl::Comment_id:
2005-08-04 22:42:30 +02:00
{
++node;
2005-08-18 23:45:14 +02:00
return new CommentNodeTest<string_type>();
2005-08-04 22:42:30 +02:00
} // case CommentTest_id
2005-08-16 19:54:20 +02:00
case impl::Text_id:
2005-08-04 22:42:30 +02:00
{
++node;
2005-08-18 23:45:14 +02:00
return new TextNodeTest<string_type>();
2005-08-04 22:42:30 +02:00
} // case Text_id
2005-08-16 19:54:20 +02:00
case impl::ProcessingInstruction_id:
2005-08-04 22:42:30 +02:00
{
++node;
2005-09-25 22:09:49 +02:00
if(getNodeId<string_adaptor>(node) != impl::Literal_id) // not sure if this is always safe
return new ProcessingInstructionNodeTest<string_type, string_adaptor>();
2005-08-04 22:42:30 +02:00
2005-09-30 23:36:11 +02:00
string_type target = string_adaptor::construct(node->value.begin(), node->value.end());
2005-08-04 22:42:30 +02:00
++node;
return new ProcessingInstructionNodeTest<string_type, string_adaptor>(target);
2005-08-04 22:42:30 +02:00
} // case ProcessingInstruction_id
2005-08-16 19:54:20 +02:00
case impl::SlashSlash_id:
case impl::Node_id:
2005-08-04 22:42:30 +02:00
{
++node;
2005-08-18 23:45:14 +02:00
return new AnyNodeTest<string_type>();
2005-08-04 22:42:30 +02:00
} // case Node_id
2005-08-16 19:54:20 +02:00
case impl::Slash_id:
2005-08-18 23:45:14 +02:00
return new RootNodeTest<string_type>();
2005-08-04 22:42:30 +02:00
2005-08-16 19:54:20 +02:00
case impl::AnyName_id:
case impl::SelfSelect_id:
case impl::ParentSelect_id:
2005-08-04 22:42:30 +02:00
{
++node;
2005-08-18 23:45:14 +02:00
return new StarNodeTest<string_type>();
2005-08-04 22:42:30 +02:00
} // case AnyName_id:
2005-08-16 19:54:20 +02:00
case impl::NameTest_id:
2005-08-04 22:42:30 +02:00
{
2005-09-25 22:09:49 +02:00
typename types<string_adaptor>::node_iter_t prefixNode = node->children.begin();
2005-08-04 22:42:30 +02:00
++node;
2005-09-30 23:36:11 +02:00
string_type prefix = string_adaptor::construct(prefixNode->value.begin(), prefixNode->value.end());
2005-08-18 23:45:14 +02:00
string_type uri = namespaceContext.namespaceURI(prefix);
return new QStarNodeTest<string_type>(uri);
2005-08-04 22:42:30 +02:00
} // case
} // switch(id)
return 0;
} // getTest
StepFactory();
}; // class StepFactory
// A location path evaluated relative to the context node: a list of steps
// applied one after another. The steps are owned by the path and deleted in
// its destructor.
template<class string_type, class string_adaptor>
class RelativeLocationPath : public XPathExpression<string_type, string_adaptor>
{
  typedef StepList<string_type, string_adaptor> StepListT;

public:
  RelativeLocationPath(StepExpression<string_type, string_adaptor>* step) :
    steps_()
  {
    steps_.push_back(step);
  } // RelativeLocationPath

  RelativeLocationPath(const StepList<string_type, string_adaptor>& steps) :
    steps_(steps)
  {
  } // RelativeLocationPath

  virtual ~RelativeLocationPath()
  {
    typename StepListT::const_iterator step = steps_.begin();
    while(step != steps_.end())
    {
      delete *step;
      ++step;
    } // while ...
  } // ~RelativeLocationPath

  // Starts with a node set holding just context, then feeds the output of
  // each step into the next. The node set left after the last step is the
  // result.
  virtual XPathValuePtr<string_type> evaluate(const DOM::Node<string_type>& context, const ExecutionContext<string_type, string_adaptor>& executionContext) const
  {
    NodeSet<string_type> current;
    current.push_back(context);

    typename StepListT::const_iterator step = steps_.begin();
    while(step != steps_.end())
    {
      XPathValuePtr<string_type> selected = (*step)->evaluate(current, executionContext);
      current = selected->asNodeSet();
      ++step;
    } // while ...

    return XPathValuePtr<string_type>(new NodeSetValue<string_type, string_adaptor>(current));
  } // evaluate

private:
  StepListT steps_;
}; // RelativeLocationPath
// A location path evaluated from the top of the tree rather than from the
// context node itself.
template<class string_type, class string_adaptor>
class AbsoluteLocationPath : public RelativeLocationPath<string_type, string_adaptor>
{
  typedef RelativeLocationPath<string_type, string_adaptor> baseT;

public:
  AbsoluteLocationPath(StepExpression<string_type, string_adaptor>* step) :
    RelativeLocationPath<string_type, string_adaptor>(step)
  {
  } // AbsoluteLocationPath

  AbsoluteLocationPath(const StepList<string_type, string_adaptor>& steps) :
    RelativeLocationPath<string_type, string_adaptor>(steps)
  {
  } // AbsoluteLocationPath

  // Runs the steps from context when it is a document or document fragment
  // node, and from context's owner document in every other case.
  virtual XPathValuePtr<string_type> evaluate(const DOM::Node<string_type>& context, const ExecutionContext<string_type, string_adaptor>& executionContext) const
  {
    const int kind = context.getNodeType();
    const bool startsAtTop = (kind == DOM::Node<string_type>::DOCUMENT_NODE) ||
                             (kind == DOM::Node<string_type>::DOCUMENT_FRAGMENT_NODE);
    if(!startsAtTop)
    {
      DOM::Document<string_type> owner = context.getOwnerDocument();
      return baseT::evaluate(owner, executionContext);
    } // if ...

    return baseT::evaluate(context, executionContext);
  } // evaluate
}; // class AbsoluteLocationPath
} // impl
2005-08-04 22:42:30 +02:00
} // XPath
} // Arabica
#endif