Newer
Older
"""RQL Syntax tree annotator
:organization: Logilab
:copyright: 2003-2008 LOGILAB S.A. (Paris, FRANCE), all rights reserved.
:contact: http://www.logilab.fr/ -- mailto:contact@logilab.fr
from logilab.common.compat import any
from rql.utils import function_description
from rql.nodes import (VariableRef, Constant, Not, Exists, Function,
Variable, variable_refs)
class GoTo(Exception):
"""exception used to control the visit of the tree"""
def __init__(self, node):
self.node = node
class RQLSTChecker(object):
""" check a RQL syntax tree for errors not detected on parsing and
Some simple rewriting of the tree may be done too:
* if a OR is used on a symetric relation
* IN function with a single child
use assertions for internal error but specific `BadRQLQuery ` exception for
errors due to a bad rql input
errors = []
self._visit(node, errors)
if errors:
raise BadRQLQuery('%s\n** %s' % (node, '\n** '.join(errors)))
#if node.TYPE == 'select' and \
# not node.defined_vars and not node.get_restriction():
# result = []
# for term in node.selected_terms():
# result.append(term.eval(kwargs))
try:
node.accept(self, errors)
except GoTo, ex:
self._visit(ex.node, errors)
for c in node.children:
self._visit(c, errors)
node.leave(self, errors)
for i, term in enumerate(node.selection):
# selected terms are not included by the default visit,
# accept manually each of them
self._visit(term, errors)
def _check_selected(self, term, termtype, errors):
"""check that variables referenced in the given term are selected"""
# no stinfo yet, use references
for ovref in vref.variable.references():
rel = ovref.relation()
if rel is not None:
break
else:
msg = 'variable %s used in %s is not referenced by any relation'
# statement nodes #########################################################
nbselected = len(node.children[0].selection)
if not len(select.selection) == nbselected:
errors.append('when using union, all subqueries should have '
'the same number of selected terms')
def leave_union(self, node, errors):
pass
def visit_select(self, node, errors):
self._visit_selectedterm(node, errors)
# #XXX from should be added to children, no ?
# for subquery in node.from_:
# self.visit_union(subquery, errors)
# if node.sortterms:
# self._visit(node.sortterms, errors)
def leave_select(self, node, errors):
selected = node.selection
# check selected variable are used in restriction
if node.where is not None or len(selected) > 1:
self._check_selected(term, 'selection', errors)
if node.groupby:
# check that selected variables are used in groups
for var in node.selection:
if isinstance(var, VariableRef) and not var in node.groupby:
errors.append('variable %s should be grouped' % var)
for group in node.groupby:
self._check_selected(group, 'group', errors)
# # check that variables referenced in the given term are selected
# for term in node.orderby:
# for vref in term.iget_nodes(VariableRef):
# # no stinfo yet, use references
# try:
# for ovref in node.defined_vars[vref.name].references():
# rel = ovref.relation()
# if rel is not None:
# break
# else:
# msg = 'variable %s used in %s is not referenced by %s'
# errors.append(msg % (vref.name, termtype, node.as_string()))
# except KeyError:
# msg = 'variable %s used in %s is not referenced by %s'
# errors.append(msg % (vref.name, termtype, node.as_string()))
def visit_insert(self, insert, errors):
self._visit_selectedterm(insert, errors)
def leave_insert(self, node, errors):
def visit_delete(self, delete, errors):
self._visit_selectedterm(delete, errors)
def visit_set(self, update, errors):
def leave_set(self, node, errors):
# tree nodes ##############################################################
def visit_exists(self, node, errors):
pass
def leave_exists(self, node, errors):
pass
def visit_subquery(self, node, errors):
def leave_subquery(self, node, errors):
pass
def visit_sortterm(self, sortterm, errors):
if isinstance(term, Constant):
for select in sortterm.root.children:
if len(select.selection) < term.value:
for vref in tvref.variable.references():
if vref.relation() or vref in stmt.selection:
break
else:
msg = 'sort variable %s is not referenced any where else'
errors.append(msg % tvref.name)
def leave_sortterm(self, node, errors):
pass
def visit_and(self, et, errors):
assert len(et.children) == 2, len(et.children)
def leave_and(self, node, errors):
pass
def visit_or(self, ou, errors):
assert len(ou.children) == 2, len(ou.children)
try:
r1type = r1.r_type
r2type = r2.r_type
except AttributeError:
return # can't be
if r1type == r2type and self.schema.rschema(r1type).symetric:
lhs1, rhs1 = r1.get_variable_parts()
lhs2, rhs2 = r2.get_variable_parts()
try:
if (lhs1.variable is rhs2.variable and
rhs1.variable is lhs2.variable):
for vref in r2.get_nodes(VariableRef):
def leave_or(self, node, errors):
pass
def visit_not(self, not_, errors):
pass
def leave_not(self, not_, errors):
pass
def visit_relation(self, relation, errors):
errors.append("can use optional relation under NOT (%s)"
% relation.as_string())
# special case "X identity Y"
if relation.r_type == 'identity':
assert not isinstance(relation.parent, Not)
elif relation.r_type == 'is':
# special case "C is NULL"
if relation.children[1].operator == 'IS':
lhs, rhs = relation.children
assert isinstance(lhs, VariableRef), lhs
assert isinstance(rhs.children[0], Constant)
assert rhs.operator == 'IS', rhs.operator
assert rhs.children[0].type == None
elif not relation.r_type in self.schema:
errors.append('unknown relation %s' % relation.r_type)
#assert isinstance(lhs, VariableRef), '%s: %s' % (lhs.__class__,
assert len(comparison.children) in (1,2), len(comparison.children)
def leave_comparison(self, node, errors):
pass
def visit_mathexpression(self, mathexpr, errors):
assert len(mathexpr.children) == 2, len(mathexpr.children)
def leave_mathexpression(self, node, errors):
pass
try:
funcdescr = function_description(function.name)
except KeyError:
errors.append('unknown function "%s"' % function.name)
else:
try:
funcdescr.check_nbargs(len(function.children))
except BadRQLQuery, ex:
errors.append(str(ex))
if funcdescr.aggregat:
if isinstance(function.children[0], Function) and \
errors.append('can\'t nest aggregat functions')
if funcdescr.name == 'IN':
assert function.parent.operator == '='
if len(function.children) == 1:
function.parent.append(function.children[0])
function.parent.remove(function)
else:
assert len(function.children) >= 1
def leave_function(self, node, errors):
pass
def visit_variableref(self, variableref, errors):
assert len(variableref.children)==0
## try:
## assert variableref.variable in variableref.root().defined_vars.values(), \
## (variableref.root(), variableref.variable, variableref.root().defined_vars)
## except AttributeError:
## raise Exception((variableref.root(), variableref.variable))
def leave_variableref(self, node, errors):
pass
def visit_constant(self, constant, errors):
assert len(constant.children)==0
if constant.type == 'etype':
if constant.relation().r_type != 'is':
msg ='using an entity type in only allowed with "is" relation'
errors.append(msg)
if not constant.value in self.schema:
errors.append('unknown entity type %s' % constant.value)
def leave_constant(self, node, errors):
pass
class RQLSTAnnotator(object):
""" annotate RQL syntax tree to ease further code generation from it.
If an optional variable is shared among multiple scopes, it's rewritten to
use identity relation.
"""
def __init__(self, schema, special_relations=None):
self.schema = schema
self.special_relations = special_relations or {}
def annotate(self, node):
node.annotated = True
def _visit_stmt(self, node):
for var in node.defined_vars.itervalues():
var.prepare_annotation()
for i, term in enumerate(node.selection):
for func in term.iget_nodes(Function):
if func.descr().aggregat:
node.has_aggregat = True
break
for vref in variable_refs(term):
vref.variable.stinfo['selected'].add(i)
vref.variable.set_scope(node)
if node.where is not None:
node.where.accept(self, node)
visit_insert = visit_delete = visit_set = _visit_stmt
def visit_union(self, node):
for select in node.children:
self.visit_select(select)
def visit_select(self, node):
if node.with_ is not None:
for subquery in node.with_:
self.visit_union(subquery.query)
self._visit_stmt(node)
def rewrite_shared_optional(self, exists, var):
"""if variable is shared across multiple scopes, need some tree
rewriting
"""
newvar = var.stmt.make_variable()
Sylvain
committed
newvar.prepare_annotation()
if vref.scope is exists:
newvref = VariableRef(newvar)
vref.parent.replace(vref, newvref)
# update stinfo structure which may have already been
# partially processed
if rel in var.stinfo['rhsrelations']:
lhs, rhs = rel.get_parts()
if vref is rhs.children[0] and \
self.schema.rschema(rel.r_type).is_final():
update_attrvars(newvar, rel, lhs)
lhsvar = getattr(lhs, 'variable', None)
var.stinfo['attrvars'].remove( (lhsvar, rel.r_type) )
if var.stinfo['attrvar'] is lhsvar:
if var.stinfo['attrvars']:
var.stinfo['attrvar'] = iter(var.stinfo['attrvars']).next()
else:
var.stinfo['attrvar'] = None
var.stinfo['rhsrelations'].remove(rel)
newvar.stinfo['rhsrelations'].add(rel)
for stinfokey in ('blocsimplification','typerels', 'uidrels',
'relations', 'optrelations'):
try:
var.stinfo[stinfokey].remove(rel)
newvar.stinfo[stinfokey].add(rel)
except KeyError:
continue
# shared references
newvar.stinfo['constnode'] = var.stinfo['constnode']
if newvar.stmt.solutions: # solutions already computed
newvar.stinfo['possibletypes'] = var.stinfo['possibletypes']
for sol in newvar.stmt.solutions:
sol[newvar.name] = sol[var.name]
rel = exists.add_relation(var, 'identity', newvar)
# we have to force visit of the introduced relation
self.visit_relation(rel, exists)
return newvar
return None
# tree nodes ##############################################################
def visit_exists(self, node, scope):
node.children[0].accept(self, node)
def visit_not(self, node, scope):
node.children[0].accept(self, scope)
def visit_and(self, node, scope):
node.children[0].accept(self, scope)
node.children[1].accept(self, scope)
visit_or = visit_and
def visit_relation(self, relation, scope):
assert relation.parent, repr(relation)
# may be a constant once rqlst has been simplified
lhsvar = getattr(lhs, 'variable', None)
if not isinstance(lhsvar, Variable):
if relation.is_types_restriction():
assert rhs.operator == '='
assert not relation.optional
if lhsvar is not None:
lhsvar.stinfo['typerels'].add(relation)
return
if relation.optional is not None:
exists = relation.scope
if not isinstance(exists, Exists):
exists = None
if lhsvar is not None:
if exists is not None:
newvar = self.rewrite_shared_optional(exists, lhsvar)
if newvar is not None:
lhsvar = newvar
if relation.optional == 'right':
elif relation.optional == 'both':
lhsvar.stinfo['optrelations'].add(relation)
elif relation.optional == 'left':
lhsvar.stinfo['optrelations'].add(relation)
try:
rhsvar = rhs.children[0].variable
if exists is not None:
newvar = self.rewrite_shared_optional(exists, rhsvar)
if newvar is not None:
rhsvar = newvar
if relation.optional == 'right':
rhsvar.stinfo['optrelations'].add(relation)
elif relation.optional == 'both':
rhsvar.stinfo['optrelations'].add(relation)
elif relation.optional == 'left':
except AttributeError:
# may have been rewritten as well
pass
rtype = relation.r_type
try:
rschema = self.schema.rschema(rtype)
except KeyError:
raise BadRQLQuery('no relation %s' % rtype)
if lhsvar is not None:
lhsvar.set_scope(scope)
lhsvar.stinfo['relations'].add(relation)
if rtype in self.special_relations:
key = '%srels' % self.special_relations[rtype]
if key == 'uidrels':
constnode = relation.get_variable_parts()[1]
if not (relation.operator() != '=' or
isinstance(relation.parent, Not)):
if isinstance(constnode, Constant):
lhsvar.stinfo['constnode'] = constnode
lhsvar.stinfo.setdefault(key, set()).add(relation)
else:
lhsvar.stinfo.setdefault(key, set()).add(relation)
elif rschema.is_final() or rschema.inlined:
lhsvar.stinfo['blocsimplification'].add(relation)
for vref in variable_refs(rhs):
var = vref.variable
var.set_scope(scope)
var.stinfo['relations'].add(relation)
var.stinfo['rhsrelations'].add(relation)
update_attrvars(var, relation, lhs)
def update_attrvars(var, relation, lhs):
lhsvar = getattr(lhs, 'variable', None)
var.stinfo['attrvars'].add( (lhsvar, relation.r_type) )
# give priority to variable which is not in an EXISTS as
# "main" attribute variable
if var.stinfo['attrvar'] is None or not isinstance(relation.scope, Exists):
var.stinfo['attrvar'] = lhsvar or lhs