Skip to content
Snippets Groups Projects
stcheck.py 19.2 KiB
Newer Older
"""RQL Syntax tree annotator

:organization: Logilab
:copyright: 2003-2008 LOGILAB S.A. (Paris, FRANCE), all rights reserved.
:contact: http://www.logilab.fr/ -- mailto:contact@logilab.fr
Nicolas Chauvat's avatar
Nicolas Chauvat committed
"""
__docformat__ = "restructuredtext en"
Nicolas Chauvat's avatar
Nicolas Chauvat committed

from logilab.common.compat import any

Nicolas Chauvat's avatar
Nicolas Chauvat committed
from rql._exceptions import BadRQLQuery
from rql.utils import function_description
from rql.nodes import (VariableRef, Constant, Not, Exists, Function,
                       Variable, variable_refs)
Sylvain Thenault's avatar
Sylvain Thenault committed
from rql.stmts import Union
Sylvain's avatar
Sylvain committed

Sylvain's avatar
Sylvain committed
class GoTo(Exception):
    """exception used to control the visit of the tree"""
    def __init__(self, node):
        self.node = node
        

Sylvain's avatar
Sylvain committed
class RQLSTChecker(object):
    """ check a RQL syntax tree for errors not detected on parsing and

    Some simple rewriting of the tree may be done too:
    * if a OR is used on a symetric relation
    * IN function with a single child
Nicolas Chauvat's avatar
Nicolas Chauvat committed
    
Sylvain's avatar
Sylvain committed
    use assertions for internal error but specific `BadRQLQuery ` exception for
    errors due to a bad rql input
Nicolas Chauvat's avatar
Nicolas Chauvat committed
    """

Sylvain's avatar
Sylvain committed
    def __init__(self, schema):
Nicolas Chauvat's avatar
Nicolas Chauvat committed
        self.schema = schema

Sylvain's avatar
Sylvain committed
    def check(self, node):
Nicolas Chauvat's avatar
Nicolas Chauvat committed
        errors = []
        self._visit(node, errors)
        if errors:
Sylvain's avatar
Sylvain committed
            raise BadRQLQuery('%s\n** %s' % (node, '\n** '.join(errors)))
Sylvain's avatar
Sylvain committed
        #if node.TYPE == 'select' and \
        #       not node.defined_vars and not node.get_restriction():
        #    result = []
        #    for term in node.selected_terms():
        #        result.append(term.eval(kwargs))
            
Nicolas Chauvat's avatar
Nicolas Chauvat committed
    def _visit(self, node, errors):
Sylvain's avatar
Sylvain committed
        try:
            node.accept(self, errors)
        except GoTo, ex:
            self._visit(ex.node, errors)
Sylvain's avatar
Sylvain committed
            for c in node.children:
                self._visit(c, errors)
Sylvain's avatar
Sylvain committed
            
    def _visit_selectedterm(self, node, errors):
        for i, term in enumerate(node.selection):
Sylvain's avatar
Sylvain committed
            # selected terms are not included by the default visit,
            # accept manually each of them
            self._visit(term, errors)
Sylvain's avatar
Sylvain committed
                    
    def _check_selected(self, term, termtype, errors):
        """check that variables referenced in the given term are selected"""
Sylvain Thenault's avatar
Sylvain Thenault committed
        for vref in variable_refs(term):
Sylvain's avatar
Sylvain committed
            # no stinfo yet, use references
            for ovref in vref.variable.references():
                rel = ovref.relation()
                if rel is not None:
                    break
            else:
                msg = 'variable %s used in %s is not referenced by any relation'
Sylvain's avatar
Sylvain committed
                errors.append(msg % (vref.name, termtype))
Sylvain's avatar
Sylvain committed
                
Sylvain's avatar
Sylvain committed
    # statement nodes #########################################################
Nicolas Chauvat's avatar
Nicolas Chauvat committed

Sylvain's avatar
Sylvain committed
    def visit_union(self, node, errors):
        nbselected = len(node.children[0].selection)
Sylvain's avatar
Sylvain committed
        for select in node.children[1:]:
            if not len(select.selection) == nbselected:
Sylvain's avatar
Sylvain committed
                errors.append('when using union, all subqueries should have '
                              'the same number of selected terms')            
Sylvain's avatar
Sylvain committed
    def leave_union(self, node, errors):
        pass
    
    def visit_select(self, node, errors):
        self._visit_selectedterm(node, errors)
#         #XXX from should be added to children, no ?
#         for subquery in node.from_:
#             self.visit_union(subquery, errors)
#         if node.sortterms:
#             self._visit(node.sortterms, errors)            
    def leave_select(self, node, errors):
        selected = node.selection
Sylvain's avatar
Sylvain committed
        # check selected variable are used in restriction
        if node.where is not None or len(selected) > 1:
Sylvain's avatar
Sylvain committed
            for term in selected:
                self._check_selected(term, 'selection', errors)
        if node.groupby:
            # check that selected variables are used in groups
            for var in node.selection:
                if isinstance(var, VariableRef) and not var in node.groupby:
                    errors.append('variable %s should be grouped' % var)
            for group in node.groupby:
                self._check_selected(group, 'group', errors)
#         # check that variables referenced in the given term are selected
#         for term in node.orderby:
#             for vref in term.iget_nodes(VariableRef):
#                 # no stinfo yet, use references
#                 try:
#                     for ovref in node.defined_vars[vref.name].references():
#                         rel = ovref.relation()
#                         if rel is not None:
#                             break
#                     else:
#                         msg = 'variable %s used in %s is not referenced by %s'
#                         errors.append(msg % (vref.name, termtype, node.as_string()))
#                 except KeyError:
#                     msg = 'variable %s used in %s is not referenced by %s'
#                     errors.append(msg % (vref.name, termtype, node.as_string()))
Sylvain's avatar
Sylvain committed

    def visit_insert(self, insert, errors):
        self._visit_selectedterm(insert, errors)
    def leave_insert(self, node, errors):
Sylvain's avatar
Sylvain committed
        pass
Sylvain's avatar
Sylvain committed

    def visit_delete(self, delete, errors):
        self._visit_selectedterm(delete, errors)
Sylvain's avatar
Sylvain committed
    def leave_delete(self, node, errors):
        pass
Sylvain's avatar
Sylvain committed
        
    def visit_set(self, update, errors):
Sylvain's avatar
Sylvain committed
        self._visit_selectedterm(update, errors)
    def leave_set(self, node, errors):
Sylvain's avatar
Sylvain committed
        pass                
Sylvain's avatar
Sylvain committed

    # tree nodes ##############################################################
Sylvain's avatar
Sylvain committed
    
    def visit_exists(self, node, errors):
        pass
    def leave_exists(self, node, errors):
        pass
    
    def visit_subquery(self, node, errors):
Sylvain's avatar
Sylvain committed
        pass
    def leave_subquery(self, node, errors):
        pass 
Sylvain's avatar
Sylvain committed
    
    def visit_sortterm(self, sortterm, errors):
Sylvain's avatar
Sylvain committed
        term = sortterm.term
        if isinstance(term, Constant):
            for select in sortterm.root.children:
                if len(select.selection) < term.value:
Sylvain Thenault's avatar
Sylvain Thenault committed
                    errors.append('order column out of bound %s' % term.value)
Sylvain's avatar
Sylvain committed
        else:
            stmt = term.stmt
Sylvain's avatar
Sylvain committed
            for tvref in variable_refs(term):
Sylvain's avatar
Sylvain committed
                for vref in tvref.variable.references():
                    if vref.relation() or vref in stmt.selection:
                        break
                else:
                    msg = 'sort variable %s is not referenced any where else'
                    errors.append(msg % tvref.name)
                    
    def leave_sortterm(self, node, errors):
        pass
Nicolas Chauvat's avatar
Nicolas Chauvat committed
    
    def visit_and(self, et, errors):
        assert len(et.children) == 2, len(et.children)
    def leave_and(self, node, errors):
        pass
Nicolas Chauvat's avatar
Nicolas Chauvat committed
        
    def visit_or(self, ou, errors):
        assert len(ou.children) == 2, len(ou.children)
Sylvain's avatar
Sylvain committed
        # simplify Ored expression of a symetric relation
Nicolas Chauvat's avatar
Nicolas Chauvat committed
        r1, r2 = ou.children[0], ou.children[1]
Sylvain's avatar
Sylvain committed
        try:
            r1type = r1.r_type
            r2type = r2.r_type
        except AttributeError:
            return # can't be
syt's avatar
syt committed
        if r1type == r2type and self.schema.rschema(r1type).symetric:
Nicolas Chauvat's avatar
Nicolas Chauvat committed
            lhs1, rhs1 = r1.get_variable_parts()
            lhs2, rhs2 = r2.get_variable_parts()
            try:
                if (lhs1.variable is rhs2.variable and
                    rhs1.variable is lhs2.variable):
Sylvain's avatar
Sylvain committed
                    ou.parent.replace(ou, r1)
                    for vref in r2.get_nodes(VariableRef):
                        vref.unregister_reference()
Sylvain's avatar
Sylvain committed
                    raise GoTo(r1)
Nicolas Chauvat's avatar
Nicolas Chauvat committed
            except AttributeError:
Sylvain's avatar
Sylvain committed
                pass
    def leave_or(self, node, errors):
        pass

    def visit_not(self, not_, errors):
        pass
    def leave_not(self, not_, errors):
        pass
    
    def visit_relation(self, relation, errors):
Sylvain's avatar
Sylvain committed
        if relation.optional and relation.neged():
                errors.append("can use optional relation under NOT (%s)"
                              % relation.as_string())
        # special case "X identity Y"
        if relation.r_type == 'identity':
Sylvain's avatar
Sylvain committed
            lhs, rhs = relation.children
            assert not isinstance(relation.parent, Not)
            assert rhs.operator == '='
Sylvain's avatar
Sylvain committed
        elif relation.r_type == 'is':
            # special case "C is NULL"
            if relation.children[1].operator == 'IS':
                lhs, rhs = relation.children
                assert isinstance(lhs, VariableRef), lhs
                assert isinstance(rhs.children[0], Constant)
                assert rhs.operator == 'IS', rhs.operator
                assert rhs.children[0].type == None
        elif not relation.r_type in self.schema:
            errors.append('unknown relation %s' % relation.r_type)
        
Sylvain's avatar
Sylvain committed
    def leave_relation(self, relation, errors):
Sylvain's avatar
Sylvain committed
        pass
        #assert isinstance(lhs, VariableRef), '%s: %s' % (lhs.__class__,
Sylvain's avatar
Sylvain committed
        #                                                       relation)
Sylvain's avatar
Sylvain committed
        
Nicolas Chauvat's avatar
Nicolas Chauvat committed
    def visit_comparison(self, comparison, errors):
Sylvain's avatar
Sylvain committed
        assert len(comparison.children) in (1,2), len(comparison.children)
    def leave_comparison(self, node, errors):
        pass
Nicolas Chauvat's avatar
Nicolas Chauvat committed
    
    def visit_mathexpression(self, mathexpr, errors):
        assert len(mathexpr.children) == 2, len(mathexpr.children)
    def leave_mathexpression(self, node, errors):
        pass
Nicolas Chauvat's avatar
Nicolas Chauvat committed
        
    def visit_function(self, function, errors):
        try:
            funcdescr = function_description(function.name)
        except KeyError:
Sylvain's avatar
Sylvain committed
            errors.append('unknown function "%s"' % function.name)
        else:
            try:
                funcdescr.check_nbargs(len(function.children))
            except BadRQLQuery, ex:
                errors.append(str(ex))
            if funcdescr.aggregat:
                if isinstance(function.children[0], Function) and \
Sylvain's avatar
Sylvain committed
                       function.children[0].descr().aggregat:
                    errors.append('can\'t nest aggregat functions')
            if funcdescr.name == 'IN':
                assert function.parent.operator == '='
                if len(function.children) == 1:
                    function.parent.append(function.children[0])
                    function.parent.remove(function)
                else:
                    assert len(function.children) >= 1
    def leave_function(self, node, errors):
        pass
Nicolas Chauvat's avatar
Nicolas Chauvat committed

    def visit_variableref(self, variableref, errors):
        assert len(variableref.children)==0
Sylvain's avatar
Sylvain committed
        assert not variableref.parent is variableref
##         try:
##             assert variableref.variable in variableref.root().defined_vars.values(), \
##                    (variableref.root(), variableref.variable, variableref.root().defined_vars)
##         except AttributeError:
##             raise Exception((variableref.root(), variableref.variable))
Sylvain Thenault's avatar
Sylvain Thenault committed
    def leave_variableref(self, node, errors):
        pass

Nicolas Chauvat's avatar
Nicolas Chauvat committed
    def visit_constant(self, constant, errors):
        assert len(constant.children)==0
Sylvain's avatar
Sylvain committed
        if constant.type == 'etype':
            if constant.relation().r_type != 'is':
                msg ='using an entity type in only allowed with "is" relation'
                errors.append(msg)
            if not constant.value in self.schema:
                errors.append('unknown entity type %s' % constant.value)
                
    def leave_constant(self, node, errors):
        pass 
Sylvain's avatar
Sylvain committed

Sylvain's avatar
Sylvain committed
class RQLSTAnnotator(object):
    """ annotate RQL syntax tree to ease further code generation from it.
    
    If an optional variable is shared among multiple scopes, it's rewritten to
    use identity relation.
    """

    def __init__(self, schema, special_relations=None):
        self.schema = schema
        self.special_relations = special_relations or {}

    def annotate(self, node):
        #assert not node.annotated
        node.annotated = True
        
    def _visit_stmt(self, node):
        for var in node.defined_vars.itervalues():
            var.prepare_annotation()
        for i, term in enumerate(node.selection):
            for func in term.iget_nodes(Function):
                if func.descr().aggregat:
                    node.has_aggregat = True
                    break
Sylvain's avatar
Sylvain committed
            # register the selection column index
Sylvain Thenault's avatar
Sylvain Thenault committed
            for vref in variable_refs(term):
                vref.variable.stinfo['selected'].add(i)
                vref.variable.set_scope(node)
        if node.where is not None:
            node.where.accept(self, node)

    visit_insert = visit_delete = visit_set = _visit_stmt
    
    def visit_union(self, node):
        for select in node.children:
            self.visit_select(select)
            
    def visit_select(self, node):
        if node.with_ is not None:
            for subquery in node.with_:
                self.visit_union(subquery.query)
        self._visit_stmt(node)
Sylvain's avatar
Sylvain committed
    def rewrite_shared_optional(self, exists, var):
        """if variable is shared across multiple scopes, need some tree
        rewriting
        """
        if var.scope is var.stmt:
Sylvain's avatar
Sylvain committed
            # allocate a new variable
            newvar = var.stmt.make_variable()
Sylvain's avatar
Sylvain committed
            for vref in var.references():
Sylvain's avatar
Sylvain committed
                    rel = vref.relation()
                    vref.unregister_reference()
                    newvref = VariableRef(newvar)
                    vref.parent.replace(vref, newvref)
                    # update stinfo structure which may have already been
                    # partially processed
                    if rel in var.stinfo['rhsrelations']:
                        lhs, rhs = rel.get_parts()
                        if vref is rhs.children[0] and \
                               self.schema.rschema(rel.r_type).is_final():
                            update_attrvars(newvar, rel, lhs)
                            lhsvar = getattr(lhs, 'variable', None)
                            var.stinfo['attrvars'].remove( (lhsvar, rel.r_type) )
                            if var.stinfo['attrvar'] is lhsvar:
                                if var.stinfo['attrvars']:
                                    var.stinfo['attrvar'] = iter(var.stinfo['attrvars']).next()
                                else:
                                    var.stinfo['attrvar'] = None
                        var.stinfo['rhsrelations'].remove(rel)
                        newvar.stinfo['rhsrelations'].add(rel)
                    for stinfokey in ('blocsimplification','typerels', 'uidrels',
                                      'relations', 'optrelations'):
                        try:
                            var.stinfo[stinfokey].remove(rel)
                            newvar.stinfo[stinfokey].add(rel)
                        except KeyError:
                            continue
            # shared references
            newvar.stinfo['constnode'] = var.stinfo['constnode']
            if newvar.stmt.solutions: # solutions already computed
                newvar.stinfo['possibletypes'] = var.stinfo['possibletypes']
                for sol in newvar.stmt.solutions:
                    sol[newvar.name] = sol[var.name]
Sylvain's avatar
Sylvain committed
            rel = exists.add_relation(var, 'identity', newvar)
            # we have to force visit of the introduced relation
            self.visit_relation(rel, exists)
            return newvar
        return None
Sylvain's avatar
Sylvain committed
    # tree nodes ##############################################################
    
    def visit_exists(self, node, scope):
        node.children[0].accept(self, node)
        
    def visit_not(self, node, scope):
        node.children[0].accept(self, scope)
        
Sylvain's avatar
Sylvain committed
    def visit_and(self, node, scope):
        node.children[0].accept(self, scope)
        node.children[1].accept(self, scope)
    visit_or = visit_and
        
    def visit_relation(self, relation, scope):
        assert relation.parent, repr(relation)
Sylvain's avatar
Sylvain committed
        lhs, rhs = relation.get_parts()
        # may be a constant once rqlst has been simplified
        lhsvar = getattr(lhs, 'variable', None)
        if not isinstance(lhsvar, Variable):
Sylvain Thenault's avatar
Sylvain Thenault committed
            lhsvar = None
Sylvain's avatar
Sylvain committed
        if relation.is_types_restriction():
            assert rhs.operator == '='
            assert not relation.optional
            if lhsvar is not None:
                lhsvar.stinfo['typerels'].add(relation)
            return
        if relation.optional is not None:
            if not isinstance(exists, Exists):
Sylvain's avatar
Sylvain committed
            if lhsvar is not None:
                if exists is not None:
                    newvar = self.rewrite_shared_optional(exists, lhsvar)
                    if newvar is not None:
                        lhsvar = newvar
Sylvain's avatar
Sylvain committed
                    lhsvar.stinfo['blocsimplification'].add(relation)
Sylvain's avatar
Sylvain committed
                    lhsvar.stinfo['blocsimplification'].add(relation)
                    lhsvar.stinfo['optrelations'].add(relation)
                elif relation.optional == 'left':
                    lhsvar.stinfo['optrelations'].add(relation)
Sylvain's avatar
Sylvain committed
            try:
                rhsvar = rhs.children[0].variable
                if exists is not None:
                    newvar = self.rewrite_shared_optional(exists, rhsvar)
                    if newvar is not None:
                        rhsvar = newvar
                if relation.optional == 'right':
                    rhsvar.stinfo['optrelations'].add(relation)
                elif relation.optional == 'both':
Sylvain's avatar
Sylvain committed
                    rhsvar.stinfo['blocsimplification'].add(relation)
                    rhsvar.stinfo['optrelations'].add(relation)
                elif relation.optional == 'left':
Sylvain's avatar
Sylvain committed
                    rhsvar.stinfo['blocsimplification'].add(relation)
Sylvain's avatar
Sylvain committed
            except AttributeError:
                # may have been rewritten as well
                pass
        rtype = relation.r_type
        try:
            rschema = self.schema.rschema(rtype)
        except KeyError:
            raise BadRQLQuery('no relation %s' % rtype)
Sylvain's avatar
Sylvain committed
        if lhsvar is not None:
            lhsvar.set_scope(scope)
            lhsvar.stinfo['relations'].add(relation)
            if rtype in self.special_relations:
                key = '%srels' % self.special_relations[rtype]
                if key == 'uidrels':
                    constnode = relation.get_variable_parts()[1]
                    if not (relation.operator() != '=' or
                            isinstance(relation.parent, Not)):
                        if isinstance(constnode, Constant):
                            lhsvar.stinfo['constnode'] = constnode
                        lhsvar.stinfo.setdefault(key, set()).add(relation)
                else:
                    lhsvar.stinfo.setdefault(key, set()).add(relation)
Sylvain's avatar
Sylvain committed
            elif rschema.is_final() or rschema.inlined:
                lhsvar.stinfo['blocsimplification'].add(relation)
Sylvain Thenault's avatar
Sylvain Thenault committed
        for vref in variable_refs(rhs):
            var = vref.variable
Sylvain's avatar
Sylvain committed
            var.set_scope(scope)
            var.stinfo['relations'].add(relation)
            var.stinfo['rhsrelations'].add(relation)
Sylvain Thenault's avatar
Sylvain Thenault committed
            if vref is rhs.children[0] and rschema.is_final():
                update_attrvars(var, relation, lhs)

def update_attrvars(var, relation, lhs):
    lhsvar = getattr(lhs, 'variable', None)
    var.stinfo['attrvars'].add( (lhsvar, relation.r_type) )
    # give priority to variable which is not in an EXISTS as
    # "main" attribute variable
    if var.stinfo['attrvar'] is None or not isinstance(relation.scope, Exists):
        var.stinfo['attrvar'] = lhsvar or lhs