author | Nicolas Chauvat <nicolas.chauvat@logilab.fr> |
Thu, 23 Jul 2009 13:03:50 +0200 | |
changeset 2433 | 1d46c016a564 |
parent 2431 | 93c061eac647 |
child 2435 | 85be7a811afe |
permissions | -rw-r--r-- |
2422
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
1 |
"""SPARQL -> RQL translator |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
2 |
|
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
3 |
:organization: Logilab |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
4 |
:copyright: 2009 LOGILAB S.A. (Paris, FRANCE), license is LGPL v2. |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
5 |
:contact: http://www.logilab.fr/ -- mailto:contact@logilab.fr |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
6 |
:license: GNU Lesser General Public License, v2.1 - http://www.gnu.org/licenses |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
7 |
""" |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
8 |
from logilab.common import make_domains |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
9 |
from rql import TypeResolverException |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
10 |
from fyzz.yappsparser import parse |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
11 |
from fyzz import ast |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
12 |
|
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
13 |
from cubicweb.xy import xy |
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
14 |
|
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
15 |
|
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
16 |
class UnsupportedQuery(Exception):
    """raised when a sparql query can not be translated into a RQL query"""
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
17 |
|
2431
93c061eac647
sparql support for limit/offset/orderby
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
2430
diff
changeset
|
18 |
def order_limit_offset(sparqlst):
    """return the ORDERBY / LIMIT / OFFSET part of a RQL query, built from the
    `orderby`, `limit` and `offset` attributes of the given sparql syntax tree

    Each clause is emitted only when the matching attribute is true-ish, and
    each emitted clause starts with a single space so that the result can be
    appended directly after the selection. Variable names and sort directions
    are upper-cased.

    :return: the clauses as a string, '' when none applies
    """
    clauses = []
    if sparqlst.orderby:
        terms = []
        for var, direction in sparqlst.orderby:
            terms.append('%s %s' % (var.name.upper(), direction.upper()))
        clauses.append(' ORDERBY %s' % ', '.join(terms))
    if sparqlst.limit:
        clauses.append(' LIMIT %s' % sparqlst.limit)
    if sparqlst.offset:
        clauses.append(' OFFSET %s' % sparqlst.offset)
    return ''.join(clauses)
2430
7d9ed6c740ec
cleanup/document/refactor
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
2427
diff
changeset
|
29 |
|
2422
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
30 |
class QueryInfo(object):
    """wrapper class containing necessary information to generate a RQL query
    from a sparql syntax tree

    Attributes:

    * `sparqlst`, the sparql syntax tree given to the constructor
    * `selection`, list of upper-cased names of the selected variables
    * `possible_types`, dictionary mapping a RQL variable name to the set of
      entity types still allowed for it
    * `infer_types_info`, list of `(yams_predicates, subjvar, obj)` tuples
      where `yams_predicates` is a list of
      `(subject etype, rtype, object etype)` 3-uples (etype being '*' when
      not specified), `subjvar` the RQL name of the subject variable and
      `obj` the sparql object node
    * `union_params`, list of `(yams_predicates, subjvar, objvar)` tuples for
      triples matching several relation types, hence requiring a UNION
    * `restrictions`, list of RQL restrictions shared by every sub-query
    """

    def __init__(self, sparqlst):
        self.sparqlst = sparqlst
        if sparqlst.selected == ['*']:
            # `variables` holds plain names while `selected` holds nodes
            # exposing a `name` attribute
            self.selection = [var.upper() for var in sparqlst.variables]
        else:
            self.selection = [var.name.upper() for var in sparqlst.selected]
        self.possible_types = {}
        self.infer_types_info = []
        self.union_params = []
        self.restrictions = []

    def finalize(self):
        """return corresponding rql query

        Variables left with exactly one possible type get a `X is Type`
        restriction appended to `self.restrictions`. When some triple maps to
        several relation types, one sub-query is generated per combination
        and sub-queries are joined using UNION.
        """
        # .items() and tuple unpacking work with both python 2 and python 3
        for varname, ptypes in self.possible_types.items():
            if len(ptypes) == 1:
                ptype, = ptypes
                self.restrictions.append('%s is %s' % (varname, ptype))
        # each item of `unions` is the flat list of restrictions specific to
        # one sub-query
        unions = []
        for releq, subjvar, objvar in self.union_params:
            thisunions = []
            for st, rt, ot in releq:
                restrs = ['%s %s %s' % (subjvar, rt, objvar)]
                if st != '*':
                    restrs.append('%s is %s' % (subjvar, st))
                if ot != '*':
                    restrs.append('%s is %s' % (objvar, ot))
                thisunions.append(restrs)
            if not unions:
                unions = thisunions
            else:
                # cartesian product of the alternatives seen so far with the
                # alternatives of this triple. Lists are concatenated so that
                # each combination stays a flat list of strings (pairing them
                # into tuples of lists would make the join below fail)
                unions = [previous + current
                          for current in thisunions for previous in unions]
        selection = 'Any ' + ', '.join(self.selection)
        sparqlst = self.sparqlst
        if sparqlst.distinct:
            selection = 'DISTINCT ' + selection
        if not unions:
            return '%s%s WHERE %s' % (selection, order_limit_offset(sparqlst),
                                      ', '.join(self.restrictions))
        # join shared and specific restrictions at once, so that there is no
        # dangling comma when there are no shared restrictions
        rqls = ['(%s WHERE %s)' % (selection,
                                   ', '.join(self.restrictions + unionrestrs))
                for unionrestrs in unions]
        rql = ' UNION '.join(rqls)
        if sparqlst.orderby or sparqlst.limit or sparqlst.offset:
            # sort / limit the whole union by wrapping it into a sub-query
            rql = '%s%s WITH %s BEING (%s)' % (
                selection, order_limit_offset(sparqlst),
                ', '.join(self.selection), rql)
        return rql

    def set_possible_types(self, var, varpossibletypes):
        """set/restrict possible types for the given variable.

        :return: True if something changed, else false.
        :raise: TypeResolverException if no more type allowed
        """
        varpossibletypes = set(varpossibletypes)
        try:
            ctypes = self.possible_types[var]
        except KeyError:
            # first information about this variable
            self.possible_types[var] = varpossibletypes
            return True
        nbctypes = len(ctypes)
        # in-place intersection: updates the set stored in possible_types
        ctypes &= varpossibletypes
        if not ctypes:
            raise TypeResolverException()
        return len(ctypes) != nbctypes

    def infer_types(self):
        """restrict possible types of variables and candidate predicates of
        each entry of `infer_types_info` until nothing changes, then turn each
        entry into either a restriction (a single relation type is left) or
        an union parameter (several relation types are left)

        :raise: TypeResolverException if no predicate is left for a triple or
          no type is left for a variable
        """
        # XXX should use something similar to rql.analyze for proper type inference
        modified = True
        # loop to infer types until nothing changed
        while modified:
            modified = False
            for index, info in enumerate(self.infer_types_info):
                yams_predicates, subjvar, obj = info
                nbchoices = len(yams_predicates)
                # get possible types for the subject variable, according to the
                # current predicate
                svptypes = set(s for s, r, o in yams_predicates)
                if '*' not in svptypes:
                    if self.set_possible_types(subjvar, svptypes):
                        modified = True
                # restrict predicates according to allowed subject var types
                if subjvar in self.possible_types:
                    yams_predicates = [(s, r, o) for s, r, o in yams_predicates
                                       if s == '*' or s in self.possible_types[subjvar]]
                if isinstance(obj, ast.SparqlVar):
                    # make a valid rql var name
                    objvar = obj.name.upper()
                    # get possible types for the object variable, according to
                    # the current predicate
                    ovptypes = set(o for s, r, o in yams_predicates)
                    if '*' not in ovptypes:
                        if self.set_possible_types(objvar, ovptypes):
                            modified = True
                    # restrict predicates according to allowed object var types
                    if objvar in self.possible_types:
                        yams_predicates = [(s, r, o) for s, r, o in yams_predicates
                                           if o == '*' or o in self.possible_types[objvar]]
                # ensure this still make sense
                if not yams_predicates:
                    raise TypeResolverException()
                if len(yams_predicates) != nbchoices:
                    # store the restricted list back: without this the same
                    # filtering is detected as a change on every pass (the
                    # loop never ends) and the code below works on the
                    # unrestricted predicates. A new tuple is stored rather
                    # than modifying the original list in place, since that
                    # list was built outside of this class
                    self.infer_types_info[index] = (yams_predicates, subjvar, obj)
                    modified = True
        # now, for each predicate
        for yams_predicates, subjvar, obj in self.infer_types_info:
            objvar = obj.name.upper()
            rtype = yams_predicates[0][1]
            for s, r, o in yams_predicates[1:]:
                if r != rtype:
                    # if there are several yams relation type equivalences, we
                    # will have to generate several unioned rql queries
                    self.union_params.append((yams_predicates, subjvar, objvar))
                    break
            else:
                # else we can simply add it to base rql restrictions
                self.restrictions.append('%s %s %s' % (subjvar, rtype, objvar))
2422
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
147 |
|
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
148 |
|
96da7dc42eb5
quick and dirty support from simple sparql queries + base ui
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
diff
changeset
|
149 |
class Sparql2rqlTranslator(object):
    """translate sparql 'select' queries into the information necessary to
    generate the equivalent RQL query
    """

    def __init__(self, yschema):
        # kept for later use, not read by `translate`
        self.yschema = yschema

    def translate(self, sparql):
        """parse the given sparql query string and return a `QueryInfo`
        instance on which types have been inferred

        Only 'select' queries whose triples all have a variable as subject
        are supported. The special `a` predicate requires a tuple as object,
        any other predicate must be a tuple and requires a variable as
        object.

        :return: the `QueryInfo` instance built from the query
        :raise: UnsupportedQuery if the query uses an unsupported construct
        """
        sparqlst = parse(sparql)
        if sparqlst.type != 'select':
            raise UnsupportedQuery()
        qi = QueryInfo(sparqlst)
        for subj, predicate, obj in sparqlst.where:
            if not isinstance(subj, ast.SparqlVar):
                raise UnsupportedQuery()
            # make a valid rql var name
            subjvar = subj.name.upper()
            if predicate == ('', 'a'):
                # special 'is' relation
                if not isinstance(obj, tuple):
                    raise UnsupportedQuery()
                # restrict possible types for the subject variable
                qi.set_possible_types(
                    subjvar, xy.yeq(':'.join(obj), isentity=True))
            else:
                # 'regular' relation (eg not 'is')
                if not isinstance(predicate, tuple):
                    raise UnsupportedQuery()
                # list of 3-uple
                #   (yams etype (subject), yams rtype, yams etype (object))
                # where subject / object entity type may '*' if not specified
                yams_predicates = xy.yeq(':'.join(predicate))
                qi.infer_types_info.append((yams_predicates, subjvar, obj))
                # checked after the predicate lookup, so that an error raised
                # by the lookup still takes precedence
                if not isinstance(obj, ast.SparqlVar):
                    raise UnsupportedQuery()
        qi.infer_types()
        return qi