author | Sylvain Thénault <sylvain.thenault@logilab.fr> |
Mon, 03 Aug 2009 09:24:08 +0200 | |
changeset 2648 | 4ae7d02ce063 |
parent 2647 | b0a2e779845c |
child 2650 | 18aec79ec3a3 |
permissions | -rw-r--r-- |
0 | 1 |
"""The `ResultSet` class which is returned as result of a rql query |
2 |
||
3 |
:organization: Logilab |
|
1977
606923dff11b
big bunch of copyright / docstring update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1922
diff
changeset
|
4 |
:copyright: 2001-2009 LOGILAB S.A. (Paris, FRANCE), license is LGPL v2. |
0 | 5 |
:contact: http://www.logilab.fr/ -- mailto:contact@logilab.fr |
1977
606923dff11b
big bunch of copyright / docstring update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1922
diff
changeset
|
6 |
:license: GNU Lesser General Public License, v2.1 - http://www.gnu.org/licenses |
0 | 7 |
""" |
8 |
__docformat__ = "restructuredtext en" |
|
9 |
||
10 |
from logilab.common.decorators import cached, clear_cache, copy_cache |
|
11 |
||
12 |
from rql import nodes |
|
13 |
||
14 |
from cubicweb import NotAnEntity |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
15 |
|
0 | 16 |
|
17 |
class ResultSet(object):
    """a result set wraps a RQL query result. This object implements a partial
    list protocol to allow direct use as a list of result rows.

    :type rowcount: int
    :ivar rowcount: number of rows in the result

    :type rows: list
    :ivar rows: list of rows of result

    :type description: list
    :ivar description:
      result's description, using the same structure as the result itself

    :type rql: str or unicode
    :ivar rql: the original RQL query string
    """
|
34 |
def __init__(self, results, rql, args=None, description=(), cachekey=None, |
|
35 |
rqlst=None): |
|
36 |
self.rows = results |
|
37 |
self.rowcount = results and len(results) or 0 |
|
38 |
# original query and arguments |
|
39 |
self.rql = rql |
|
40 |
self.args = args |
|
41 |
self.cachekey = cachekey |
|
42 |
# entity types for each cell (same shape as rows) |
|
43 |
# maybe discarded if specified when the query has been executed |
|
44 |
self.description = description |
|
45 |
# parsed syntax tree |
|
46 |
if rqlst is not None: |
|
47 |
rqlst.schema = None # reset schema in case of pyro transfert |
|
48 |
self._rqlst = rqlst |
|
49 |
# set to (limit, offset) when a result set is limited using the |
|
50 |
# .limit method |
|
51 |
self.limited = None |
|
52 |
# set by the cursor which returned this resultset |
|
53 |
self.vreg = None |
|
54 |
self.req = None |
|
1381
6042f1b342bb
consider kwargs in possible_actions
sylvain.thenault@logilab.fr
parents:
616
diff
changeset
|
55 |
# actions cache |
6042f1b342bb
consider kwargs in possible_actions
sylvain.thenault@logilab.fr
parents:
616
diff
changeset
|
56 |
self._rsetactions = None |
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
57 |
|
0 | 58 |
def __str__(self): |
59 |
if not self.rows: |
|
60 |
return '<empty resultset %s>' % self.rql |
|
61 |
return '<resultset %s (%s rows)>' % (self.rql, len(self.rows)) |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
62 |
|
0 | 63 |
def __repr__(self): |
64 |
if not self.rows: |
|
170
455ff18ef28e
use repr (instead of str) to print rql in __repr__ method of a result set
Stephanie Marcu <stephanie.marcu@logilab.fr>
parents:
0
diff
changeset
|
65 |
return '<empty resultset for %r>' % self.rql |
616
545a7e18c47f
don't display too much rset rows
sylvain.thenault@logilab.fr
parents:
572
diff
changeset
|
66 |
rows = self.rows |
545a7e18c47f
don't display too much rset rows
sylvain.thenault@logilab.fr
parents:
572
diff
changeset
|
67 |
if len(rows) > 10: |
545a7e18c47f
don't display too much rset rows
sylvain.thenault@logilab.fr
parents:
572
diff
changeset
|
68 |
rows = rows[:10] + ['...'] |
0 | 69 |
if not self.description: |
616
545a7e18c47f
don't display too much rset rows
sylvain.thenault@logilab.fr
parents:
572
diff
changeset
|
70 |
return '<resultset %r (%s rows): %s>' % (self.rql, len(self.rows), |
545a7e18c47f
don't display too much rset rows
sylvain.thenault@logilab.fr
parents:
572
diff
changeset
|
71 |
'\n'.join(str(r) for r in rows)) |
545a7e18c47f
don't display too much rset rows
sylvain.thenault@logilab.fr
parents:
572
diff
changeset
|
72 |
return '<resultset %r (%s rows): %s>' % (self.rql, len(self.rows), |
545a7e18c47f
don't display too much rset rows
sylvain.thenault@logilab.fr
parents:
572
diff
changeset
|
73 |
'\n'.join('%s (%s)' % (r, d) |
545a7e18c47f
don't display too much rset rows
sylvain.thenault@logilab.fr
parents:
572
diff
changeset
|
74 |
for r, d in zip(rows, self.description))) |
0 | 75 |
|
1381
6042f1b342bb
consider kwargs in possible_actions
sylvain.thenault@logilab.fr
parents:
616
diff
changeset
|
76 |
def possible_actions(self, **kwargs):
    """return the actions selected by the registry for this result set

    The answer is cached on the result set, one entry per distinct set of
    keyword arguments (the entry for "no argument" is stored under None).
    """
    cache = self._rsetactions
    if cache is None:
        cache = self._rsetactions = {}
    key = None
    if kwargs:
        # sorted so that the key doesn't depend on the arguments order
        key = tuple(sorted(kwargs.items()))
    if key not in cache:
        cache[key] = self.vreg.possible_vobjects('actions', self.req,
                                                 rset=self, **kwargs)
    return cache[key]
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
90 |
|
0 | 91 |
def __len__(self): |
92 |
"""returns the result set's size""" |
|
93 |
return self.rowcount |
|
94 |
||
95 |
def __nonzero__(self): |
|
96 |
return self.rowcount |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
97 |
|
0 | 98 |
def __getitem__(self, i): |
99 |
"""returns the ith element of the result set""" |
|
100 |
return self.rows[i] #ResultSetRow(self.rows[i]) |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
101 |
|
0 | 102 |
def __getslice__(self, i, j): |
103 |
"""returns slice [i:j] of the result set""" |
|
104 |
return self.rows[i:j] |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
105 |
|
0 | 106 |
def __iter__(self): |
107 |
"""Returns an iterator over rows""" |
|
108 |
return iter(self.rows) |
|
109 |
||
110 |
def __add__(self, rset): |
|
111 |
# XXX buggy implementation (.rql and .args attributes at least much |
|
112 |
# probably differ) |
|
113 |
# at least rql could be fixed now that we have union and sub-queries |
|
114 |
# but I tend to think that since we have that, we should not need this |
|
115 |
# method anymore (syt) |
|
116 |
rset = ResultSet(self.rows+rset.rows, self.rql, self.args, |
|
117 |
self.description +rset.description) |
|
118 |
return self.req.decorate_rset(rset) |
|
119 |
||
120 |
def _prepare_copy(self, rows, descr): |
|
121 |
rset = ResultSet(rows, self.rql, self.args, descr) |
|
122 |
return self.req.decorate_rset(rset) |
|
123 |
||
124 |
def transformed_rset(self, transformcb):
    """return a new result set whose rows and descriptions are computed
    from the ones of this result set by `transformcb`

    :type transformcb: callable(row, desc)
    :param transformcb:
      a callable which should take a row and its type description as
      parameters, and return the transformed row and type description.
      Rows for which the returned description is false (None for
      instance) are skipped.

    :rtype: `ResultSet`
    """
    newrows, newdescr = [], []
    # the copy holds references to both lists, which are filled below
    result = self._prepare_copy(newrows, newdescr)
    for row, desc in zip(self.rows, self.description):
        transformed, tdesc = transformcb(row, desc)
        if not tdesc:
            continue
        newrows.append(transformed)
        newdescr.append(tdesc)
    result.rowcount = len(newrows)
    return result
|
147 |
||
148 |
def filtered_rset(self, filtercb, col=0):
    """return a new result set holding only the rows accepted by `filtercb`

    :type filtercb: callable(entity)
    :param filtercb:
      a callable which is given the entity found in column `col` of each
      row, and should return a false value if the row has to be skipped

    :type col: int
    :param col: index of the column where entities are taken

    :rtype: `ResultSet`
    """
    kept_rows, kept_descr = [], []
    # the copy holds references to both lists, which are filled below
    result = self._prepare_copy(kept_rows, kept_descr)
    for index in range(len(self)):
        if filtercb(self.get_entity(index, col)):
            kept_rows.append(self.rows[index])
            kept_descr.append(self.description[index])
    result.rowcount = len(kept_rows)
    return result
|
170 |
||
171 |
||
172 |
def sorted_rset(self, keyfunc, reverse=False, col=0):
    """sorts the result set according to a given keyfunc

    :type keyfunc: callable(entity)
    :param keyfunc:
      a callable which should take an entity as argument and return
      the value used to compare and sort

    :type reverse: bool
    :param reverse: if the result should be reversed

    :type col: int
    :param col: the column index. if col = -1, the whole row are used

    When `col` is a column index, rows holding None in that column (outer
    join) have no entity to give to `keyfunc` and are left out of the
    returned result set.

    :rtype: `ResultSet`
    """
    rows, descr = [], []
    # the copy holds references to both lists, which are filled below
    rset = self._prepare_copy(rows, descr)
    if col >= 0:
        # pair each entity with the index of the row it comes from:
        # numbering the entities themselves gives wrong indexes as soon
        # as a row with a None cell has been skipped
        candidates = [(index, self.get_entity(index, col))
                      for index in range(len(self))
                      if self.rows[index][col] is not None]
    else:
        candidates = list(enumerate(self))
    # the key function indexes the pair itself rather than unpacking it in
    # its signature, which isn't supported by every python version
    candidates.sort(key=lambda pair: keyfunc(pair[1]), reverse=reverse)
    for index, _ in candidates:
        rows.append(self.rows[index])
        descr.append(self.description[index])
    rset.rowcount = len(rows)
    return rset
|
201 |
||
202 |
def split_rset(self, keyfunc=None, col=0, return_dict=False):
    """split the result set in several result sets, grouping rows which
    have the same key

    :type keyfunc: callable(entity or FinalType)
    :param keyfunc:
      a callable which should take a value of the rset in argument and
      return the value used to group the value. If not defined, the raw
      value of the specified column is used.

    :type col: int
    :param col: the column index. if col = -1, the whole row is used

    :type return_dict: Boolean
    :param return_dict: if true, the function returns a mapping
                        (key -> rset) instead of a list of rset

    :rtype: list of `ResultSet` or mapping of `ResultSet`, the list being
            ordered according to the first row seen for each key
    """
    groups = []
    groups_by_key = {}
    for idx, line in enumerate(self):
        if col < 0:
            key = line
        else:
            try:
                key = self.get_entity(idx, col)
            except NotAnEntity:
                # not an entity, group on the raw cell value
                key = line[col]
        if keyfunc is not None:
            key = keyfunc(key)
        try:
            group = groups_by_key[key]
        except KeyError:
            # first row seen for this key
            group = self._prepare_copy([], [])
            groups_by_key[key] = group
            groups.append(group)
        group.rows.append(self.rows[idx])
        group.description.append(self.description[idx])
    for group in groups:
        group.rowcount = len(group.rows)
    if return_dict:
        return groups_by_key
    return groups
|
251 |
||
252 |
def limit(self, limit, offset=0, inplace=False):
    """limit the result set to the given number of rows, optionally
    starting from an index different from 0

    :type limit: int
    :param limit: the maximum number of results

    :type offset: int
    :param offset: the offset index

    :type inplace: bool
    :param inplace:
      if true, the result set is modified in place, else a new result set
      is returned and the original is left unmodified

    :rtype: `ResultSet`
    :return:
      the limited result set, whose `limited` attribute is set to
      (limit, offset)
    """
    stop = limit + offset
    rows = self.rows[offset:stop]
    descr = self.description[offset:stop]
    if not inplace:
        rset = self._prepare_copy(rows, descr)
        if not offset:
            # row indexes are unchanged, built entity caches can be copied
            copy_cache(rset, 'get_entity', self)
        rset.limited = (limit, offset)
        return rset
    self.rows = rows
    self.description = descr
    self.rowcount = len(rows)
    clear_cache(self, 'description_struct')
    if offset:
        # row indexes have been shifted
        clear_cache(self, 'get_entity')
    # entities of the request's cache which are bound to this result set
    # now hold a wrong row index: fix it for those which are still in the
    # result set, drop the others from the cache
    req = self.req
    for entity in req.cached_entities():
        if entity.rset is not self:
            continue
        if offset <= entity.row < stop:
            entity.row -= offset
        else:
            req.drop_entity_cache(entity.eid)
    self.limited = (limit, offset)
    return self
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
294 |
|
0 | 295 |
def printable_rql(self, encoded=False):
    """return the rql query from which this result set comes as a string,
    with arguments substituted

    :type encoded: bool
    :param encoded:
      if true, return a string encoded using the request's encoding, else
      return an unicode string
    """
    encoding = self.req.encoding
    rqlstr = self.syntax_tree().as_string(encoding, self.args)
    # as_string may give back either an encoded or an unicode string (this
    # sounds like a bug in as_string), hence both cases have to be handled
    is_unicode = isinstance(rqlstr, unicode)
    if encoded:
        if is_unicode:
            return rqlstr.encode(encoding)
        return rqlstr
    if is_unicode:
        return rqlstr
    return unicode(rqlstr, encoding)
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
310 |
|
0 | 311 |
# client helper methods ################################################### |
312 |
||
313 |
def entities(self, col=0):
    """iterate on the entities whose eid is in column `col` of the result
    set, skipping rows holding None in that column
    """
    for index in range(len(self)):
        if self.rows[index][col] is None:
            # None values may be found in case of outer join (or
            # aggregate on eid hacks)
            continue
        yield self.get_entity(index, col)
|
320 |
||
321 |
@cached
def get_entity(self, row, col=None):
    """return the partially initialized Entity instance for the eid found
    at the given position of the result set

    WARNING: due to the cache wrapping this function, you should NEVER
    give row (or col) as a named parameter

    :type row,col: int, int
    :param row,col:
      row and col numbers localizing the entity among the result's table.
      Omitting `col` is deprecated (0 is used in such case).

    :raise NotAnEntity:
      if the type found in the description for that cell is a final type
      or is unknown to the schema

    :return: the partially initialized `Entity` instance
    """
    if col is None:
        import warnings
        warnings.warn('col parameter will become mandatory in future version',
                      DeprecationWarning, stacklevel=3)
        col = 0
    etype = self.description[row][col]
    try:
        final = self.vreg.schema.eschema(etype).is_final()
    except KeyError:
        raise NotAnEntity(etype)
    if final:
        raise NotAnEntity(etype)
    return self._build_entity(row, col)
|
349 |
||
2647
b0a2e779845c
enable server side entity caching, 25% speedup on codenaf insertion. ALL CW TESTS OK
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
2381
diff
changeset
|
350 |
def _build_entity(self, row, col):
    """internal method to get a single entity, returns a
    partially initialized Entity instance.

    partially means that only attributes selected in the RQL
    query will be directly assigned to the entity.

    If the request's entity cache already knows the eid, the cached entity
    is returned without being completed from this result set.

    :type row,col: int, int
    :param row,col:
      row and col numbers localizing the entity among the result's table

    :raise AssertionError:
      if the result set has no request, or if the cell holds None

    :return: the partially initialized `Entity` instance
    """
    req = self.req
    if req is None:
        raise AssertionError('dont call get_entity with no req on the result set')
    rowvalues = self.rows[row]
    eid = rowvalues[col]
    assert eid is not None
    # return cached entity if exists. This also avoids potential recursion
    # XXX should we consider updating a cached entity with possible
    # new attributes found in this resultset ?
    try:
        entity = req.entity_cache(eid)
        if entity.rset is None:
            # entity has no rset set, this means entity has been cached by
            # the repository (req is a repository session) which had no rset
            # info. Add id.
            entity.rset = self
            entity.row = row
            entity.col = col
        return entity
    except KeyError:
        # not in the request's cache yet, build it below
        pass
    # build entity instance
    etype = self.description[row][col]
    entity = self.vreg.etype_class(etype)(req, self, row, col)
    entity.set_eid(eid)
    # cache entity (done before the completion below, which may call
    # _build_entity again for other columns of the same row)
    req.set_entity_cache(entity)
    eschema = entity.e_schema
    # try to complete the entity if there are some additional columns
    if len(rowvalues) > 1:
        rqlst = self.syntax_tree()
        if rqlst.TYPE == 'select':
            # UNION query, find the subquery from which this entity has been
            # found
            rqlst = rqlst.locate_subquery(col, etype, self.args)
        # take care, due to outer join support, we may find None
        # values for non final relation
        for i, attr, x in attr_desc_iterator(rqlst, col):
            # i: column index, attr: relation type, x: 'subject' or 'object'
            # (role of the entity in the relation)
            if x == 'subject':
                rschema = eschema.subject_relation(attr)
                if rschema.is_final():
                    # attribute: directly set the value on the entity
                    entity[attr] = rowvalues[i]
                    continue
                tetype = rschema.objects(etype)[0]
                card = rschema.rproperty(etype, tetype, 'cardinality')[0]
            else:
                rschema = eschema.object_relation(attr)
                tetype = rschema.subjects(etype)[0]
                card = rschema.rproperty(tetype, etype, 'cardinality')[1]
            # only keep value if it can't be multivalued
            if card in '1?':
                if rowvalues[i] is None:
                    # no related entity: cache an empty result set for
                    # that relation
                    if x == 'subject':
                        rql = 'Any Y WHERE X %s Y, X eid %s'
                    else:
                        rql = 'Any Y WHERE Y %s X, X eid %s'
                    rrset = ResultSet([], rql % (attr, entity.eid))
                    req.decorate_rset(rrset)
                else:
                    # cache the result set given by the related entity
                    # itself, built from the same row
                    rrset = self._build_entity(row, i).as_rset()
                entity.set_related_cache(attr, x, rrset)
    return entity
|
425 |
||
426 |
@cached
def syntax_tree(self):
    """return the syntax tree of the query from which this result set comes

    :rtype: rql.stmts.Statement
    :return: the RQL syntax tree of the originating query
    """
    vreg = self.vreg
    if not self._rqlst:
        # no tree given with the results, parse the query string
        return vreg.parse(self.req, self.rql, self.args)
    tree = self._rqlst.copy()
    # the schema has been unset from the syntax tree to avoid transport
    # overhead when pyro is used, set it back
    tree.schema = vreg.schema
    vreg.rqlhelper.annotate(tree)
    return tree
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
442 |
|
0 | 443 |
@cached
def column_types(self, col):
    """return the set of different types found in the column with the
    given index

    :type col: int
    :param col: the index of the desired column

    :rtype: frozenset
    :return: the different types found in the column's description
    """
    types = set()
    for struct in self.description_struct():
        # the last item of each struct is the row description
        types.add(struct[-1][col])
    return frozenset(types)
|
455 |
||
456 |
@cached
def description_struct(self):
    """return a list describing each sequence of consecutive rows sharing
    the same description, as [first index, last index, description]
    items, e.g. :
    [[0, 4, ('Bug',)]]
    [[0, 4, ('Bug',)], [5, 8, ('Story',)]]
    [[0, 3, ('Project', 'Version',)]]
    """
    structs = []
    current = None
    previous = None
    for index, descr in enumerate(self.description):
        if descr != previous:
            if previous is not None:
                # close the sequence which ended on the previous row
                current[1] = index - 1
            current = [index, None, descr]
            structs.append(current)
            previous = descr
    if previous is not None:
        # close the last sequence
        current[1] = index
    return structs
|
475 |
||
476 |
@cached
def related_entity(self, row, col):
    """try to get the related entity to extract format information if any

    :type row,col: int, int
    :param row,col: row and col numbers localizing the cell in the result

    :return:
      a 2-uple (entity, relation type) where the entity is taken on the
      same row, in the column of the variable found on the left of the
      main relation of the variable selected at `col`; (None, None) if
      there is no such entity
    """
    locate_query_col = col
    rqlst = self.syntax_tree()
    etype = self.description[row][col]
    if self.vreg.schema.eschema(etype).is_final():
        # final type, find a better one to locate the correct subquery
        # (ambiguous if possible)
        for i in xrange(len(rqlst.children[0].selection)):
            if i == col:
                continue
            coletype = self.description[row][i]
            if coletype is None:
                continue
            if not self.vreg.schema.eschema(coletype).is_final():
                etype = coletype
                locate_query_col = i
                # stop on the first non final column having several
                # possible types, else go on and keep the last one found
                if len(self.column_types(i)) > 1:
                    break
    # UNION query, find the subquery from which this entity has been found
    select = rqlst.locate_subquery(locate_query_col, etype, self.args)
    try:
        myvar = select.selection[col].variable
    except AttributeError:
        # not a variable
        return None, None
    rel = myvar.main_relation()
    if rel is not None:
        index = rel.children[0].variable.selected_index()
        # the variable has to be selected and the matching cell has to hold
        # a true value (it may be None in case of optional relation)
        if index is not None and self.rows[row][index]:
            return self.get_entity(row, index), rel.r_type
    return None, None
|
509 |
||
510 |
@cached
def searched_text(self):
    """return the text searched by the query in case of full-text search

    :return:
      the value of the right hand side of the first `has_text` relation
      found in the syntax tree, evaluated using the query's arguments, or
      `None` if the query is not a full-text query
    """
    for relation in self.syntax_tree().iget_nodes(nodes.Relation):
        if relation.r_type != 'has_text':
            continue
        _lhs, rhs = relation.get_variable_parts()
        return rhs.eval(self.args)
    return None
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
1477
diff
changeset
|
523 |
|
0 | 524 |
|
525 |
def attr_desc_iterator(rqlst, index=0):
    """return an iterator on 3-uples (index, relation type, role)
    localizing the selected terms which are linked by a relation to the
    main term of a result's row

    :type rqlst: rql.stmts.Select
    :param rqlst: the RQL syntax tree to describe

    :type index: int
    :param index: index of the main term in the selection

    :return:
      a generator on (index, relation type, role) where index is the index
      of a selected term other than the main one, and role is 'subject'
      when the main term is on the left of the relation and that term on
      its right, 'object' in the opposite case
    """
    selection = rqlst.selection
    main = selection[index]
    for i, term in enumerate(selection):
        if i == index:
            continue
        # XXX rewritten const
        # take the first variable reference found in the term, looking
        # into it using iget_nodes for (hack) case where we have things
        # like MAX(V)
        firstref = None
        for firstref in term.iget_nodes(nodes.VariableRef):
            break
        if firstref is None:
            # no variable in this term
            continue
        for ref in firstref.variable.references():
            rel = ref.relation()
            if rel is None or rel.is_types_restriction():
                continue
            lhs, rhs = rel.get_variable_parts()
            if main.is_equivalent(lhs):
                if rhs.is_equivalent(term):
                    yield (i, rel.r_type, 'subject')
            elif main.is_equivalent(rhs):
                if lhs.is_equivalent(term):
                    yield (i, rel.r_type, 'object')