author | Christophe de Vienne <christophe@unlish.com> |
Tue, 02 Sep 2014 10:30:28 +0200 | |
changeset 9941 | 8dc1c96d29f1 |
parent 9940 | 292f786009ba |
child 9942 | 4b99196102f0 |
permissions | -rw-r--r-- |
7879
9aae456abab5
[pylint] fix pylint detected errors and tweak it so that pylint -E will be much less verbose next time (+ update some copyrights on the way)
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
5426
diff
changeset
|
1 |
# copyright 2003-2011 LOGILAB S.A. (Paris, FRANCE), all rights reserved. |
5421
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
2 |
# contact http://www.logilab.fr/ -- mailto:contact@logilab.fr |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
3 |
# |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
4 |
# This file is part of CubicWeb. |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
5 |
# |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
6 |
# CubicWeb is free software: you can redistribute it and/or modify it under the |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
7 |
# terms of the GNU Lesser General Public License as published by the Free |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
8 |
# Software Foundation, either version 2.1 of the License, or (at your option) |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
9 |
# any later version. |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
10 |
# |
5424
8ecbcbff9777
replace logilab-common by CubicWeb in disclaimer
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
5421
diff
changeset
|
11 |
# CubicWeb is distributed in the hope that it will be useful, but WITHOUT |
5421
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
12 |
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
13 |
# FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
14 |
# details. |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
15 |
# |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
16 |
# You should have received a copy of the GNU Lesser General Public License along |
8167de96c523
proper licensing information (LGPL-2.1). Hope I get it right this time.
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
4212
diff
changeset
|
17 |
# with CubicWeb. If not, see <http://www.gnu.org/licenses/>. |
0 | 18 |
"""WSGI request adapter for cubicweb |
19 |
||
20 |
NOTE: each docstring tagged with ``COME FROM DJANGO`` means that |
|
21 |
the code has been taken (or adapted) from Djanco source code : |
|
22 |
http://www.djangoproject.com/ |
|
23 |
||
24 |
""" |
|
25 |
||
26 |
__docformat__ = "restructuredtext en" |
|
27 |
||
28 |
from StringIO import StringIO |
|
29 |
from urllib import quote |
|
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
30 |
from urlparse import parse_qs |
0 | 31 |
|
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
32 |
from cubicweb.multipart import copy_file, parse_form_data |
0 | 33 |
from cubicweb.web.request import CubicWebRequestBase |
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
34 |
from cubicweb.wsgi import pformat, normalize_header |
0 | 35 |
|
36 |
||
37 |
class CubicWebWsgiRequest(CubicWebRequestBase): |
|
8752
e19f4bba89cd
Add CubicWebRequestBase.content (closes #2742453)
Julien Cristau <julien.cristau@logilab.fr>
parents:
8316
diff
changeset
|
38 |
"""most of this code COMES FROM DJANGO |
0 | 39 |
""" |
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
0
diff
changeset
|
40 |
|
8309
48ef505aa9f9
[request] gather all base_url logic in a single place (closes #2200756)
Pierre-Yves David <pierre-yves.david@logilab.fr>
parents:
7879
diff
changeset
|
41 |
def __init__(self, environ, vreg): |
0 | 42 |
self.environ = environ |
43 |
self.path = environ['PATH_INFO'] |
|
44 |
self.method = environ['REQUEST_METHOD'].upper() |
|
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
45 |
|
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
46 |
# content_length "may be empty or absent" |
9563
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
47 |
try: |
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
48 |
length = int(environ['CONTENT_LENGTH']) |
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
49 |
except (KeyError, ValueError): |
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
50 |
length = 0 |
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
51 |
# wsgi.input is not seekable, so copy the request contents to a temporary file |
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
52 |
if length < 100000: |
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
53 |
self.content = StringIO() |
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
54 |
else: |
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
55 |
self.content = tempfile.TemporaryFile() |
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
56 |
copy_file(environ['wsgi.input'], self.content, maxread=length) |
9563
48f0ff3e2a32
[wsgi] make sure request.content is available for consumption
Julien Cristau <julien.cristau@logilab.fr>
parents:
8752
diff
changeset
|
57 |
self.content.seek(0, 0) |
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
58 |
environ['wsgi.input'] = self.content |
8314
cfd6ab461849
[Web-Request] Use rich header (closes #2204164)
Pierre-Yves David <pierre-yves.david@logilab.fr>
parents:
8309
diff
changeset
|
59 |
|
cfd6ab461849
[Web-Request] Use rich header (closes #2204164)
Pierre-Yves David <pierre-yves.david@logilab.fr>
parents:
8309
diff
changeset
|
60 |
headers_in = dict((normalize_header(k[5:]), v) for k, v in self.environ.items() |
cfd6ab461849
[Web-Request] Use rich header (closes #2204164)
Pierre-Yves David <pierre-yves.david@logilab.fr>
parents:
8309
diff
changeset
|
61 |
if k.startswith('HTTP_')) |
9939
46a8ed48636f
[wsgi] Honor the 'CONTENT_TYPE' wsgi variable
Christophe de Vienne <christophe@unlish.com>
parents:
9735
diff
changeset
|
62 |
if 'CONTENT_TYPE' in environ: |
46a8ed48636f
[wsgi] Honor the 'CONTENT_TYPE' wsgi variable
Christophe de Vienne <christophe@unlish.com>
parents:
9735
diff
changeset
|
63 |
headers_in['Content-Type'] = environ['CONTENT_TYPE'] |
9941
8dc1c96d29f1
[wsgi] Fix https detection
Christophe de Vienne <christophe@unlish.com>
parents:
9940
diff
changeset
|
64 |
https = environ["wsgi.url_scheme"] == 'https' |
8dc1c96d29f1
[wsgi] Fix https detection
Christophe de Vienne <christophe@unlish.com>
parents:
9940
diff
changeset
|
65 |
if self.path.startswith('/https/'): |
8dc1c96d29f1
[wsgi] Fix https detection
Christophe de Vienne <christophe@unlish.com>
parents:
9940
diff
changeset
|
66 |
self.path = self.path[6:] |
8dc1c96d29f1
[wsgi] Fix https detection
Christophe de Vienne <christophe@unlish.com>
parents:
9940
diff
changeset
|
67 |
self.environ['PATH_INFO'] = self.path |
8dc1c96d29f1
[wsgi] Fix https detection
Christophe de Vienne <christophe@unlish.com>
parents:
9940
diff
changeset
|
68 |
https = True |
8dc1c96d29f1
[wsgi] Fix https detection
Christophe de Vienne <christophe@unlish.com>
parents:
9940
diff
changeset
|
69 |
|
0 | 70 |
post, files = self.get_posted_data() |
8314
cfd6ab461849
[Web-Request] Use rich header (closes #2204164)
Pierre-Yves David <pierre-yves.david@logilab.fr>
parents:
8309
diff
changeset
|
71 |
|
cfd6ab461849
[Web-Request] Use rich header (closes #2204164)
Pierre-Yves David <pierre-yves.david@logilab.fr>
parents:
8309
diff
changeset
|
72 |
super(CubicWebWsgiRequest, self).__init__(vreg, https, post, |
cfd6ab461849
[Web-Request] Use rich header (closes #2204164)
Pierre-Yves David <pierre-yves.david@logilab.fr>
parents:
8309
diff
changeset
|
73 |
headers= headers_in) |
9940
292f786009ba
[wsgi] Re-set the request content after calling the inherited constructor.
Christophe de Vienne <christophe@unlish.com>
parents:
9939
diff
changeset
|
74 |
self.content = environ['wsgi.input'] |
0 | 75 |
if files is not None: |
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
76 |
for key, part in files.iteritems(): |
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
77 |
name = None |
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
78 |
if part.filename is not None: |
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
79 |
name = unicode(part.filename, self.encoding) |
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
80 |
self.form[key] = (name, part.file) |
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
0
diff
changeset
|
81 |
|
0 | 82 |
def __repr__(self): |
83 |
# Since this is called as part of error handling, we need to be very |
|
84 |
# robust against potentially malformed input. |
|
85 |
form = pformat(self.form) |
|
86 |
meta = pformat(self.environ) |
|
87 |
return '<CubicWebWsgiRequest\FORM:%s,\nMETA:%s>' % \ |
|
88 |
(form, meta) |
|
89 |
||
90 |
## cubicweb request interface ################################################ |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
0
diff
changeset
|
91 |
|
0 | 92 |
def http_method(self): |
93 |
"""returns 'POST', 'GET', 'HEAD', etc.""" |
|
94 |
return self.method |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
0
diff
changeset
|
95 |
|
0 | 96 |
def relative_path(self, includeparams=True): |
97 |
"""return the normalized path of the request (ie at least relative |
|
2476
1294a6bdf3bf
application -> instance where it makes sense
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
1977
diff
changeset
|
98 |
to the instance's root, but some other normalization may be needed |
0 | 99 |
so that the returned path may be used to compare to generated urls |
100 |
||
101 |
:param includeparams: |
|
102 |
boolean indicating if GET form parameters should be kept in the path |
|
103 |
""" |
|
104 |
path = self.environ['PATH_INFO'] |
|
105 |
path = path[1:] # remove leading '/' |
|
106 |
if includeparams: |
|
107 |
qs = self.environ.get('QUERY_STRING') |
|
108 |
if qs: |
|
109 |
return '%s?%s' % (path, qs) |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
0
diff
changeset
|
110 |
|
0 | 111 |
return path |
112 |
||
113 |
## wsgi request helpers ################################################### |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
0
diff
changeset
|
114 |
|
2476
1294a6bdf3bf
application -> instance where it makes sense
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
1977
diff
changeset
|
115 |
def instance_uri(self): |
1294a6bdf3bf
application -> instance where it makes sense
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
1977
diff
changeset
|
116 |
"""Return the instance's base URI (no PATH_INFO or QUERY_STRING) |
0 | 117 |
|
2476
1294a6bdf3bf
application -> instance where it makes sense
Sylvain Thénault <sylvain.thenault@logilab.fr>
parents:
1977
diff
changeset
|
118 |
see python2.5's wsgiref.util.instance_uri code |
0 | 119 |
""" |
120 |
environ = self.environ |
|
121 |
url = environ['wsgi.url_scheme'] + '://' |
|
122 |
if environ.get('HTTP_HOST'): |
|
123 |
url += environ['HTTP_HOST'] |
|
124 |
else: |
|
125 |
url += environ['SERVER_NAME'] |
|
126 |
if environ['wsgi.url_scheme'] == 'https': |
|
127 |
if environ['SERVER_PORT'] != '443': |
|
128 |
url += ':' + environ['SERVER_PORT'] |
|
129 |
else: |
|
130 |
if environ['SERVER_PORT'] != '80': |
|
131 |
url += ':' + environ['SERVER_PORT'] |
|
132 |
url += quote(environ.get('SCRIPT_NAME') or '/') |
|
133 |
return url |
|
1802
d628defebc17
delete-trailing-whitespace + some copyright update
Adrien Di Mascio <Adrien.DiMascio@logilab.fr>
parents:
0
diff
changeset
|
134 |
|
0 | 135 |
def get_full_path(self): |
136 |
return '%s%s' % (self.path, self.environ.get('QUERY_STRING', '') and ('?' + self.environ.get('QUERY_STRING', '')) or '') |
|
137 |
||
138 |
def is_secure(self): |
|
139 |
return 'wsgi.url_scheme' in self.environ \ |
|
140 |
and self.environ['wsgi.url_scheme'] == 'https' |
|
141 |
||
142 |
def get_posted_data(self): |
|
8314
cfd6ab461849
[Web-Request] Use rich header (closes #2204164)
Pierre-Yves David <pierre-yves.david@logilab.fr>
parents:
8309
diff
changeset
|
143 |
# The WSGI spec says 'QUERY_STRING' may be absent. |
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
144 |
post = parse_qs(self.environ.get('QUERY_STRING', '')) |
0 | 145 |
files = None |
146 |
if self.method == 'POST': |
|
9735
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
147 |
forms, files = parse_form_data(self.environ, strict=True, |
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
148 |
mem_limit=self.vreg.config['max-post-length']) |
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
149 |
post.update(forms) |
b71158815bc8
[wsgi] avoid reading the entire request body in memory
Julien Cristau <julien.cristau@logilab.fr>
parents:
9563
diff
changeset
|
150 |
self.content.seek(0, 0) |
0 | 151 |
return post, files |