author | sylvain.thenault@logilab.fr |
Wed, 29 Apr 2009 10:55:57 +0200 | |
branch | tls-sprint |
changeset 1536 | 1e695b78d085 |
parent 1520 | b097057e629d |
child 1542 | 2965fcfaeca1 |
permissions | -rw-r--r-- |
0 | 1 |
"""twisted server for CubicWeb web applications |
2 |
||
3 |
:organization: Logilab |
|
1016
26387b836099
use datetime instead of mx.DateTime
sylvain.thenault@logilab.fr
parents:
151
diff
changeset
|
4 |
:copyright: 2001-2009 LOGILAB S.A. (Paris, FRANCE), all rights reserved. |
0 | 5 |
:contact: http://www.logilab.fr/ -- mailto:contact@logilab.fr |
6 |
""" |
|
7 |
__docformat__ = "restructuredtext en" |
|
8 |
||
9 |
import sys |
|
10 |
import select |
|
1016
26387b836099
use datetime instead of mx.DateTime
sylvain.thenault@logilab.fr
parents:
151
diff
changeset
|
11 |
from time import mktime |
26387b836099
use datetime instead of mx.DateTime
sylvain.thenault@logilab.fr
parents:
151
diff
changeset
|
12 |
from datetime import date, timedelta |
1520
b097057e629d
provide an option to substitute the base-url (left-most part) subdomain by the one of the current http query to easy multiple subdomains website management
Florent <florent@secondweb.fr>
parents:
1420
diff
changeset
|
13 |
from urlparse import urlsplit, urlunsplit |
0 | 14 |
|
15 |
from twisted.application import service, strports |
|
16 |
from twisted.internet import reactor, task, threads |
|
17 |
from twisted.internet.defer import maybeDeferred |
|
18 |
from twisted.web2 import channel, http, server, iweb |
|
19 |
from twisted.web2 import static, resource, responsecode |
|
20 |
||
21 |
from cubicweb import ObjectNotFound |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
22 |
from cubicweb.web import (AuthenticationError, NotFound, Redirect, |
0 | 23 |
RemoteCallFailed, DirectResponse, StatusResponse, |
24 |
ExplicitLogin) |
|
25 |
from cubicweb.web.application import CubicWebPublisher |
|
26 |
||
27 |
from cubicweb.etwist.request import CubicWebTwistedRequestAdapter |
|
28 |
||
29 |
||
30 |
def start_task(interval, func):
    """Run `func` repeatedly through a twisted looping call.

    interval: value given to ``LoopingCall.start`` as the call interval
    func: callable invoked by the looping call, without argument

    Nothing is returned: the deferred produced when starting the looping
    call is not kept.
    """
    task.LoopingCall(func).start(interval)
|
33 |
||
34 |
def start_looping_tasks(repo):
    """Start every task listed in `repo._looping_tasks` as a twisted task.

    `repo._looping_tasks` is iterated as (interval, function) pairs. Each
    function is wrapped so that anything it raises is logged through
    `repo.exception` instead of propagating to the looping call.

    Once every task is started, `repo._looping_tasks` is replaced by an
    empty tuple.
    """
    def guarded(task_func):
        # build the error-catching wrapper for a single task; going through
        # a factory binds `task_func` for each wrapper independently
        def catch_error_func():
            try:
                task_func()
            except:
                # deliberately broad: whatever the task raises is logged
                repo.exception('error in looping task')
        return catch_error_func

    for interval, func in repo._looping_tasks:
        repo.info('starting twisted task %s with interval %.2fs',
                  func.__name__, interval)
        start_task(interval, guarded(func))
    # ensure no tasks will be further added
    repo._looping_tasks = ()
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
46 |
|
0 | 47 |
|
48 |
class LongTimeExpiringFile(static.File):
    """static.File subclass setting a far future ``Expires`` date on the
    resource.

    Versions handling is done by serving static files through a different
    URL for each version. For instance::

      http://localhost:8080/data-2.48.2/cubicweb.css
      http://localhost:8080/data-2.49.0/cubicweb.css
      etc.

    """
    def renderHTTP(self, request):
        """Render `request` as static.File does, then add the ``Expires``
        header to the response when its status code is below 400.
        """
        def setExpireHeader(response):
            response = iweb.IResponse(response)
            # Don't provide additional resource information to error
            # responses: they are returned untouched
            if response.code >= 400:
                return response
            # the HTTP RFC recommends not going further than 1 year ahead
            far_future = date.today() + timedelta(days=6*30)
            response.headers.setHeader('Expires',
                                       mktime(far_future.timetuple()))
            return response
        parent_render = super(LongTimeExpiringFile, self).renderHTTP
        deferred = maybeDeferred(parent_render, request)
        return deferred.addCallback(setExpireHeader)
|
71 |
||
72 |
||
73 |
class CubicWebRootResource(resource.PostableResource): |
|
74 |
addSlash = False |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
75 |
|
0 | 76 |
def __init__(self, config, debug=None): |
77 |
self.appli = CubicWebPublisher(config, debug=debug) |
|
78 |
self.debugmode = debug |
|
79 |
self.config = config |
|
80 |
self.base_url = config['base-url'] or config.default_base_url() |
|
81 |
self.versioned_datadir = 'data%s' % config.instance_md5_version() |
|
82 |
assert self.base_url[-1] == '/' |
|
83 |
self.https_url = config['https-url'] |
|
84 |
assert not self.https_url or self.https_url[-1] == '/' |
|
85 |
# when we have an in-memory repository, clean unused sessions every XX |
|
86 |
# seconds and properly shutdown the server |
|
87 |
if config.repo_method == 'inmemory': |
|
88 |
reactor.addSystemEventTrigger('before', 'shutdown', |
|
89 |
self.shutdown_event) |
|
1115 | 90 |
# monkey patch start_looping_task to get proper reactor integration |
0 | 91 |
self.appli.repo.__class__.start_looping_tasks = start_looping_tasks |
92 |
if config.pyro_enabled(): |
|
93 |
# if pyro is enabled, we have to register to the pyro name |
|
94 |
# server, create a pyro daemon, and create a task to handle pyro |
|
95 |
# requests |
|
96 |
self.pyro_daemon = self.appli.repo.pyro_register() |
|
97 |
self.pyro_listen_timeout = 0.02 |
|
98 |
start_task(1, self.pyro_loop_event) |
|
99 |
self.appli.repo.start_looping_tasks() |
|
100 |
try: |
|
101 |
self.url_rewriter = self.appli.vreg.select_component('urlrewriter') |
|
102 |
except ObjectNotFound: |
|
103 |
self.url_rewriter = None |
|
104 |
interval = min(config['cleanup-session-time'] or 120, |
|
105 |
config['cleanup-anonymous-session-time'] or 720) / 2. |
|
106 |
start_task(interval, self.appli.session_handler.clean_sessions) |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
107 |
|
0 | 108 |
def shutdown_event(self): |
109 |
"""callback fired when the server is shutting down to properly |
|
110 |
clean opened sessions |
|
111 |
""" |
|
112 |
self.appli.repo.shutdown() |
|
113 |
||
114 |
def pyro_loop_event(self): |
|
115 |
"""listen for pyro events""" |
|
116 |
try: |
|
117 |
self.pyro_daemon.handleRequests(self.pyro_listen_timeout) |
|
118 |
except select.error: |
|
119 |
return |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
120 |
|
0 | 121 |
def locateChild(self, request, segments): |
122 |
"""Indicate which resource to use to process down the URL's path""" |
|
123 |
if segments: |
|
124 |
if segments[0] == 'https': |
|
125 |
segments = segments[1:] |
|
126 |
if len(segments) >= 2: |
|
151
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
127 |
if segments[0] in (self.versioned_datadir, 'data', 'static'): |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
128 |
# Anything in data/, static/ is treated as static files |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
129 |
if segments[0] == 'static': |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
130 |
# instance static directory |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
131 |
datadir = self.config.static_directory |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
132 |
else: |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
133 |
# cube static data file |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
134 |
datadir = self.config.locate_resource(segments[1]) |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
135 |
if datadir is None: |
343e7a18675d
static files support
Sylvain Thenault <sylvain.thenault@logilab.fr>
parents:
0
diff
changeset
|
136 |
return None, [] |
0 | 137 |
self.info('static file %s from %s', segments[-1], datadir) |
138 |
if segments[0] == 'data': |
|
139 |
return static.File(str(datadir)), segments[1:] |
|
140 |
else: |
|
141 |
return LongTimeExpiringFile(datadir), segments[1:] |
|
142 |
elif segments[0] == 'fckeditor': |
|
143 |
fckeditordir = self.config.ext_resources['FCKEDITOR_PATH'] |
|
144 |
return static.File(fckeditordir), segments[1:] |
|
145 |
# Otherwise we use this single resource |
|
146 |
return self, () |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
147 |
|
0 | 148 |
def render(self, request): |
149 |
"""Render a page from the root resource""" |
|
150 |
# reload modified files (only in development or debug mode) |
|
151 |
if self.config.mode == 'dev' or self.debugmode: |
|
152 |
self.appli.vreg.register_objects(self.config.vregistry_path()) |
|
153 |
if self.config['profile']: # default profiler don't trace threads |
|
154 |
return self.render_request(request) |
|
155 |
else: |
|
156 |
return threads.deferToThread(self.render_request, request) |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
157 |
|
0 | 158 |
def render_request(self, request): |
159 |
origpath = request.path |
|
160 |
host = request.host |
|
161 |
# dual http/https access handling: expect a rewrite rule to prepend |
|
162 |
# 'https' to the path to detect https access |
|
163 |
if origpath.split('/', 2)[1] == 'https': |
|
164 |
origpath = origpath[6:] |
|
165 |
request.uri = request.uri[6:] |
|
166 |
https = True |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
167 |
baseurl = self.https_url or self.base_url |
0 | 168 |
else: |
169 |
https = False |
|
170 |
baseurl = self.base_url |
|
1520
b097057e629d
provide an option to substitute the base-url (left-most part) subdomain by the one of the current http query to easy multiple subdomains website management
Florent <florent@secondweb.fr>
parents:
1420
diff
changeset
|
171 |
if self.config['use-request-subdomain']: |
b097057e629d
provide an option to substitute the base-url (left-most part) subdomain by the one of the current http query to easy multiple subdomains website management
Florent <florent@secondweb.fr>
parents:
1420
diff
changeset
|
172 |
scheme, netloc, url, query, fragment = urlsplit(baseurl) |
b097057e629d
provide an option to substitute the base-url (left-most part) subdomain by the one of the current http query to easy multiple subdomains website management
Florent <florent@secondweb.fr>
parents:
1420
diff
changeset
|
173 |
if '.' in netloc: |
b097057e629d
provide an option to substitute the base-url (left-most part) subdomain by the one of the current http query to easy multiple subdomains website management
Florent <florent@secondweb.fr>
parents:
1420
diff
changeset
|
174 |
netloc = '.'.join(host.split('.')[:1] + netloc.split('.')[1:]) |
b097057e629d
provide an option to substitute the base-url (left-most part) subdomain by the one of the current http query to easy multiple subdomains website management
Florent <florent@secondweb.fr>
parents:
1420
diff
changeset
|
175 |
baseurl = urlunsplit((scheme, netloc, url, query, fragment)) |
b097057e629d
provide an option to substitute the base-url (left-most part) subdomain by the one of the current http query to easy multiple subdomains website management
Florent <florent@secondweb.fr>
parents:
1420
diff
changeset
|
176 |
self.warning('base_url is %s for this request', baseurl) |
0 | 177 |
req = CubicWebTwistedRequestAdapter(request, self.appli.vreg, https, baseurl) |
178 |
if req.authmode == 'http': |
|
179 |
# activate realm-based auth |
|
180 |
realm = self.config['realm'] |
|
181 |
req.set_header('WWW-Authenticate', [('Basic', {'realm' : realm })], raw=False) |
|
182 |
try: |
|
183 |
self.appli.connect(req) |
|
184 |
except AuthenticationError: |
|
185 |
return self.request_auth(req) |
|
186 |
except Redirect, ex: |
|
187 |
return self.redirect(req, ex.location) |
|
188 |
if https and req.cnx.anonymous_connection: |
|
189 |
# don't allow anonymous on https connection |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
190 |
return self.request_auth(req) |
0 | 191 |
if self.url_rewriter is not None: |
1115 | 192 |
# XXX should occur before authentication? |
0 | 193 |
try: |
194 |
path = self.url_rewriter.rewrite(host, origpath) |
|
195 |
except Redirect, ex: |
|
196 |
return self.redirect(req, ex.location) |
|
197 |
request.uri.replace(origpath, path, 1) |
|
198 |
else: |
|
199 |
path = origpath |
|
200 |
if not path or path == "/": |
|
201 |
path = 'view' |
|
202 |
try: |
|
203 |
result = self.appli.publish(path, req) |
|
204 |
except DirectResponse, ex: |
|
205 |
return ex.response |
|
206 |
except StatusResponse, ex: |
|
207 |
return http.Response(stream=ex.content, code=ex.status, |
|
208 |
headers=req.headers_out or None) |
|
209 |
except RemoteCallFailed, ex: |
|
210 |
req.set_header('content-type', 'application/json') |
|
211 |
return http.Response(stream=ex.dumps(), |
|
212 |
code=responsecode.INTERNAL_SERVER_ERROR) |
|
213 |
except NotFound: |
|
214 |
result = self.appli.notfound_content(req) |
|
215 |
return http.Response(stream=result, code=responsecode.NOT_FOUND, |
|
216 |
headers=req.headers_out or None) |
|
217 |
except ExplicitLogin: # must be before AuthenticationError |
|
218 |
return self.request_auth(req) |
|
219 |
except AuthenticationError: |
|
220 |
if self.config['auth-mode'] == 'cookie': |
|
221 |
# in cookie mode redirecting to the index view is enough : |
|
222 |
# either anonymous connection is allowed and the page will |
|
223 |
# be displayed or we'll be redirected to the login form |
|
224 |
msg = req._('you have been logged out') |
|
225 |
if req.https: |
|
226 |
req._base_url = self.base_url |
|
227 |
req.https = False |
|
228 |
url = req.build_url('view', vid='index', __message=msg) |
|
229 |
return self.redirect(req, url) |
|
230 |
else: |
|
231 |
# in http we have to request auth to flush current http auth |
|
232 |
# information |
|
233 |
return self.request_auth(req, loggedout=True) |
|
234 |
except Redirect, ex: |
|
235 |
return self.redirect(req, ex.location) |
|
236 |
# request may be referenced by "onetime callback", so clear its entity |
|
237 |
# cache to avoid memory usage |
|
238 |
req.drop_entity_cache() |
|
239 |
return http.Response(stream=result, code=responsecode.OK, |
|
240 |
headers=req.headers_out or None) |
|
241 |
||
242 |
def redirect(self, req, location): |
|
243 |
req.headers_out.setHeader('location', str(location)) |
|
244 |
self.debug('redirecting to %s', location) |
|
245 |
# 303 See other |
|
246 |
return http.Response(code=303, headers=req.headers_out) |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
247 |
|
0 | 248 |
def request_auth(self, req, loggedout=False): |
249 |
if self.https_url and req.base_url() != self.https_url: |
|
250 |
req.headers_out.setHeader('location', self.https_url + 'login') |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
251 |
return http.Response(code=303, headers=req.headers_out) |
0 | 252 |
if self.config['auth-mode'] == 'http': |
253 |
code = responsecode.UNAUTHORIZED |
|
254 |
else: |
|
255 |
code = responsecode.FORBIDDEN |
|
256 |
if loggedout: |
|
257 |
if req.https: |
|
258 |
req._base_url = self.base_url |
|
259 |
req.https = False |
|
260 |
content = self.appli.loggedout_content(req) |
|
261 |
else: |
|
262 |
content = self.appli.need_login_content(req) |
|
263 |
return http.Response(code, req.headers_out, content) |
|
264 |
||
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
265 |
|
0 | 266 |
# This part gets run when you run this file via: "twistd -noy demo.py" |
267 |
def main(appid, cfgname):
    """Start a cubicweb twisted server for an application.

    appid: application's identifier
    cfgname: name of the configuration to use (twisted or all-in-one)

    Return the twisted application to which the HTTP service is attached.
    """
    from cubicweb.cwconfig import CubicWebConfiguration
    from cubicweb.etwist import twconfig # trigger configuration registration
    config = CubicWebConfiguration.config_for(appid, cfgname)
    # XXX why calling init_available_cubes here ?
    config.init_available_cubes()
    # create the site and application objects; the debug keyword is only
    # given when '-n' is found on the command line (debug mode)
    root_options = {}
    if '-n' in sys.argv:
        root_options['debug'] = True
    root_resource = CubicWebRootResource(config, **root_options)
    website = server.Site(root_resource)
    application = service.Application("cubicweb")
    # serve it via standard HTTP on port set in the configuration (8080 when
    # no port is set)
    description = 'tcp:%04d' % (config['port'] or 8080)
    http_service = strports.service(description, channel.HTTPFactory(website))
    http_service.setServiceParent(application)
    return application
|
292 |
||
293 |
||
294 |
from twisted.python import failure |
|
295 |
from twisted.internet import defer |
|
296 |
from twisted.web2 import fileupload |
|
297 |
||
298 |
# XXX set max file size to 100Mo: put max upload size in the configuration |
|
299 |
# line below for twisted >= 8.0, default param value for earlier version |
|
1420
25c13e5b12bd
stop complaining about empty response, remove trailing spaces
sylvain.thenault@logilab.fr
parents:
1263
diff
changeset
|
300 |
resource.PostableResource.maxSize = 100*1024*1024 |
0 | 301 |
def parsePOSTData(request, maxMem=100*1024, maxFields=1024,
                  maxSize=100*1024*1024):
    """Parse the body of a POST request into `request.args` and
    `request.files`.

    request: the request whose stream is parsed
    maxMem, maxFields, maxSize: limits given as is to the multipart parser

    Always return a Deferred:

    * firing with None right away when the stream length is 0 or when there
      is no content-type header
    * firing once `request.args` (and `request.files` for multipart data)
      has been updated from url-encoded or multipart form data
    * failing with an `http.HTTPError` when the multipart boundary is
      missing, when the parser reports a `MimeFormatError`, or when the
      content type is not one of the two supported ones
    """
    if request.stream.length == 0:
        return defer.succeed(None)

    ctype = request.headers.getHeader('content-type')

    if ctype is None:
        return defer.succeed(None)

    def updateArgs(data):
        args = data
        request.args.update(args)

    def updateArgsAndFiles(data):
        args, files = data
        request.args.update(args)
        request.files.update(files)

    def error(f):
        # only mime format errors are turned into a "bad request"; trap()
        # lets any other failure go through
        f.trap(fileupload.MimeFormatError)
        raise http.HTTPError(responsecode.BAD_REQUEST)

    if ctype.mediaType == 'application' and ctype.mediaSubtype == 'x-www-form-urlencoded':
        d = fileupload.parse_urlencoded(request.stream, keep_blank_values=True)
        d.addCallbacks(updateArgs, error)
        return d
    elif ctype.mediaType == 'multipart' and ctype.mediaSubtype == 'form-data':
        boundary = ctype.params.get('boundary')
        if boundary is None:
            return defer.fail(http.HTTPError(
                http.StatusResponse(responsecode.BAD_REQUEST,
                                    "Boundary not specified in Content-Type.")))
        d = fileupload.parseMultipartFormData(request.stream, boundary,
                                              maxMem, maxFields, maxSize)
        d.addCallbacks(updateArgsAndFiles, error)
        return d
    else:
        # report the unsupported content type through a failed Deferred, as
        # every other path does, instead of raising synchronously
        return defer.fail(http.HTTPError(responsecode.BAD_REQUEST))
|
340 |
||
341 |
server.parsePOSTData = parsePOSTData |
|
342 |
||
343 |
||
344 |
from logging import getLogger |
|
345 |
from cubicweb import set_log_methods |
|
346 |
set_log_methods(CubicWebRootResource, getLogger('cubicweb.twisted')) |
|
347 |
||
348 |
||
349 |
||
350 |
def _gc_debug():
    """Print statistics about the objects tracked by the garbage collector.

    After a collection, print the number of request adapters and of
    VObject instances found, the 20 most represented classes among the
    other objects, and the content of `gc.garbage`.
    """
    import gc
    from pprint import pprint
    from cubicweb.vregistry import VObject
    gc.collect()
    requests_count = 0
    appobjects_count = 0
    per_class = {}
    for obj in gc.get_objects():
        if isinstance(obj, CubicWebTwistedRequestAdapter):
            requests_count += 1
            continue
        if isinstance(obj, VObject):
            appobjects_count += 1
            continue
        try:
            klass = obj.__class__
        except AttributeError:
            # objects without a class are not counted
            continue
        per_class[klass] = per_class.get(klass, 0) + 1
    print('%s %s' % ('IN MEM REQUESTS', requests_count))
    print('%s %s' % ('IN MEM APPOBJECTS', appobjects_count))
    most_common = sorted(per_class.items(), key=lambda x: x[1],
                         reverse=True)[:20]
    pprint(most_common)
    print('%s %s' % ('UNREACHABLE', gc.garbage))