mirror of
https://github.com/jupyterhub/jupyterhub.git
synced 2025-10-15 14:03:02 +00:00
Merge pull request #1393 from minrk/spawn-future
improve reporting of spawn failure
This commit is contained in:
@@ -376,6 +376,9 @@ class BaseHandler(RequestHandler):
|
|||||||
|
|
||||||
@gen.coroutine
|
@gen.coroutine
|
||||||
def spawn_single_user(self, user, server_name='', options=None):
|
def spawn_single_user(self, user, server_name='', options=None):
|
||||||
|
# in case of error, include 'try again from /hub/home' message
|
||||||
|
self.extra_error_html = self.spawn_home_error
|
||||||
|
|
||||||
user_server_name = user.name
|
user_server_name = user.name
|
||||||
if self.allow_named_servers and not server_name:
|
if self.allow_named_servers and not server_name:
|
||||||
server_name = default_server_name(user)
|
server_name = default_server_name(user)
|
||||||
@@ -440,11 +443,7 @@ class BaseHandler(RequestHandler):
|
|||||||
otherwise it is called immediately.
|
otherwise it is called immediately.
|
||||||
"""
|
"""
|
||||||
# wait for spawn Future
|
# wait for spawn Future
|
||||||
try:
|
|
||||||
yield spawn_future
|
yield spawn_future
|
||||||
except Exception:
|
|
||||||
spawner._spawn_pending = False
|
|
||||||
raise
|
|
||||||
toc = IOLoop.current().time()
|
toc = IOLoop.current().time()
|
||||||
self.log.info("User %s took %.3f seconds to start", user_server_name, toc-tic)
|
self.log.info("User %s took %.3f seconds to start", user_server_name, toc-tic)
|
||||||
self.statsd.timing('spawner.success', (toc - tic) * 1000)
|
self.statsd.timing('spawner.success', (toc - tic) * 1000)
|
||||||
@@ -459,10 +458,22 @@ class BaseHandler(RequestHandler):
|
|||||||
spawner.add_poll_callback(self.user_stopped, user, server_name)
|
spawner.add_poll_callback(self.user_stopped, user, server_name)
|
||||||
finally:
|
finally:
|
||||||
spawner._proxy_pending = False
|
spawner._proxy_pending = False
|
||||||
|
|
||||||
|
# hook up spawner._spawn_future so that other requests can await
|
||||||
|
# this result
|
||||||
|
finish_spawn_future = spawner._spawn_future = finish_user_spawn()
|
||||||
|
def _clear_spawn_future(f):
|
||||||
|
# clear spawner._spawn_future when it's done
|
||||||
|
# keep an exception around, though, to prevent repeated implicit spawns
|
||||||
|
# if spawn is failing
|
||||||
|
if f.exception() is None:
|
||||||
|
spawner._spawn_future = None
|
||||||
|
# Now we're all done. clear _spawn_pending flag
|
||||||
spawner._spawn_pending = False
|
spawner._spawn_pending = False
|
||||||
|
finish_spawn_future.add_done_callback(_clear_spawn_future)
|
||||||
|
|
||||||
try:
|
try:
|
||||||
yield gen.with_timeout(timedelta(seconds=self.slow_spawn_timeout), finish_user_spawn())
|
yield gen.with_timeout(timedelta(seconds=self.slow_spawn_timeout), finish_spawn_future)
|
||||||
except gen.TimeoutError:
|
except gen.TimeoutError:
|
||||||
# waiting_for_response indicates server process has started,
|
# waiting_for_response indicates server process has started,
|
||||||
# but is yet to become responsive.
|
# but is yet to become responsive.
|
||||||
@@ -479,7 +490,8 @@ class BaseHandler(RequestHandler):
|
|||||||
if status is not None:
|
if status is not None:
|
||||||
toc = IOLoop.current().time()
|
toc = IOLoop.current().time()
|
||||||
self.statsd.timing('spawner.failure', (toc - tic) * 1000)
|
self.statsd.timing('spawner.failure', (toc - tic) * 1000)
|
||||||
raise web.HTTPError(500, "Spawner failed to start [status=%s]" % status)
|
raise web.HTTPError(500, "Spawner failed to start [status=%s]. The logs for %s may contain details." % (
|
||||||
|
status, spawner._log_name))
|
||||||
|
|
||||||
if spawner._waiting_for_response:
|
if spawner._waiting_for_response:
|
||||||
# hit timeout waiting for response, but server's running.
|
# hit timeout waiting for response, but server's running.
|
||||||
@@ -549,6 +561,19 @@ class BaseHandler(RequestHandler):
|
|||||||
# template rendering
|
# template rendering
|
||||||
#---------------------------------------------------------------
|
#---------------------------------------------------------------
|
||||||
|
|
||||||
|
@property
|
||||||
|
def spawn_home_error(self):
|
||||||
|
"""Extra message pointing users to try spawning again from /hub/home.
|
||||||
|
|
||||||
|
Should be added to `self.extra_error_html` for any handler
|
||||||
|
that could serve a failed spawn message.
|
||||||
|
"""
|
||||||
|
home = url_path_join(self.hub.base_url, 'home')
|
||||||
|
return (
|
||||||
|
"You can try restarting your server from the "
|
||||||
|
"<a href='{home}'>home page</a>.".format(home=home)
|
||||||
|
)
|
||||||
|
|
||||||
def get_template(self, name):
|
def get_template(self, name):
|
||||||
"""Return the jinja template object for a given name"""
|
"""Return the jinja template object for a given name"""
|
||||||
return self.settings['jinja2_env'].get_template(name)
|
return self.settings['jinja2_env'].get_template(name)
|
||||||
@@ -596,6 +621,7 @@ class BaseHandler(RequestHandler):
|
|||||||
status_code=status_code,
|
status_code=status_code,
|
||||||
status_message=status_message,
|
status_message=status_message,
|
||||||
message=message,
|
message=message,
|
||||||
|
extra_error_html=getattr(self, 'extra_error_html', ''),
|
||||||
exception=exception,
|
exception=exception,
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -649,10 +675,13 @@ class UserSpawnHandler(BaseHandler):
|
|||||||
current_user = self.get_current_user()
|
current_user = self.get_current_user()
|
||||||
|
|
||||||
if current_user and current_user.name == name:
|
if current_user and current_user.name == name:
|
||||||
|
# if spawning fails for any reason, point users to /hub/home to retry
|
||||||
|
self.extra_error_html = self.spawn_home_error
|
||||||
|
|
||||||
# If people visit /user/:name directly on the Hub,
|
# If people visit /user/:name directly on the Hub,
|
||||||
# the redirects will just loop, because the proxy is bypassed.
|
# the redirects will just loop, because the proxy is bypassed.
|
||||||
# Try to check for that and warn,
|
# Try to check for that and warn,
|
||||||
# though the user-facing behavior is unchainged
|
# though the user-facing behavior is unchanged
|
||||||
host_info = urlparse(self.request.full_url())
|
host_info = urlparse(self.request.full_url())
|
||||||
port = host_info.port
|
port = host_info.port
|
||||||
if not port:
|
if not port:
|
||||||
@@ -664,8 +693,34 @@ class UserSpawnHandler(BaseHandler):
|
|||||||
Make sure to connect to the proxied public URL %s
|
Make sure to connect to the proxied public URL %s
|
||||||
""", self.request.full_url(), self.proxy.public_url)
|
""", self.request.full_url(), self.proxy.public_url)
|
||||||
|
|
||||||
# logged in as correct user, spawn the server
|
# logged in as correct user, check for pending spawn
|
||||||
spawner = current_user.spawner
|
spawner = current_user.spawner
|
||||||
|
|
||||||
|
# First, check for previous failure.
|
||||||
|
if (
|
||||||
|
not spawner.active
|
||||||
|
and spawner._spawn_future
|
||||||
|
and spawner._spawn_future.done()
|
||||||
|
and spawner._spawn_future.exception()
|
||||||
|
):
|
||||||
|
# Condition: spawner not active and _spawn_future exists and contains an Exception
|
||||||
|
# Implicit spawn on /user/:name is not allowed if the user's last spawn failed.
|
||||||
|
# We should point the user to Home if the most recent spawn failed.
|
||||||
|
self.log.error("Preventing implicit spawn for %s because last spawn failed: %s",
|
||||||
|
spawner._log_name, spawner._spawn_future.exception())
|
||||||
|
raise spawner._spawn_future.exception()
|
||||||
|
|
||||||
|
# check for pending spawn
|
||||||
|
if spawner.pending and spawner._spawn_future:
|
||||||
|
# wait on the pending spawn
|
||||||
|
self.log.debug("Waiting for %s pending %s", spawner._log_name, spawner.pending)
|
||||||
|
try:
|
||||||
|
yield gen.with_timeout(timedelta(seconds=self.slow_spawn_timeout), spawner._spawn_future)
|
||||||
|
except gen.TimeoutError:
|
||||||
|
self.log.info("Pending spawn for %s didn't finish in %.1f seconds", spawner._log_name, self.slow_spawn_timeout)
|
||||||
|
pass
|
||||||
|
|
||||||
|
# we may have waited above, check pending again:
|
||||||
if spawner.pending:
|
if spawner.pending:
|
||||||
self.log.info("%s is pending %s", spawner._log_name, spawner.pending)
|
self.log.info("%s is pending %s", spawner._log_name, spawner.pending)
|
||||||
# spawn has started, but not finished
|
# spawn has started, but not finished
|
||||||
@@ -679,6 +734,8 @@ class UserSpawnHandler(BaseHandler):
|
|||||||
status = yield spawner.poll()
|
status = yield spawner.poll()
|
||||||
else:
|
else:
|
||||||
status = 0
|
status = 0
|
||||||
|
|
||||||
|
# server is not running, trigger spawn
|
||||||
if status is not None:
|
if status is not None:
|
||||||
if spawner.options_form:
|
if spawner.options_form:
|
||||||
self.redirect(url_concat(url_path_join(self.hub.base_url, 'spawn'),
|
self.redirect(url_concat(url_path_join(self.hub.base_url, 'spawn'),
|
||||||
@@ -687,6 +744,15 @@ class UserSpawnHandler(BaseHandler):
|
|||||||
else:
|
else:
|
||||||
yield self.spawn_single_user(current_user)
|
yield self.spawn_single_user(current_user)
|
||||||
|
|
||||||
|
# spawn didn't finish, show pending page
|
||||||
|
if spawner.pending:
|
||||||
|
self.log.info("%s is pending %s", spawner._log_name, spawner.pending)
|
||||||
|
# spawn has started, but not finished
|
||||||
|
self.statsd.incr('redirects.user_spawn_pending', 1)
|
||||||
|
html = self.render_template("spawn_pending.html", user=current_user)
|
||||||
|
self.finish(html)
|
||||||
|
return
|
||||||
|
|
||||||
# We do exponential backoff here - since otherwise we can get stuck in a redirect loop!
|
# We do exponential backoff here - since otherwise we can get stuck in a redirect loop!
|
||||||
# This is important in many distributed proxy implementations - those are often eventually
|
# This is important in many distributed proxy implementations - those are often eventually
|
||||||
# consistent and can take up to a couple of seconds to actually apply throughout the cluster.
|
# consistent and can take up to a couple of seconds to actually apply throughout the cluster.
|
||||||
|
@@ -67,9 +67,13 @@ class HomeHandler(BaseHandler):
|
|||||||
if user.running:
|
if user.running:
|
||||||
# trigger poll_and_notify event in case of a server that died
|
# trigger poll_and_notify event in case of a server that died
|
||||||
yield user.spawner.poll_and_notify()
|
yield user.spawner.poll_and_notify()
|
||||||
|
# send the user to /spawn if they aren't running,
|
||||||
|
# to establish that this is an explicit spawn request rather
|
||||||
|
# than an implicit one, which can be caused by any link to `/user/:name`
|
||||||
|
url = user.url if user.running else url_path_join(self.hub.base_url, 'spawn')
|
||||||
html = self.render_template('home.html',
|
html = self.render_template('home.html',
|
||||||
user=user,
|
user=user,
|
||||||
url=user.url,
|
url=url,
|
||||||
)
|
)
|
||||||
self.finish(html)
|
self.finish(html)
|
||||||
|
|
||||||
@@ -92,7 +96,10 @@ class SpawnHandler(BaseHandler):
|
|||||||
|
|
||||||
@web.authenticated
|
@web.authenticated
|
||||||
def get(self):
|
def get(self):
|
||||||
"""GET renders form for spawning with user-specified options"""
|
"""GET renders form for spawning with user-specified options
|
||||||
|
|
||||||
|
or triggers spawn via redirect if there is no form.
|
||||||
|
"""
|
||||||
user = self.get_current_user()
|
user = self.get_current_user()
|
||||||
if not self.allow_named_servers and user.running:
|
if not self.allow_named_servers and user.running:
|
||||||
url = user.url
|
url = user.url
|
||||||
@@ -102,7 +109,12 @@ class SpawnHandler(BaseHandler):
|
|||||||
if user.spawner.options_form:
|
if user.spawner.options_form:
|
||||||
self.finish(self._render_form())
|
self.finish(self._render_form())
|
||||||
else:
|
else:
|
||||||
# not running, no form. Trigger spawn.
|
# Explicit spawn request: clear _spawn_future
|
||||||
|
# which may have been saved to prevent implicit spawns
|
||||||
|
# after a failure.
|
||||||
|
if user.spawner._spawn_future and user.spawner._spawn_future.done():
|
||||||
|
user.spawner._spawn_future = None
|
||||||
|
# not running, no form. Trigger spawn by redirecting to /user/:name
|
||||||
self.redirect(user.url)
|
self.redirect(user.url)
|
||||||
|
|
||||||
@web.authenticated
|
@web.authenticated
|
||||||
|
@@ -54,6 +54,7 @@ class Spawner(LoggingConfigurable):
|
|||||||
_proxy_pending = False
|
_proxy_pending = False
|
||||||
_waiting_for_response = False
|
_waiting_for_response = False
|
||||||
_jupyterhub_version = None
|
_jupyterhub_version = None
|
||||||
|
_spawn_future = None
|
||||||
|
|
||||||
@property
|
@property
|
||||||
def _log_name(self):
|
def _log_name(self):
|
||||||
|
@@ -22,6 +22,11 @@
|
|||||||
{{message_html | safe}}
|
{{message_html | safe}}
|
||||||
</p>
|
</p>
|
||||||
{% endif %}
|
{% endif %}
|
||||||
|
{% if extra_error_html %}
|
||||||
|
<p>
|
||||||
|
{{extra_error_html | safe}}
|
||||||
|
</p>
|
||||||
|
{% endif %}
|
||||||
{% endblock error_detail %}
|
{% endblock error_detail %}
|
||||||
</div>
|
</div>
|
||||||
|
|
||||||
|
Reference in New Issue
Block a user