forked from opendatahub-io-contrib/jupyterhub-quickstart
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathjupyterhub_config.py
278 lines (194 loc) · 9 KB
/
jupyterhub_config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
import os
import wrapt
from kubernetes.client.configuration import Configuration
from kubernetes.config.incluster_config import load_incluster_config
from kubernetes.client.api_client import ApiClient
from kubernetes.client.rest import ApiException
from openshift.dynamic import DynamicClient
# Helper function for doing unit conversions or translations if needed.
def convert_size_to_bytes(size):
multipliers = {
'k': 1000,
'm': 1000**2,
'g': 1000**3,
't': 1000**4,
'ki': 1024,
'mi': 1024**2,
'gi': 1024**3,
'ti': 1024**4,
}
size = str(size)
for suffix in multipliers:
if size.lower().endswith(suffix):
return int(size[0:-len(suffix)]) * multipliers[suffix]
else:
if size.lower().endswith('b'):
return int(size[0:-1])
try:
return int(size)
except ValueError:
raise RuntimeError('"%s" is not a valid memory specification. Must be an integer or a string with suffix K, M, G, T, Ki, Mi, Gi or Ti.' % size)
# Initialise client for the REST API used doing configuration.
#
# XXX Currently have a workaround here for OpenShift 4.0 beta versions
# which disables verification of the certificate. If don't use this the
# Python openshift/kubernetes clients will fail. We also disable any
# warnings from urllib3 to get rid of the noise in the logs this creates.
load_incluster_config()
import urllib3
urllib3.disable_warnings()
instance = Configuration()
instance.verify_ssl = False
Configuration.set_default(instance)
api_client = DynamicClient(ApiClient())
image_stream_resource = api_client.resources.get(
api_version='image.openshift.io/v1', kind='ImageStream')
route_resource = api_client.resources.get(
api_version='route.openshift.io/v1', kind='Route')
# Work out the name of the JupyterHub deployment passed in environment.
application_name = os.environ.get('APPLICATION_NAME', 'jupyterhub')
# Work out the name of the namespace in which we are being deployed.
service_account_path = '/var/run/secrets/kubernetes.io/serviceaccount'
with open(os.path.join(service_account_path, 'namespace')) as fp:
namespace = fp.read().strip()
# Work out hostname for the exposed route of the JupyterHub server.
routes = route_resource.get(namespace=namespace)
def extract_hostname(routes, name):
for route in routes.items:
if route.metadata.name == name:
return route.spec.host
public_hostname = extract_hostname(routes, application_name)
if not public_hostname:
raise RuntimeError('Cannot calculate external host name for JupyterHub.')
# Helper function for determining the correct name for the image. We
# need to do this for references to image streams because of the image
# lookup policy often not being correctly setup on OpenShift clusters.
def resolve_image_name(name):
# If the image name contains a slash, we assume it is already
# referring to an image on some image registry. Even if it does
# not contain a slash, it may still be hosted on docker.io.
if name.find('/') != -1:
return name
# Separate actual source image name and tag for the image from the
# name. If the tag is not supplied, default to 'latest'.
parts = name.split(':', 1)
if len(parts) == 1:
source_image, tag = parts, 'latest'
else:
source_image, tag = parts
# See if there is an image stream in the current project with the
# target name.
try:
image_stream = image_stream_resource.get(namespace=namespace,
name=source_image)
except ApiException as e:
if e.status not in (403, 404):
raise
return name
# If we get here then the image stream exists with the target name.
# We need to determine if the tag exists. If it does exist, we
# extract out the full name of the image including the reference
# to the image registry it is hosted on.
if image_stream.status.tags:
for entry in image_stream.status.tags:
if entry.tag == tag:
registry_image = image_stream.status.dockerImageRepository
if registry_image:
return '%s:%s' % (registry_image, tag)
# Use original value if can't find a matching tag.
return name
# Define the default configuration for JupyterHub application.
c.Spawner.environment = dict()
c.JupyterHub.services = []
c.KubeSpawner.init_containers = []
c.KubeSpawner.extra_containers = []
c.JupyterHub.extra_handlers = []
c.JupyterHub.port = 8080
c.JupyterHub.hub_ip = '0.0.0.0'
c.JupyterHub.hub_port = 8081
c.JupyterHub.hub_connect_ip = application_name
c.ConfigurableHTTPProxy.api_url = 'http://127.0.0.1:8082'
c.Spawner.start_timeout = 120
c.Spawner.http_timeout = 60
c.KubeSpawner.port = 8080
c.KubeSpawner.common_labels = { 'app': application_name }
c.KubeSpawner.uid = os.getuid()
c.KubeSpawner.fs_gid = os.getuid()
c.KubeSpawner.extra_annotations = {
"alpha.image.policy.openshift.io/resolve-names": "*"
}
c.KubeSpawner.cmd = ['start-singleuser.sh']
c.KubeSpawner.pod_name_template = '%s-nb-{username}' % application_name
c.JupyterHub.admin_access = True
if os.environ.get('JUPYTERHUB_COOKIE_SECRET'):
c.JupyterHub.cookie_secret = os.environ[
'JUPYTERHUB_COOKIE_SECRET'].encode('UTF-8')
else:
c.JupyterHub.cookie_secret_file = '/opt/app-root/data/cookie_secret'
if os.environ.get('JUPYTERHUB_DATABASE_PASSWORD'):
c.JupyterHub.db_url = 'postgresql://%s:%s@%s:5432/%s' % (
os.environ.get('JUPYTERHUB_DATABASE_USER', 'jupyterhub'),
os.environ['JUPYTERHUB_DATABASE_PASSWORD'],
os.environ['JUPYTERHUB_DATABASE_HOST'],
os.environ.get('JUPYTERHUB_DATABASE_NAME', 'jupyterhub'))
else:
c.JupyterHub.db_url = '/opt/app-root/data/database.sqlite'
c.JupyterHub.authenticator_class = 'tmpauthenticator.TmpAuthenticator'
c.JupyterHub.spawner_class = 'kubespawner.KubeSpawner'
c.KubeSpawner.image_spec = resolve_image_name(
os.environ.get('JUPYTERHUB_NOTEBOOK_IMAGE',
's2i-minimal-notebook:3.6'))
if os.environ.get('JUPYTERHUB_NOTEBOOK_MEMORY'):
c.Spawner.mem_limit = convert_size_to_bytes(os.environ['JUPYTERHUB_NOTEBOOK_MEMORY'])
notebook_interface = os.environ.get('JUPYTERHUB_NOTEBOOK_INTERFACE')
if notebook_interface:
c.Spawner.environment['JUPYTER_NOTEBOOK_INTERFACE'] = notebook_interface
# Workaround bug in minishift where a service cannot be contacted from a
# pod which backs the service. For further details see the minishift issue
# https://github.com/minishift/minishift/issues/2400.
#
# What these workarounds do is monkey patch the JupyterHub proxy client
# API code, and the code for creating the environment for local service
# processes, and when it sees something which uses the service name as
# the target in a URL, it replaces it with localhost. These work because
# the proxy/service processes are in the same pod. It is not possible to
# change hub_connect_ip to localhost because that is passed to other
# pods which need to contact back to JupyterHub, and so it must be left
# as the service name.
@wrapt.patch_function_wrapper('jupyterhub.proxy', 'ConfigurableHTTPProxy.add_route')
def _wrapper_add_route(wrapped, instance, args, kwargs):
def _extract_args(routespec, target, data, *_args, **_kwargs):
return (routespec, target, data, _args, _kwargs)
routespec, target, data, _args, _kwargs = _extract_args(*args, **kwargs)
old = 'http://%s:%s' % (c.JupyterHub.hub_connect_ip, c.JupyterHub.hub_port)
new = 'http://127.0.0.1:%s' % c.JupyterHub.hub_port
if target.startswith(old):
target = target.replace(old, new)
return wrapped(routespec, target, data, *_args, **_kwargs)
@wrapt.patch_function_wrapper('jupyterhub.spawner', 'LocalProcessSpawner.get_env')
def _wrapper_get_env(wrapped, instance, args, kwargs):
env = wrapped(*args, **kwargs)
target = env.get('JUPYTERHUB_API_URL')
old = 'http://%s:%s' % (c.JupyterHub.hub_connect_ip, c.JupyterHub.hub_port)
new = 'http://127.0.0.1:%s' % c.JupyterHub.hub_port
if target and target.startswith(old):
target = target.replace(old, new)
env['JUPYTERHUB_API_URL'] = target
return env
# Load configuration overrides based on configuration type.
configuration_type = os.environ.get('CONFIGURATION_TYPE')
if configuration_type:
config_file = '/opt/app-root/etc/jupyterhub_config-%s.py' % configuration_type
if os.path.exists(config_file):
with open(config_file) as fp:
exec(compile(fp.read(), config_file, 'exec'), globals())
# Load configuration included in the image.
image_config_file = '/opt/app-root/src/.jupyter/jupyterhub_config.py'
if os.path.exists(image_config_file):
with open(image_config_file) as fp:
exec(compile(fp.read(), image_config_file, 'exec'), globals())
# Load configuration provided via the environment.
environ_config_file = '/opt/app-root/configs/jupyterhub_config.py'
if os.path.exists(environ_config_file):
with open(environ_config_file) as fp:
exec(compile(fp.read(), environ_config_file, 'exec'), globals())