Set GPU access on Jupyterlab containers based on Magpie user or group name #616
base: master
Changes from 3 commits
```diff
@@ -73,24 +73,35 @@ export JUPYTERHUB_AUTHENTICATOR_REFRESH_AGE=60
 export JUPYTERHUB_ADMIN_USERS='{\"${MAGPIE_ADMIN_USERNAME}\"}' # python set syntax

 # Resource limits for JupyterLab containers. Resource limits can be set per Magpie user or group.
-# The value for this variable is a whitespace delimited string. Each section is delimited by colons (:)
-# where the first element is either `group` or `user` and the second element is the name of the user or group
-# to apply the limits to. The rest are resource limits of the form `limit=amount`. For example:
-#
-# export JUPYTERHUB_RESOURCE_LIMITS="
-#   user:user1:mem_limit=30G
-#   group:group1:mem_limit=10G:cpu_limit=1
-#   group:group2:cpu_limit=3
-# "
-#
-# Supported limits are: `mem_limit` and `cpu_limit`. See the Jupyterhub Dockerspawner documentation
-# for details and supported values.
-# Note that this will not create the groups in Magpie, that must be done manually.
-# Note that if a user belongs to multiple groups, later values in `JUPYTERHUB_RESOURCE_LIMITS` will take
-# precedence. For example, if a user named user1 belongs to group1 and group2 then the following limits will apply:
+# The value for this variable is a yaml or JSON array of mappings with the following keys: "type" (either "user"
+# or "group"), "name" (the name of the group or user to apply the limits to) and "limits" (see below). For example:
+# export JUPYTERHUB_RESOURCE_LIMITS='
+# [
+#   {"type": "user", "name": "user1", "limits": {"mem_limit": "30G"}},
+#   {"type": "group", "name": "group1", "limits": {"mem_limit": "10G", "cpu_limit": 1}},
+#   {"type": "group", "name": "group2", "limits": {"cpu_limit": 3, "gpu_ids": [0, 3, 4]}},
+#   {"type": "user", "name": "user2", "limits": {"gpu_ids": [1, 2, 3], "gpu_count": 2}}
+# ]
+# '
+# Supported limits are: "mem_limit", "cpu_limit", "gpu_count", "gpu_ids".
+# For a JSON schema describing the structure of this JSON array see
+# birdhouse/components/jupyterhub/resource-limit.schema.json
+# See the Jupyterhub Dockerspawner documentation
+# for details and supported values for mem_limit and cpu_limit.
+# - https://jupyterhub-dockerspawner.readthedocs.io/en/latest/api/index.html#dockerspawner.DockerSpawner.cpu_limit
+# - https://jupyterhub-dockerspawner.readthedocs.io/en/latest/api/index.html#dockerspawner.DockerSpawner.mem_limit
+# gpu_ids are an array of the GPU uuids or zero based indexes of the GPUs that you want to make available
+# to the user or group. GPU uuids and indexes can be discovered by running the `nvidia-smi --list-gpus` command.
+# If gpu_count is also specified, this is an integer indicating how many GPUs to make available to that user or group.
+# If gpu_count is not specified, then exactly one GPU will be randomly selected.
+# For example, if {"gpu_ids": [1,2,6], "gpu_count": 2} then two GPUs will be randomly selected from the gpu_ids list.
+# Note that this will not create the groups in Magpie, that must be done manually.
+# Note that if a user belongs to multiple groups, later values in `JUPYTERHUB_RESOURCE_LIMITS` will take
+# precedence. For example, if a user named user1 belongs to group1 and group2 then the following limits will apply:
 # - mem_limit=10G (because group1 is later in the list)
 # - cpu_limit=3 (because group2 is later in the list)
-export JUPYTERHUB_RESOURCE_LIMITS=
```
|
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Thinking about this last night, can you just restore the default empty value here? All default values should be in a corresponding The commented out value in If you want to avoid duplicating all the documentations for that var in
Collaborator
Author
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Sure, we really need to write down some of these policies somewhere
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Absolutely agree, added #620 before I forget. |
```diff
+# - gpu_ids=0,3,4
+export JUPYTERHUB_RESOURCE_LIMITS='[]'
```
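The precedence rule documented above (later entries in `JUPYTERHUB_RESOURCE_LIMITS` override earlier ones, per limit key) can be sketched in plain Python. This is an illustration only, not the actual spawner hook; the user name, group memberships, and rules below are hypothetical examples:

```python
import json

# The documented example: user1 belongs to both group1 and group2
rules = json.loads("""
[
  {"type": "group", "name": "group1", "limits": {"mem_limit": "10G", "cpu_limit": 1}},
  {"type": "group", "name": "group2", "limits": {"cpu_limit": 3}}
]
""")

user_name, user_groups = "user1", {"group1", "group2"}

effective = {}
for rule in rules:
    matches = (rule["type"] == "user" and rule["name"] == user_name) or \
              (rule["type"] == "group" and rule["name"] in user_groups)
    if matches:
        # Later rules override earlier ones, but only for the keys they set
        effective.update(rule["limits"])

# mem_limit comes from group1, cpu_limit from the later group2 rule
assert effective == {"mem_limit": "10G", "cpu_limit": 3}
```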
|
```diff
 export DELAYED_EVAL="
 $DELAYED_EVAL
```
```diff
@@ -1,8 +1,11 @@
 import os
 from os.path import join
 import logging
+import random
 import subprocess

+import docker
+import yaml
 from dockerspawner import DockerSpawner

 c = get_config()  # noqa # can be called directy without import because injected by IPython

@@ -137,10 +140,18 @@ if os.environ['WORKSPACE_DIR'] != jupyterhub_data_dir:
 container_gdrive_settings_path = join(container_home_dir, ".jupyter/lab/user-settings/@jupyterlab/google-drive/drive.jupyterlab-settings")
 host_gdrive_settings_path = os.environ['JUPYTER_GOOGLE_DRIVE_SETTINGS']

-# resource_limits: dict[tuple[Literal["user", "group"], str], dict[Literal["cpu_limit", "mem_limit"], str]]
-resource_limits = {tuple(lim[:2]): dict(li.split("=") for li in lim[2:] if "=" in li)
-                   for limit in """${JUPYTERHUB_RESOURCE_LIMITS}""".strip().split()
-                   if (lim := limit.split(":"))}
+# class LimitDict(TypedDict):
+#     mem_limit: NotRequired[str | int]
+#     cpu_limit: NotRequired[str | float | int]
+#     gpu_ids: NotRequired[list[int | str]]
+#     gpu_count: NotRequired[int]
+#
+# class LimitRule(TypedDict):
+#     type: Literal["user", "group"]
+#     name: str
+#     limits: LimitDict
+# resource_limits: LimitRule
+resource_limits = yaml.safe_load("""${JUPYTERHUB_RESOURCE_LIMITS}""")
```
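Because the value is parsed with `yaml.safe_load`, the variable accepts either JSON or YAML syntax (JSON is a subset of YAML 1.2). A quick sketch, assuming PyYAML is installed:

```python
import yaml

# JSON form, as shown in the documentation above
rules = yaml.safe_load('[{"type": "user", "name": "user1", "limits": {"mem_limit": "30G"}}]')
assert rules[0]["limits"]["mem_limit"] == "30G"

# The equivalent YAML block form parses to the same structure
rules_yaml = yaml.safe_load("""
- type: user
  name: user1
  limits: {mem_limit: 30G}
""")
assert rules_yaml == rules
```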
```diff

 if len(host_gdrive_settings_path) > 0:
     c.DockerSpawner.volumes[host_gdrive_settings_path] = {
```
|
|
```diff
@@ -183,14 +194,28 @@ def limit_resource_hook(spawner):
         spawner.mem_limit = os.environ['JUPYTER_DEMO_USER_MEM_LIMIT']

     user_groups = {g.name for g in spawner.user.groups}
-    for (name_type, name), limits in resource_limits.items():
-        if (name_type == "user" and name == spawner.user.name) or (name_type == "group" and name in user_groups):
-            for limit, value in limits.items():
+    gpu_ids = []
+    gpu_count = 1
+    for rule in resource_limits:
+        rule_type = rule["type"]
+        name = rule["name"]
+        if rule_type == "user" and name == spawner.user.name or rule_type == "group" and name in user_groups:
+            for limit, value in rule["limits"].items():
                 if limit == "cpu_limit":
-                    spawner.cpu_limit = float(value)
+                    spawner.cpu_limit = value
                 elif limit == "mem_limit":
                     spawner.mem_limit = value
+                elif limit == "gpu_ids":
+                    gpu_ids = value
+                elif limit == "gpu_count":
+                    gpu_count = value
+    if gpu_ids:
+        # randomly assign GPUs in an attempt to evenly distribute GPU resources
+        random.shuffle(gpu_ids)
+        gpu_ids = gpu_ids[:gpu_count]
+        spawner.extra_host_config["device_requests"] = [
+            docker.types.DeviceRequest(device_ids=gpu_ids, capabilities=[["gpu"]])
```
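The selection step above (shuffle the allowed IDs, then take the first `gpu_count`) can be exercised in isolation. `select_gpus` is a hypothetical helper extracted for illustration, not a function that exists in this config:

```python
import random

def select_gpus(gpu_ids, gpu_count=1):
    # Shuffle a copy so repeated spawns tend to spread users across
    # the allowed GPUs, then hand out at most gpu_count of them.
    ids = list(gpu_ids)
    random.shuffle(ids)
    return ids[:gpu_count]

# Matches the documented example: pick 2 GPUs out of [1, 2, 6]
chosen = select_gpus([1, 2, 6], gpu_count=2)
assert len(chosen) == 2
assert set(chosen) <= {1, 2, 6}
```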
|
Collaborator:
Oh! So if we forgot to specify Please document this default behavior.

Collaborator:
Now the reverse. With the new default So we have to remember to set Should add this default behavior to the documentation or keep the default to

Collaborator (Author):
correct

It's extra confusing if the default behaviour is different for users and groups, we should be consistent.

Collaborator:
Agreed to keep same default behavior for consistency. I just find it more natural if we are giving multiples But it's fine. Keep it that way. There is no perfect solution.

Member:
This is because you are thinking in terms of "allocation", but GPUs are usually configured in terms of "availability", because it is very expensive to assign these resources and have them sitting there locked and unused by a single user. Typically, GPU requests are conservative (if any provided at all by default), and users have to explicitly ask for one/many and/or specific capabilities/VRAM according to their use case. If we were adding a

Collaborator (Author):
Yes I'd eventually like to make use of an options form where users can request up to a certain amount of resources instead of just automatically giving them the maximum they're allowed according to these rules. We could also free up resources early by setting limits on how long a user can keep a resource (i.e. user X is allowed to request 3 GPUs but we'll kill their container after 2 hours). Think of this as similar to "salloc -p archiveshort" on scinet to get synchronous access to one of the compute nodes for a short period of time. I've got lots of ideas for how to extend this and try to make it "fair" to users who are all sharing resources. My main goal is to give the node administrator the freedom to set the resources however they want. BUT we should provide documentation that gives good advice and a reasonable starting configuration. For this PR, the goal is simply to incorporate GPUs into the jupyterhub resource allocation mechanism
```diff
+        ]

 def pre_spawn_hook(spawner):
     create_dir_hook(spawner)
```
New file `birdhouse/components/jupyterhub/resource-limit.schema.json` (the schema referenced in the variable documentation):

```json
{
  "type": "array",
  "items": {
    "type": "object",
    "properties": {
      "type": {
        "type": "string",
        "enum": ["user", "group"]
      },
      "name": {
        "type": "string",
        "pattern": "^.+$"
      },
      "limits": {
        "type": "object",
        "properties": {
          "mem_limit": {"type": "string"},
          "cpu_limit": {"type": "number"},
          "gpu_ids": {"type": "array"},
          "gpu_count": {"type": "number"}
        },
        "dependentRequired": {
          "gpu_count": ["gpu_ids"]
        },
        "additionalProperties": false
      }
    },
    "required": ["type", "name", "limits"]
  }
}
```
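The `dependentRequired` clause encodes the rule that `gpu_count` is only meaningful alongside `gpu_ids`. A minimal stdlib sketch of that one constraint (hypothetical `check_limits` helper; real validation of the full schema would use a JSON Schema library such as `jsonschema`):

```python
def check_limits(limits):
    """Return error messages for a single "limits" mapping."""
    errors = []
    allowed = {"mem_limit", "cpu_limit", "gpu_ids", "gpu_count"}
    for key in limits:
        # mirrors "additionalProperties": false
        if key not in allowed:
            errors.append("unknown limit: " + key)
    # mirrors "dependentRequired": {"gpu_count": ["gpu_ids"]}
    if "gpu_count" in limits and "gpu_ids" not in limits:
        errors.append("gpu_count requires gpu_ids")
    return errors

assert check_limits({"gpu_ids": [0, 1], "gpu_count": 2}) == []
assert check_limits({"gpu_count": 2}) == ["gpu_count requires gpu_ids"]
```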