Skip to content

Commit

Permalink
Add bare-metal GPU runtime class
Browse files Browse the repository at this point in the history
This adds a runtime class that corresponds to the GPU-enabled runtime for
Contrast on bare-metal platforms, both for the local just-based deployments
and for the release artifacts.
  • Loading branch information
msanft committed Jan 22, 2025
1 parent 2771f21 commit 5255d32
Show file tree
Hide file tree
Showing 7 changed files with 46 additions and 11 deletions.
4 changes: 4 additions & 0 deletions .github/workflows/release.yml
Original file line number Diff line number Diff line change
Expand Up @@ -247,6 +247,7 @@ jobs:
coordinatorImg=$(nix run .#containers.push-coordinator -- "$container_registry/contrast/coordinator")
nodeInstallerMsftImg=$(nix run .#containers.push-node-installer-microsoft -- "$container_registry/contrast/node-installer-microsoft")
nodeInstallerKataImg=$(nix run .#containers.push-node-installer-kata -- "$container_registry/contrast/node-installer-kata")
# Push the GPU-enabled node installer to its own repository so it does not share (and overwrite) version tags with the non-GPU kata image.
nodeInstallerKataGPUImg=$(nix run .#containers.push-node-installer-kata-gpu -- "$container_registry/contrast/node-installer-kata-gpu")
initializerImg=$(nix run .#containers.push-initializer -- "$container_registry/contrast/initializer")
serviceMeshImg=$(nix run .#containers.push-service-mesh-proxy -- "$container_registry/contrast/service-mesh-proxy")
tardevSnapshotterImg=$(nix run .#containers.push-tardev-snapshotter -- "$container_registry/contrast/tardev-snapshotter")
Expand All @@ -256,6 +257,7 @@ jobs:
echo "coordinatorImg=$coordinatorImg" | tee -a "$GITHUB_ENV"
echo "nodeInstallerMsftImg=$nodeInstallerMsftImg" | tee -a "$GITHUB_ENV"
echo "nodeInstallerKataImg=$nodeInstallerKataImg" | tee -a "$GITHUB_ENV"
echo "nodeInstallerKataGPUImg=$nodeInstallerKataGPUImg" | tee -a "$GITHUB_ENV"
echo "initializerImg=$initializerImg" | tee -a "$GITHUB_ENV"
echo "serviceMeshImg=$serviceMeshImg" | tee -a "$GITHUB_ENV"
echo "tardevSnapshotterImg=$tardevSnapshotterImg" | tee -a "$GITHUB_ENV"
Expand All @@ -272,6 +274,7 @@ jobs:
echo "coordinatorImgTagged=$(tag "$coordinatorImg")" | tee -a "$GITHUB_ENV"
echo "nodeInstallerMsftImgTagged=$(tag "$nodeInstallerMsftImg")" | tee -a "$GITHUB_ENV"
echo "nodeInstallerKataImgTagged=$(tag "$nodeInstallerKataImg")" | tee -a "$GITHUB_ENV"
echo "nodeInstallerKataGPUImgTagged=$(tag "$nodeInstallerKataGPUImg")" | tee -a "$GITHUB_ENV"
echo "initializerImgTagged=$(tag "$initializerImg")" | tee -a "$GITHUB_ENV"
echo "serviceMeshImgTagged=$(tag "$serviceMeshImg")" | tee -a "$GITHUB_ENV"
echo "nydusPullImgTagged=$(tag "$nydusPullImg")" | tee -a "$GITHUB_ENV"
Expand All @@ -294,6 +297,7 @@ jobs:
echo "ghcr.io/edgelesssys/contrast/service-mesh-proxy:latest=$serviceMeshImgTagged"
echo "ghcr.io/edgelesssys/contrast/node-installer-microsoft:latest=$nodeInstallerMsftImgTagged"
echo "ghcr.io/edgelesssys/contrast/node-installer-kata:latest=$nodeInstallerKataImgTagged"
echo "ghcr.io/edgelesssys/contrast/node-installer-kata-gpu:latest=$nodeInstallerKataGPUImgTagged"
echo "ghcr.io/edgelesssys/contrast/tardev-snapshotter:latest=$tardevSnapshotterImgTagged"
echo "ghcr.io/edgelesssys/contrast/nydus-snapshotter:latest=$nydusSnapshotterImgTagged"
echo "ghcr.io/edgelesssys/contrast/nydus-pull:latest=$nydusPullImgTagged"
Expand Down
6 changes: 6 additions & 0 deletions internal/kuberesource/parts.go
Original file line number Diff line number Diff line change
Expand Up @@ -153,6 +153,9 @@ func NodeInstaller(namespace string, platform platforms.Platform) (*NodeInstalle
snapshotterVolumes = tardevSnapshotterVolumes
case platforms.MetalQEMUSNP, platforms.MetalQEMUTDX, platforms.MetalQEMUSNPGPU:
nodeInstallerImageURL = "ghcr.io/edgelesssys/contrast/node-installer-kata:latest"
if platform == platforms.MetalQEMUSNPGPU {
nodeInstallerImageURL = "ghcr.io/edgelesssys/contrast/node-installer-kata-gpu:latest"
}
containers = append(containers, nydusSnapshotter, nydusPull)
nydusSnapshotterVolumes = append(nydusSnapshotterVolumes,
Volume().
Expand All @@ -171,6 +174,9 @@ func NodeInstaller(namespace string, platform platforms.Platform) (*NodeInstalle
snapshotterVolumes = nydusSnapshotterVolumes
case platforms.K3sQEMUTDX, platforms.K3sQEMUSNP, platforms.K3sQEMUSNPGPU, platforms.RKE2QEMUTDX:
nodeInstallerImageURL = "ghcr.io/edgelesssys/contrast/node-installer-kata:latest"
if platform == platforms.K3sQEMUSNPGPU {
nodeInstallerImageURL = "ghcr.io/edgelesssys/contrast/node-installer-kata-gpu:latest"
}
containers = append(containers, nydusSnapshotter, nydusPull)
nydusSnapshotterVolumes = append(nydusSnapshotterVolumes,
Volume().
Expand Down
7 changes: 6 additions & 1 deletion justfile
Original file line number Diff line number Diff line change
Expand Up @@ -50,11 +50,16 @@ node-installer platform=default_platform:
just push "tardev-snapshotter"
just push "node-installer-microsoft"
;;
"Metal-QEMU-SNP"|"Metal-QEMU-TDX"|"Metal-QEMU-SNP-GPU"|"K3s-QEMU-SNP"|"K3s-QEMU-SNP-GPU"|"K3s-QEMU-TDX"|"RKE2-QEMU-TDX")
"Metal-QEMU-SNP"|"Metal-QEMU-TDX"|"K3s-QEMU-SNP"|"K3s-QEMU-TDX"|"RKE2-QEMU-TDX")
just push "nydus-snapshotter"
just push "nydus-pull"
just push "node-installer-kata"
;;
"Metal-QEMU-SNP-GPU"|"K3s-QEMU-SNP-GPU")
just push "nydus-snapshotter"
just push "nydus-pull"
just push "node-installer-kata-gpu"
;;
"AKS-PEER-SNP")
nix run -L .#scripts.deploy-caa -- \
--kustomization=./infra/azure-peerpods/kustomization.yaml \
Expand Down
20 changes: 15 additions & 5 deletions packages/by-name/kata/contrast-node-installer-image/package.nix
Original file line number Diff line number Diff line change
Expand Up @@ -18,9 +18,15 @@
OVMF-TDX,

debugRuntime ? false,
withGPU ? false,
}:

let
os-image = kata.kata-image.override {
inherit withGPU;
withDebug = debugRuntime;
};

node-installer = ociLayerTar {
files = [
{
Expand Down Expand Up @@ -110,7 +116,7 @@ let
}
];
inherit debugRuntime;
qemuExtraKernelParams = kata.kata-image.cmdline;
qemuExtraKernelParams = os-image.cmdline;
};
destination = "/config/contrast-node-install.json";
}
Expand All @@ -120,15 +126,15 @@ let
kata-container-img = ociLayerTar {
files = [
{
source = "${kata.kata-image.image}/${kata.kata-image.imageFileName}";
source = "${os-image.image}/${os-image.imageFileName}";
destination = "/opt/edgeless/share/kata-containers.img";
}
{
source = "${kata.kata-image.kernel}/bzImage";
source = "${os-image.kernel}/bzImage";
destination = "/opt/edgeless/share/kata-kernel";
}
{
source = "${kata.kata-image.initialRamdisk}/initrd";
source = "${os-image.initialRamdisk}/initrd";
destination = "/opt/edgeless/share/kata-initrd.zst";
}
];
Expand Down Expand Up @@ -251,10 +257,14 @@ in
ociImageLayout {
manifests = [ manifest ];
passthru = {
inherit debugRuntime;
inherit debugRuntime os-image;
runtimeHash = hashDirs {
dirs = layers; # Layers without node-installer, or we have a circular dependency!
name = "runtime-hash-kata";
};
gpu = kata.contrast-node-installer-image.override {
inherit debugRuntime;
withGPU = true;
};
};
}
9 changes: 5 additions & 4 deletions packages/by-name/kata/snp-launch-digest/package.nix
Original file line number Diff line number Diff line change
Expand Up @@ -9,25 +9,26 @@
python3Packages,

debug ? false,
os-image ? kata.kata-image,
}:

let
ovmf-snp = "${OVMF-SNP}/FV/OVMF.fd";
kernel = "${kata.kata-image}/bzImage";
initrd = "${kata.kata-image}/initrd";
kernel = "${os-image}/bzImage";
initrd = "${os-image}/initrd";

# Kata uses a base command line and then appends the command line from the kata config (i.e. also our node-installer config).
# Thus, we need to perform the same steps when calculating the digest.
baseCmdline = if debug then kata.kata-runtime.cmdline.debug else kata.kata-runtime.cmdline.default;
cmdline = lib.strings.concatStringsSep " " [
baseCmdline
kata.kata-image.cmdline
os-image.cmdline
];
in

stdenvNoCC.mkDerivation {
name = "snp-launch-digest${lib.optionalString debug "-debug"}";
inherit (kata.kata-image) version;
inherit (os-image) version;

dontUnpack = true;

Expand Down
3 changes: 3 additions & 0 deletions packages/containers.nix
Original file line number Diff line number Diff line change
Expand Up @@ -198,5 +198,8 @@ containers
push-node-installer-kata =
pushOCIDir "push-node-installer-kata" pkgs.kata.contrast-node-installer-image
"v${pkgs.contrast.version}";
push-node-installer-kata-gpu =
pushOCIDir "push-node-installer-kata-gpu" pkgs.kata.contrast-node-installer-image.gpu
"v${pkgs.contrast.version}";
}
// (lib.concatMapAttrs (name: container: { "push-${name}" = pushContainer container; }) containers)
8 changes: 7 additions & 1 deletion packages/nixos/kata.nix
Original file line number Diff line number Diff line change
Expand Up @@ -78,7 +78,13 @@ in
};

# Not used directly, but required for kernel-specific driver builds.
boot.kernelPackages = pkgs.recurseIntoAttrs (pkgs.linuxPackagesFor pkgs.kata-kernel-uvm);
boot.kernelPackages = pkgs.recurseIntoAttrs (
pkgs.linuxPackagesFor (
pkgs.kata-kernel-uvm.override {
withGPU = config.contrast.gpu.enable;
}
)
);

boot.initrd = {
# Don't require TPM2 support. (additional modules)
Expand Down

0 comments on commit 5255d32

Please sign in to comment.