From 97086ec35f967332b2f5e3fe7d0e5a193b741974 Mon Sep 17 00:00:00 2001 From: Kevin Klues Date: Mon, 20 Sep 2021 17:14:42 +0200 Subject: [PATCH 1/2] Update to latest cuda base images Signed-off-by: Kevin Klues --- deployments/gpu-operator/Makefile | 2 +- deployments/systemd/packages/Makefile | 6 +++--- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/deployments/gpu-operator/Makefile b/deployments/gpu-operator/Makefile index 78427b44..c0339b46 100644 --- a/deployments/gpu-operator/Makefile +++ b/deployments/gpu-operator/Makefile @@ -16,7 +16,7 @@ VERSION ?= v0.1.2 DOCKER ?= docker GOLANG_VERSION ?= 1.15 -CUDA_BASE_IMAGE ?= nvcr.io/nvidia/cuda:11.4.1-base +CUDA_BASE_IMAGE ?= nvcr.io/nvidia/cuda:11.4.2-base BUILD_DIR ?= ../.. ifeq ($(IMAGE),) diff --git a/deployments/systemd/packages/Makefile b/deployments/systemd/packages/Makefile index 3796f8db..e4256f78 100644 --- a/deployments/systemd/packages/Makefile +++ b/deployments/systemd/packages/Makefile @@ -51,7 +51,7 @@ ubuntu18.04: --build-arg PACKAGE_VERSION=$(VERSION) \ --build-arg PACKAGE_REVISION=$(REVISION) \ --build-arg GOLANG_VERSION=$(GOLANG_VERSION) \ - --build-arg BASE_IMAGE=nvcr.io/nvidia/cuda:11.4.1-base-ubuntu18.04 \ + --build-arg BASE_IMAGE=nvcr.io/nvidia/cuda:11.4.2-base-ubuntu18.04 \ --tag $(IMAGE):v$(VERSION)-ubuntu18.04 \ --file Dockerfile.ubuntu \ $(BUILD_DIR) @@ -65,7 +65,7 @@ ubuntu20.04: --build-arg PACKAGE_VERSION=$(VERSION) \ --build-arg PACKAGE_REVISION=$(REVISION) \ --build-arg GOLANG_VERSION=$(GOLANG_VERSION) \ - --build-arg BASE_IMAGE=nvcr.io/nvidia/cuda:11.4.1-base-ubuntu20.04 \ + --build-arg BASE_IMAGE=nvcr.io/nvidia/cuda:11.4.2-base-ubuntu20.04 \ --tag $(IMAGE):v$(VERSION)-ubuntu20.04 \ --file Dockerfile.ubuntu \ $(BUILD_DIR) @@ -79,7 +79,7 @@ ubi8: --build-arg PACKAGE_VERSION=$(VERSION) \ --build-arg PACKAGE_REVISION=$(REVISION) \ --build-arg GOLANG_VERSION=$(GOLANG_VERSION) \ - --build-arg BASE_IMAGE=nvcr.io/nvidia/cuda:11.4.1-base-ubi8 \ + --build-arg BASE_IMAGE=nvcr.io/nvidia/cuda:11.4.2-base-ubi8 \ --tag $(IMAGE):v$(VERSION)-ubi8 \ --file Dockerfile.ubi8 \ $(BUILD_DIR) From b6077469703cb9561bded5da333be3af64c1f6fd Mon Sep 17 00:00:00 2001 From: Kevin Klues Date: Mon, 20 Sep 2021 17:20:03 +0200 Subject: [PATCH 2/2] Bump to v0.1.3 Signed-off-by: Kevin Klues --- cmd/main.go | 2 +- deployments/gpu-operator/Makefile | 2 +- .../gpu-operator/nvidia-mig-manager-example.yaml | 2 +- deployments/systemd/packages/Makefile | 2 +- deployments/systemd/packages/debian/changelog | 10 ++++++++++ .../systemd/packages/rpm/SPECS/nvidia-mig-manager.spec | 7 +++++++ 6 files changed, 21 insertions(+), 4 deletions(-) diff --git a/cmd/main.go b/cmd/main.go index 0e50c8af..c7a15894 100644 --- a/cmd/main.go +++ b/cmd/main.go @@ -40,7 +40,7 @@ func main() { c.UseShortOptionHandling = true c.EnableBashCompletion = true c.Usage = "Manage MIG partitions across the full set of NVIDIA GPUs on a node" - c.Version = "0.1.2" + c.Version = "0.1.3" // Setup the flags for this command c.Flags = []cli.Flag{ diff --git a/deployments/gpu-operator/Makefile b/deployments/gpu-operator/Makefile index c0339b46..fbd4223b 100644 --- a/deployments/gpu-operator/Makefile +++ b/deployments/gpu-operator/Makefile @@ -12,7 +12,7 @@ # See the License for the specific language governing permissions and # limitations under the License. -VERSION ?= v0.1.2 +VERSION ?= v0.1.3 DOCKER ?= docker GOLANG_VERSION ?= 1.15 diff --git a/deployments/gpu-operator/nvidia-mig-manager-example.yaml b/deployments/gpu-operator/nvidia-mig-manager-example.yaml index 9c5d1820..9402b312 100644 --- a/deployments/gpu-operator/nvidia-mig-manager-example.yaml +++ b/deployments/gpu-operator/nvidia-mig-manager-example.yaml @@ -21,7 +21,7 @@ spec: serviceAccountName: gpu-operator containers: - name: nvidia-mig-manager - image: nvcr.io/nvidia/k8s-mig-manager:v0.1.2-ubi8 + image: nvcr.io/nvidia/k8s-mig-manager:v0.1.3-ubi8 imagePullPolicy: IfNotPresent env: - name: NODE_NAME diff --git a/deployments/systemd/packages/Makefile b/deployments/systemd/packages/Makefile index e4256f78..c4cc35df 100644 --- a/deployments/systemd/packages/Makefile +++ b/deployments/systemd/packages/Makefile @@ -13,7 +13,7 @@ # limitations under the License. NAME = nvidia-mig-manager -VERSION ?= 0.1.2 +VERSION ?= 0.1.3 REVISION ?= 1 DOCKER ?= docker diff --git a/deployments/systemd/packages/debian/changelog b/deployments/systemd/packages/debian/changelog index 0ede7b0e..abc93788 100644 --- a/deployments/systemd/packages/debian/changelog +++ b/deployments/systemd/packages/debian/changelog @@ -1,3 +1,13 @@ +nvidia-mig-manager (0.1.3-1) UNRELEASED; urgency=medium + + * Add default configs for the PG506-96GB card + * Remove CombinedMigManager and add wrappers for Mode/Config Managers + * Add a function to check the minimum NVML version required + * Add SystemGetNVMLVersion() to the NVML interface + * Fix small bug in assert logic for non MIG-capable GPUs + + -- NVIDIA CORPORATION Mon, 20 Sep 2021 17:16:26 +0000 + nvidia-mig-manager (0.1.2-1) UNRELEASED; urgency=medium * Do not start nvidia-mig-manager.service when installing the .deb diff --git a/deployments/systemd/packages/rpm/SPECS/nvidia-mig-manager.spec b/deployments/systemd/packages/rpm/SPECS/nvidia-mig-manager.spec index 5d8ec70c..ad3e8de7 100644 --- a/deployments/systemd/packages/rpm/SPECS/nvidia-mig-manager.spec +++ b/deployments/systemd/packages/rpm/SPECS/nvidia-mig-manager.spec @@ -81,6 +81,13 @@ systemctl disable nvidia-mig-manager.service systemctl daemon-reload %changelog +* Mon Sep 20 2021 NVIDIA CORPORATION 0.1.3-1 +- Add default configs for the PG506-96GB card +- Remove CombinedMigManager and add wrappers for Mode/Config Managers +- Add a function to check the minimum NVML version required +- Add SystemGetNVMLVersion() to the NVML interface +- Fix small bug in assert logic for non MIG-capable GPUs + * Thu Aug 05 2021 NVIDIA CORPORATION 0.1.2-1 - Do not start nvidia-mig-manager.service when installing the .deb - Restore lost assert_gpu_reset_available() function