From f04181b078a439ec873e8183bbb9a72826eb7be4 Mon Sep 17 00:00:00 2001 From: Kevin Pouget Date: Tue, 14 Jun 2022 17:17:13 +0200 Subject: [PATCH] DGX-A100_GPU-Operator_testing: cluster_setup.md: new file --- .../cluster_setup.md | 165 ++++++++++++++++++ 1 file changed, 165 insertions(+) create mode 100644 DGX-A100_GPU-Operator_testing/cluster_setup.md diff --git a/DGX-A100_GPU-Operator_testing/cluster_setup.md b/DGX-A100_GPU-Operator_testing/cluster_setup.md new file mode 100644 index 0000000..3106734 --- /dev/null +++ b/DGX-A100_GPU-Operator_testing/cluster_setup.md @@ -0,0 +1,165 @@ +# Prepare the cluster operators + +1. Install NFD Operator + - don't forget to create the NodeFeatureDiscoveries + +2. Install the NVIDIA GPU Operator + - don't forget to create the ClusterPolicy + +3. Install the Local Storage Operator + - see next step for the creation of a LocalVolume + +# Setup the storage + +1. Create the local disk storage class + +``` +DISK_DEV=/dev/nvme2n1 +STORAGE_CLASS_NAME=local-sc-dgx +NODE_NAME=dgxa100 + +cat <