diff --git a/docs/DEVELOPMENT.md b/docs/DEVELOPMENT.md index ed213bfb..1a01e352 100644 --- a/docs/DEVELOPMENT.md +++ b/docs/DEVELOPMENT.md @@ -31,7 +31,7 @@ For fulfilling `xargs` and `kubectl` binary requirements necessary for running s ```bash touch /usr/local/bin/kubectl -echo '#!/bin/bash\nuds zarf tools kubectl "$@"' > /usr/local/bin/kubectl +echo -e '#!/bin/bash\nuds zarf tools kubectl "$@"' > /usr/local/bin/kubectl chmod +x /usr/local/bin/kubectl ``` @@ -138,3 +138,11 @@ For example, this is how you pull and deploy a LATEST version of a package: uds zarf package pull oci://ghcr.io/justinthelaw/packages/uds/uds-rke2/nvidia-gpu-operator:latest -a amd64 uds run deploy:nvidia-gpu-operator ``` + +## Troubleshooting + +If your RKE2 cluster is failing to spin up in the first place, you can use `journalctl` to monitor the progress. Please note that it may take up to 10 minutes for the cluster to spin up and move on to the next step of the UDS RKE2 bundle deployment. + +```bash +journalctl -xef -u rke2-server +``` diff --git a/packages/nvidia-gpu-operator/values/nvidia-gpu-operator-values.yaml b/packages/nvidia-gpu-operator/values/nvidia-gpu-operator-values.yaml index ed07a2fe..562f5d61 100644 --- a/packages/nvidia-gpu-operator/values/nvidia-gpu-operator-values.yaml +++ b/packages/nvidia-gpu-operator/values/nvidia-gpu-operator-values.yaml @@ -66,7 +66,7 @@ validator: driver: # RKE2-specific configurations env: - - name: disable_dev_char_symlink_creation + - name: DISABLE_DEV_CHAR_SYMLINK_CREATION value: "true" - name: NVIDIA_VISIBLE_DEVICES value: all