更多kubernetes文章:k8s专栏目录
版本
1.9.0
namespace限制gpu
[root@tensorflow1 gpu-namespace]# cat compute-resources2.yaml
apiVersion: v1
kind: ResourceQuota
metadata:
  name: compute-resources
spec:
  hard:
    #pods: "4"
    #requests.cpu: "1"
    #requests.memory: 1Gi
    #limits.cpu: "2"
    #limits.memory: 2Gi
kubectl create -f compute-resources2.yaml
kubectl get quota
kubectl describe quota compute-resources
kubectl delete quota compute-resources
先创建namespace,再在该namespace上增加限制;这里是在default namespace下增加限制。
- docker里面没vi等基本命令
echo "nameserver 192.168.1.254" > /etc/resolv.conf
apt-get update
apt install net-tools # ifconfig
apt install iputils-ping # ping
apt install vim # vi
启动gpu任务
Warning FailedScheduling 3s (x7 over 34s) default-scheduler 0/3 nodes are available: 1 PodToleratesNodeTaints, 3 Insufficient nvidia.com/gpu.
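- 调整副本数(注意:DaemonSet没有scale子资源,kubectl scale只适用于Deployment/ReplicaSet/ReplicationController/StatefulSet;DaemonSet会在每个符合条件的node上各运行一个pod,需要通过nodeSelector等方式控制运行的node)
kubectl scale ds/kube-flannel-ds --replicas=1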
- 在指定node上启动容器
增加参数 nodeName: xxxx
eg:
apiVersion: v1
kind: Pod
metadata:
  name: cuda-vector-add
spec:
  restartPolicy: OnFailure
  containers:
    - name: cuda-vector-add
      image: "nfs:5000/tensorflow/tensorflow:nightly"
      #resources:
        #limits:
          #nvidia.com/gpu: 1 # requesting 1 GPU
  nodeName: tensorflow1