diff --git a/kubernetes/Helm/templates/torchserve.yaml b/kubernetes/Helm/templates/torchserve.yaml index e8b4b3df0a..e847246100 100644 --- a/kubernetes/Helm/templates/torchserve.yaml +++ b/kubernetes/Helm/templates/torchserve.yaml @@ -42,17 +42,7 @@ spec: volumes: - name: persistent-storage persistentVolumeClaim: - claimName: model-store-claim - initContainers: - - name: volume-ownership - image: alpine:3 - command: - - chown - - root:{{ .Values.securityContext.groupId }} - - {{ .Values.torchserve.pvd_mount }} - volumeMounts: - - name: persistent-storage - mountPath: {{ .Values.torchserve.pvd_mount }} + claimName: {{ .Values.persistentVolume.name }} containers: - name: torchserve image: {{ .Values.torchserve_image }} @@ -73,6 +63,3 @@ spec: cpu: {{ .Values.torchserve.n_cpu }} memory: {{ .Values.torchserve.memory_limit }} nvidia.com/gpu: {{ .Values.torchserve.n_gpu }} - requests: - cpu: {{ .Values.torchserve.n_cpu }} - memory: {{ .Values.torchserve.memory_request }} diff --git a/kubernetes/Helm/values.yaml b/kubernetes/Helm/values.yaml index 8a82b4d085..fb74a4277c 100644 --- a/kubernetes/Helm/values.yaml +++ b/kubernetes/Helm/values.yaml @@ -9,13 +9,12 @@ torchserve: inference_port: 8080 metrics_port: 8082 pvd_mount: /home/model-server/shared/ - n_gpu: 1 - n_cpu: 1 - memory_limit: 4Gi - memory_request: 1Gi + n_gpu: 4 + n_cpu: 16 + memory_limit: 32Gi deployment: replicas: 1 -persitant_volume: - size: 1Gi +persistentVolume: + name: efs-claim