val progress

tylertitsworth · tylertitsworth · commit 5cc2e18504ae · 2024-08-29T14:52:15.000-07:00
Signed-off-by: tylertitsworth <tyler.titsworth@intel.com>
diff --git a/workflows/charts/tensorflow-serving/README.md b/workflows/charts/tensorflow-serving/README.md
@@ -17,23 +17,16 @@ TensorFlow Serving is a flexible, high-performance serving system for machine le
 | deploy.env | object | `{"configMapName":"intel-proxy-config","enabled":true}` | Add Environment mapping |
 | deploy.image | string | `"intel/intel-extension-for-tensorflow:serving-gpu"` | Intel Extension for Tensorflow Serving image |
 | deploy.modelName | string | `""` | Model Name |
-| deploy.modelPath | string | `"/serving"` | Path to Model Folder |
 | deploy.replicas | int | `1` | Number of pods |
 | deploy.resources.limits | object | `{"cpu":"4000m","gpu.intel.com/i915":1,"memory":"1Gi"}` | Maximum resources per pod |
 | deploy.resources.limits."gpu.intel.com/i915" | int | `1` | Intel GPU Device Configuration |
 | deploy.resources.requests | object | `{"cpu":"1000m","memory":"512Mi"}` | Minimum resources per pod |
-| deploy.storage.nfs | object | `{"enabled":false,"path":"nil","readOnly":true,"server":"nil","subPath":"nil"}` | Network File System (NFS) storage for models |
+| deploy.storage.nfs | object | `{"enabled":false,"path":"nil","readOnly":true,"server":"nil"}` | Network File System (NFS) storage for models |
 | fullnameOverride | string | `""` | Full qualified Domain Name |
-| ingress.annotations | object | `{}` |  |
-| ingress.className | string | `""` |  |
-| ingress.enabled | bool | `false` |  |
-| ingress.hosts[0].host | string | `"chart-example.local"` |  |
-| ingress.hosts[0].paths[0].path | string | `"/"` |  |
-| ingress.hosts[0].paths[0].pathType | string | `"ImplementationSpecific"` |  |
-| ingress.tls | list | `[]` |  |
 | nameOverride | string | `""` | Name of the serving service |
-| pvc.size | string | `"1Gi"` | Size of the storage |
-| service.port | int | `9090` | Port of the service |
+| pvc.size | string | `"5Gi"` | Size of the storage |
+| service.grpcPort | int | `8500` | gRPC port of the service |
+| service.restPort | int | `8501` | REST API port of the service |
 | service.type | string | `"NodePort"` | Type of service |
 
 ----------------------------------------------
diff --git a/workflows/charts/tensorflow-serving/templates/NOTES.txt b/workflows/charts/tensorflow-serving/templates/NOTES.txt
@@ -1,11 +1,5 @@
 1. Get the application URL by running these commands:
-{{- if .Values.ingress.enabled }}
-{{- range $host := .Values.ingress.hosts }}
-  {{- range .paths }}
-  http{{ if $.Values.ingress.tls }}s{{ end }}://{{ $host.host }}{{ .path }}
-  {{- end }}
-{{- end }}
-{{- else if contains "NodePort" .Values.service.type }}
+{{- if contains "NodePort" .Values.service.type }}
   export NODE_PORT=$(kubectl get --namespace {{ .Release.Namespace }} -o jsonpath="{.spec.ports[0].nodePort}" services {{ include "tensorflow-serving.fullname" . }})
   export NODE_IP=$(kubectl get nodes --namespace {{ .Release.Namespace }} -o jsonpath="{.items[0].status.addresses[0].address}")
   echo http://$NODE_IP:$NODE_PORT
@@ -20,3 +14,6 @@
   echo "Visit http://127.0.0.1:8080 to use your application"
   kubectl --namespace {{ .Release.Namespace }} port-forward $POD_NAME 8080:$CONTAINER_PORT
 {{- end }}
+2. Make a prediction
+  curl http://$NODE_IP:$NODE_PORT/v1/models/{{ .Values.deploy.modelName }}
+  curl -X POST http://$NODE_IP:$NODE_PORT/v1/models/{{ .Values.deploy.modelName }}:predict -d '{"instances": []}'
diff --git a/workflows/charts/tensorflow-serving/templates/deployment.yaml b/workflows/charts/tensorflow-serving/templates/deployment.yaml
@@ -11,17 +11,16 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-
+{{- $name := .Values.deploy.modelName | required ".Values.deploy.modelName is required." -}}
+---
 apiVersion: apps/v1
 kind: Deployment
 metadata:
   name: {{ include "tensorflow-serving.fullname" . }}
   labels:
     {{- include "tensorflow-serving.labels" . | nindent 4 }}
 spec:
-  {{- if not .Values.autoscaling.enabled }}
   replicas: {{ .Values.deploy.replicas }}
-  {{- end }}
   selector:
     matchLabels:
       {{- include "tensorflow-serving.selectorLabels" . | nindent 6 }}
@@ -44,21 +43,20 @@ spec:
           env:
             - name: MODEL_NAME
               value: {{ .Values.deploy.modelName }}
-            - name: MODEL_DIR
-              value: {{ .Values.deploy.modelPath }}
           ports:
-            - name: serving
-              containerPort: {{ .Values.service.port }}
+            - name: rest
+              containerPort: {{ .Values.service.restPort }}
+            - name: grpc
+              containerPort: {{ .Values.service.grpcPort }}
           volumeMounts:
             - mountPath: /dev/shm
               name: dshm
           {{- if .Values.deploy.storage.nfs.enabled }}
             - name: model
-              mountPath: /home/model-server/model-store
-              subPath: {{ .Values.deploy.storage.nfs.subPath }}
+              mountPath: /models/{{ .Values.deploy.modelName }}
           {{- else }}
             - name: model
-              mountPath: /home/model-server/model-store
+              mountPath: /models/{{ .Values.deploy.modelName }}
           {{- end }}
           resources:
             {{- toYaml .Values.deploy.resources | nindent 12 }}
@@ -72,7 +70,6 @@ spec:
             server: {{ .Values.deploy.storage.nfs.server }}
             path: {{ .Values.deploy.storage.nfs.path }}
             readOnly: {{ .Values.deploy.storage.nfs.readOnly }}
-          emptyDir: {}
       {{- else }}
         - name: model
           persistentVolumeClaim:
diff --git a/workflows/charts/tensorflow-serving/templates/ingress.yaml b/workflows/charts/tensorflow-serving/templates/ingress.yaml
diff --git a/workflows/charts/tensorflow-serving/templates/pvc.yaml b/workflows/charts/tensorflow-serving/templates/pvc.yaml
@@ -0,0 +1,29 @@
+# Copyright (c) 2024 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+---
+{{- if not .Values.deploy.storage.nfs.enabled }}
+apiVersion: v1
+kind: PersistentVolumeClaim
+metadata:
+  name: {{ include "tensorflow-serving.fullname" . }}-model-dir
+  labels:
+    {{- include "tensorflow-serving.labels" . | nindent 4 }}
+spec:
+  accessModes:
+    - ReadWriteMany
+  resources:
+    requests:
+      storage: {{ .Values.pvc.size }}
+{{- end }}
diff --git a/workflows/charts/tensorflow-serving/templates/service.yaml b/workflows/charts/tensorflow-serving/templates/service.yaml
@@ -21,8 +21,11 @@ metadata:
 spec:
   type: {{ .Values.service.type }}
   ports:
-    - name: serving
-      port: {{ .Values.service.port }}
-      targetPort: serving
+    - name: rest
+      port: {{ .Values.service.restPort }}
+      targetPort: rest
+    - name: grpc
+      port: {{ .Values.service.grpcPort }}
+      targetPort: grpc
   selector:
     {{- include "tensorflow-serving.selectorLabels" . | nindent 4 }}
diff --git a/workflows/charts/tensorflow-serving/templates/tests/test-connection.yaml b/workflows/charts/tensorflow-serving/templates/tests/test-connection.yaml
@@ -22,8 +22,8 @@ metadata:
     "helm.sh/hook": test
 spec:
   containers:
-    - name: wget
-      image: busybox
-      command: ['wget']
-      args: ['{{ include "tensorflow-serving.fullname" . }}:{{ .Values.service.port }}']
-  restartPolicy: Never
+    - name: info
+      image: curlimages/curl
+      command: ['sh', '-c']
+      args: ['curl -f {{ include "tensorflow-serving.fullname" . }}:{{ .Values.service.restPort }}/v1/models/{{ .Values.deploy.modelName }}']
+  restartPolicy: OnFailure
diff --git a/workflows/charts/tensorflow-serving/values.yaml b/workflows/charts/tensorflow-serving/values.yaml
@@ -25,8 +25,6 @@ deploy:
     enabled: true
   # -- Model Name
   modelName: ""
-  # -- Path to Model Folder
-  modelPath: /serving
   # -- Number of pods
   replicas: 1
   resources:
@@ -47,27 +45,12 @@ deploy:
       server: nil
       path: nil
       readOnly: true
-      subPath: nil
 service:
   # -- Type of service
   type: NodePort
   # -- Port of the service
-  port: 9090
+  restPort: 8501
+  grpcPort: 8500
 pvc:
   # -- Size of the storage
-  size: 1Gi
-ingress:
-  enabled: false
-  className: ""
-  annotations: {}
-  # kubernetes.io/ingress.class: nginx
-  # kubernetes.io/tls-acme: "true"
-  hosts:
-  - host: chart-example.local
-    paths:
-    - path: /
-      pathType: ImplementationSpecific
-  tls: []
-  #  - secretName: chart-example-tls
-  #    hosts:
-  #      - chart-example.local
+  size: 5Gi
diff --git a/workflows/charts/tgi/templates/tests/test-connection.yaml b/workflows/charts/tgi/templates/tests/test-connection.yaml
@@ -25,5 +25,5 @@ spec:
     - name: info
       image: curlimages/curl
       command: ['sh', '-c']
-      args: ['curl --noproxy "*" -f {{ include "tgi.fullname" . }}:{{ .Values.service.port }}/info']
+      args: ['curl -f {{ include "tgi.fullname" . }}:{{ .Values.service.port }}/info']
   restartPolicy: OnFailure