Feature/erwan gitops model (rh-aiservices-bu#34)

erwangranger · web-flow · commit b525a79912e6 · 2023-12-19T23:35:18.000-05:00
* gitops for modelmesh/ovms/model
* removing extraneous lines from applicationset
* pinger pod is not active yet. will need more work.
diff --git a/.github/.wordlist.txt b/.github/.wordlist.txt
@@ -136,3 +136,5 @@ Prasanth
 Anbalagan
 Erwan
 Granger
+applicationset
+imagesdir
diff --git a/bootstrap/applicationset/applicationset-bootstrap.yaml b/bootstrap/applicationset/applicationset-bootstrap.yaml
@@ -8,23 +8,25 @@ spec:
   - list:
       elements:
       - cluster: in-cluster
-        url: https://kubernetes.default.svc
         name: ic-shared-minio-app
         repoURL: https://github.com/rh-aiservices-bu/insurance-claim-processing.git
         targetRevision: dev
         path: bootstrap/ic-shared-minio
       - cluster: in-cluster
-        url: https://kubernetes.default.svc
         name: ic-shared-database-app
         repoURL: https://github.com/rh-aiservices-bu/insurance-claim-processing.git
         targetRevision: dev
         path: bootstrap/ic-shared-database
       - cluster: in-cluster
-        url: https://kubernetes.default.svc
         name: ic-shared-llm-app
         repoURL: https://github.com/rh-aiservices-bu/insurance-claim-processing.git
         targetRevision: dev
         path: bootstrap/ic-shared-llm
+      - cluster: in-cluster
+        name: ic-shared-img-det
+        repoURL: https://github.com/rh-aiservices-bu/insurance-claim-processing.git
+        targetRevision: dev
+        path: bootstrap/ic-shared-img-det
   template:
     metadata:
       name: '{{name}}'
diff --git a/bootstrap/bootstrap.md b/bootstrap/bootstrap.md
@@ -10,6 +10,8 @@ CMD=" oc apply -f ${GITEA_INT_URL}${GITEA_REPO}raw/branch/${GITEA_BRANCH}${GITEA
 
 echo ${CMD}
 
+oc apply -f ./bootstrap/applicationset/applicationset-bootstrap.yaml
+
 ```
 
 <!--
diff --git a/bootstrap/ic-shared-img-det/add-model-job.yaml b/bootstrap/ic-shared-img-det/add-model-job.yaml
@@ -0,0 +1,65 @@
+---
+# Argo CD Sync-hook Job intended for uploading model files to the bucket
+# described by the aws-connection-minio Secret. The upload script is currently
+# commented out, so the container only prints a message and exits.
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: add-model-job
+  annotations:
+    argocd.argoproj.io/sync-wave: "2"
+    # Run as a hook and replace the previous Job on every sync, like
+    # create-data-connection: a Job's pod template is immutable, so re-applying
+    # an edited manifest over an existing Job would be rejected.
+    argocd.argoproj.io/hook: Sync
+    argocd.argoproj.io/hook-delete-policy: BeforeHookCreation
+spec:
+  backoffLimit: 4
+  template:
+    spec:
+      # serviceAccountName alone is sufficient; the serviceAccount field is a
+      # deprecated alias of it.
+      serviceAccountName: sa-img-det-gitops-setup
+      # Disabled init container, kept for reference. The initContainers key is
+      # commented out with it so the manifest does not carry a null value.
+      # initContainers:
+      # - name: wait-for-imagestream
+      #   image: image-registry.openshift-image-registry.svc:5000/openshift/tools:latest
+      #   imagePullPolicy: IfNotPresent
+      #   command: ["/bin/bash"]
+      #   args:
+      #   - -ec
+      #   - |-
+      #     echo -n 'Waiting for RHODS to deploy ImageStreams'
+      #     while ! oc get istag -n redhat-ods-applications 2>/dev/null | grep -qF s2i-generic-data-science-notebook:1.2; do
+      #       echo -n .
+      #       sleep 5
+      #     done; echo
+      containers:
+      - name: add-model
+        image: image-registry.openshift-image-registry.svc:5000/redhat-ods-applications/s2i-generic-data-science-notebook:1.2
+        imagePullPolicy: IfNotPresent
+        command: ["/bin/bash"]
+        args:
+        - -ec
+        - |-
+          # in case we need to add more models, we can do it here too.
+          echo -n "not doing anything right now"
+          # curl -LO https://ai-on-openshift.io/odh-rhods/img-triton/card.fraud.detection.onnx
+          # cat << 'EOF' | python3
+          # filename = "card.fraud.detection.onnx"
+          # import boto3, os
+          # s3 = boto3.client("s3",
+          #                   endpoint_url=os.getenv("AWS_S3_ENDPOINT"),
+          #                   aws_access_key_id=os.getenv("AWS_ACCESS_KEY_ID"),
+          #                   aws_secret_access_key=os.getenv("AWS_SECRET_ACCESS_KEY"))
+          # bucket = os.getenv("AWS_S3_BUCKET")
+          # if bucket not in [bu["Name"] for bu in s3.list_buckets()["Buckets"]]:
+          #   s3.create_bucket(Bucket=bucket)
+          # with open(filename, "rb") as f:
+          #   s3.upload_fileobj(f, bucket, f'fraud/{filename}')
+          # EOF
+        envFrom:
+        - secretRef:
+            name: aws-connection-minio
+      restartPolicy: Never
diff --git a/bootstrap/ic-shared-img-det/create-data-connection.yaml b/bootstrap/ic-shared-img-det/create-data-connection.yaml
@@ -0,0 +1,59 @@
+---
+# Argo CD Sync-hook Job that waits for the minio-root-user Secret in the
+# ic-shared-minio namespace, then writes its credentials into an S3
+# data-connection Secret named aws-connection-minio via `oc apply`.
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: create-data-connection
+  annotations:
+    argocd.argoproj.io/sync-wave: "1"
+    argocd.argoproj.io/hook: Sync
+    argocd.argoproj.io/hook-delete-policy: BeforeHookCreation
+spec:
+  backoffLimit: 4
+  template:
+    spec:
+      # serviceAccountName alone is sufficient; the serviceAccount field is a
+      # deprecated alias of it.
+      serviceAccountName: sa-img-det-gitops-setup
+      containers:
+      - name: create-data-connection
+        image: image-registry.openshift-image-registry.svc:5000/openshift/tools:latest
+        imagePullPolicy: IfNotPresent
+        command: ["/bin/bash"]
+        args:
+        - -ec
+        - |-
+          echo -n "Waiting for minio-root-user."
+          while [ -z "$(oc get secret -n ic-shared-minio minio-root-user -oname 2>/dev/null)" ]; do
+            echo -n '.'
+            sleep 1
+          done; echo
+          id=$(oc get secret -n ic-shared-minio minio-root-user -ogo-template='{{.data.MINIO_ROOT_USER|base64decode}}')
+          secret=$(oc get secret -n ic-shared-minio minio-root-user -ogo-template='{{.data.MINIO_ROOT_PASSWORD|base64decode}}')
+          echo "Creating secret for ${id}"
+          # Quote both credentials: stringData only accepts strings, and an
+          # unquoted value that is all digits or contains ": " or " #" would
+          # be re-typed or cut short by the YAML parser. A value containing
+          # '"' or '\' would still need escaping.
+          cat << EOF | oc apply -f-
+          apiVersion: v1
+          kind: Secret
+          metadata:
+            name: aws-connection-minio
+            labels:
+              opendatahub.io/dashboard: "true"
+              opendatahub.io/managed: "true"
+            annotations:
+              opendatahub.io/connection-type: s3
+              openshift.io/display-name: MinIO
+          type: Opaque
+          stringData:
+            AWS_ACCESS_KEY_ID: "${id}"
+            AWS_SECRET_ACCESS_KEY: "${secret}"
+            AWS_DEFAULT_REGION: us
+            AWS_S3_ENDPOINT: http://minio.ic-shared-minio.svc:9000
+            AWS_S3_BUCKET: models
+          EOF
+      restartPolicy: Never
diff --git a/bootstrap/ic-shared-img-det/kustomization.yaml b/bootstrap/ic-shared-img-det/kustomization.yaml
@@ -0,0 +1,21 @@
+---
+# Kustomize entry point for the ic-shared-img-det manifests.
+apiVersion: kustomize.config.k8s.io/v1beta1
+kind: Kustomization
+
+# Namespace set on the resources listed below.
+namespace: ic-shared-img-det
+
+# Label added to the resources listed below.
+commonLabels:
+  component: model
+
+resources:
+- project.yaml
+- setup-serviceaccount.yaml
+- create-data-connection.yaml
+- add-model-job.yaml
+- runtime.yaml
+- model.yaml
+# pinger is not ready yet
+# - pinger.yaml
diff --git a/bootstrap/ic-shared-img-det/model.yaml b/bootstrap/ic-shared-img-det/model.yaml
@@ -0,0 +1,53 @@
+# ---
+# apiVersion: serving.kserve.io/v1beta1
+# kind: InferenceService
+# metadata:
+#   annotations:
+#     openshift.io/display-name: accident
+#     serving.kserve.io/deploymentMode: ModelMesh
+#     argocd.argoproj.io/sync-wave: "3"
+#     argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
+#   labels:
+#     name: accident
+#     opendatahub.io/dashboard: "true"
+#   name: accident
+# spec:
+#   predictor:
+#     model:
+#       modelFormat:
+#         name: onnx
+#         version: "1"
+#       runtime: triton
+#       storage:
+#         key: aws-connection-minio
+#         path: accident/
+---
+# ModelMesh InferenceService "img-det": an ONNX model served by the "ovms"
+# runtime and loaded from the "accident/" path of the aws-connection-minio
+# data connection.
+apiVersion: serving.kserve.io/v1beta1
+kind: InferenceService
+metadata:
+  annotations:
+    openshift.io/display-name: img-det
+    serving.kserve.io/deploymentMode: ModelMesh
+    # Sync after the create-data-connection (wave 1) and add-model-job (wave 2)
+    # Jobs so the storage Secret exists before the model is created.
+    argocd.argoproj.io/sync-wave: "3"
+    # Let the sync proceed when the InferenceService CRD is not yet known to
+    # the cluster at dry-run time.
+    argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
+  labels:
+    name: img-det
+    opendatahub.io/dashboard: "true"
+  name: img-det
+spec:
+  predictor:
+    model:
+      modelFormat:
+        name: onnx
+        version: "1"
+      runtime: ovms
+      storage:
+        key: aws-connection-minio
+        path: accident/
diff --git a/bootstrap/ic-shared-img-det/pinger.yaml b/bootstrap/ic-shared-img-det/pinger.yaml
@@ -0,0 +1,134 @@
+---
+apiVersion: apps/v1
+kind: Deployment  # runs /ping_model.py, mounted from the model-pinger ConfigMap
+metadata:
+  name: model-pinger
+  labels:
+    app: model-pinger
+spec:
+  replicas: 1
+  revisionHistoryLimit: 3
+  selector:
+    matchLabels:
+      app: model-pinger
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxSurge: 1
+      maxUnavailable: 100%  # the old pod may be removed before its replacement is ready
+  template:
+    metadata:
+      labels:
+        app: model-pinger
+    spec:
+      containers:
+      - name: pinger
+        image: quay.io/rlundber/sds-small:1.8
+        command:
+        - python
+        - -u  # unbuffered output
+        - /ping_model.py
+        env:  # read only by code that is currently commented out in ping_model.py
+        - name: MM_SERVING_HOST
+          value: modelmesh-serving:8008
+        - name: MM_MODEL_NAME
+          # value: fraud-4
+          value: fraud-latest  # NOTE(review): model.yaml in this directory deploys "img-det" - confirm
+        - name: SLEEP_TIME
+          value: "5"
+        resources:
+          limits:
+            cpu: "0.2"
+            memory: 256Mi
+        volumeMounts:
+        - name: pinger-config
+          subPath: ping_model.py  # mount only this ConfigMap key, as a single file
+          mountPath: /ping_model.py
+      volumes:
+      - name: pinger-config
+        configMap:
+          name: model-pinger
+
+---
+apiVersion: v1
+kind: ConfigMap  # provides ping_model.py to the model-pinger Deployment
+metadata:
+  name: model-pinger
+data:
+  ping_model.py: |  # NOTE(review): only the imports are active below; everything else is commented out
+    import os
+    import time
+    from datetime import datetime
+    import random
+
+    # MM_SERVING_HOST = os.environ.get("MM_SERVING_HOST", "modelmesh-serving:8008")
+    # MM_MODEL_NAME = os.environ.get("MM_MODEL_NAME", "fraud-latest")
+
+    # # deployed_model_name = "fraud-latest"
+    # # rest_url = "http://modelmesh-serving:8008"
+    # deployed_model_name = MM_MODEL_NAME
+    # rest_url = f"http://{MM_SERVING_HOST}"
+    # infer_url = f"{rest_url}/v2/models/{deployed_model_name}/infer"
+    # print(infer_url)
+
+    # import requests
+
+    # def rest_request(data):
+    #     json_data = {
+    #         "inputs": [
+    #             {
+    #                 "name": "dense_input",
+    #                 "shape": [1, 5],
+    #                 "datatype": "FP32",
+    #                 "data": data
+    #             }
+    #         ]
+    #     }
+
+    #     response = requests.post(infer_url, json=json_data)
+    #     response_dict = response.json()
+    #     return response_dict['outputs'][0]['data']
+
+
+    # MM_SERVING_HOST = os.environ.get("MM_SERVING_HOST", "modelmesh-serving:8033")
+    # MM_MODEL_NAME = os.environ.get("MM_MODEL_NAME", "ansible-model-pinger")
+
+    # SLEEP_TIME = os.environ.get("SLEEP_TIME", "3")
+    # SLEEP_TIME = int(SLEEP_TIME)
+
+
+    # while True:
+    #   now = datetime.now()
+    #   time_string = now.strftime("%Y-%m-%d %H:%M:%S")
+
+    #   print("--------------------------------------")
+    #   print("Sending Request at",time_string)
+
+    #   start = time.time()
+    #   try:
+    #     random_dist = round(random.uniform(0, 50), 2)
+    #     data = [random_dist, 1.9459399775518593, 1.0, 0.0, 0.0]
+    #     print("Data sent to model ("+deployed_model_name+"):")
+    #     print(data)
+
+    #     # Start the timer
+    #     start_time = time.time()
+
+    #     prediction = rest_request(data)
+
+    #     # End the timer
+    #     end_time = time.time()
+
+    #     # Calculate the elapsed time in milliseconds
+    #     response_time_ms = (end_time - start_time) * 1000
+
+    #      # prediction
+    #     print("Likelyhood of fraud")
+    #     print(str(prediction[0]*100)+"%")
+
+    #     print("Prediction took ", response_time_ms, "milliseconds")
+
+    #   except Exception as e:
+    #     print(f"Errored after {time.time() - start}s: {e}")
+
+    #   time.sleep(SLEEP_TIME)
diff --git a/bootstrap/ic-shared-img-det/project.yaml b/bootstrap/ic-shared-img-det/project.yaml
@@ -0,0 +1,16 @@
+---
+# OpenShift Project for the shared image-detection model. It is placed in
+# sync wave 0 and carries the modelmesh-enabled and dashboard labels.
+apiVersion: project.openshift.io/v1
+kind: Project
+metadata:
+  name: ic-shared-img-det
+  labels:
+    kubernetes.io/metadata.name: ic-shared-img-det
+    modelmesh-enabled: "true"
+    opendatahub.io/dashboard: "true"
+  annotations:
+    argocd.argoproj.io/managed-by: openshift-gitops
+    argocd.argoproj.io/sync-wave: "0"
+    openshift.io/display-name: Shared Image Detection Model
+    openshift.io/description: Project created to demonstrate custom serving runtime
diff --git a/bootstrap/ic-shared-img-det/runtime.yaml b/bootstrap/ic-shared-img-det/runtime.yaml
diff --git a/bootstrap/ic-shared-img-det/setup-serviceaccount.yaml b/bootstrap/ic-shared-img-det/setup-serviceaccount.yaml
diff --git a/content/modules/ROOT/assets/images/ic-eng-diag.drawio b/content/modules/ROOT/assets/images/ic-eng-diag.drawio
diff --git a/content/modules/ROOT/pages/01-04-examples-from-prototype.adoc b/content/modules/ROOT/pages/01-04-examples-from-prototype.adoc