agora/cerebral_api/operations/cerebral-api.yaml (118 lines of code) (raw):

apiVersion: apps/v1 kind: Deployment metadata: name: cerebral-api-deployment namespace: contoso-hypermarket spec: replicas: 1 selector: matchLabels: app: cerebral-api template: metadata: labels: app: cerebral-api spec: initContainers: - name: init-documents image: mcr.microsoft.com/cbl-mariner/base/core:2.0 command: - sh - -c - | tdnf update -y tdnf install wget -y cd /app/docs wget -O "SmartShelf_Manual.pdf" "https://download.microsoft.com/download/2b3927e0-5342-4d84-8b55-ab958281259b/SmartShelf%20System%20User%20Manual%20for%20Contoso%20Hypermarket.pdf" && \ wget -O "Scale_Manual.pdf" "https://download.microsoft.com/download/2b3927e0-5342-4d84-8b55-ab958281259b/Scale%20System%20User%20Manual%20for%20Contoso%20Hypermarket.pdf" && \ wget -O "Refrigeration_Manual.pdf" "https://download.microsoft.com/download/2b3927e0-5342-4d84-8b55-ab958281259b/Refrigeration%20System%20User%20Manual%20for%20Contoso%20Hypermarket.pdf" && \ wget -O "Checkout_Manual.pdf" "https://download.microsoft.com/download/2b3927e0-5342-4d84-8b55-ab958281259b/Automated%20Checkout%20System%20User%20Manual%20for%20Contoso%20Hypermarket.pdf" && \ wget -O "HVAC_Manual.pdf" "https://download.microsoft.com/download/2b3927e0-5342-4d84-8b55-ab958281259b/HVAC%20System%20User%20Manual%20for%20Contoso%20Hypermarket.pdf" volumeMounts: - name: cerebral-docs mountPath: /app/docs - name: init-slm-model image: mcr.microsoft.com/azurelinux/base/python:3.12 command: - sh - -c - | pip install -U "huggingface_hub[cli]" huggingface-cli download microsoft/Phi-3-mini-4k-instruct-onnx \ --include "cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/*" \ --local-dir /app/models if [ ! -d "/app/models/phi3" ]; then mkdir /app/models/phi3 fi volumeMounts: - name: cerebral-slm-model mountPath: /app/models containers: - name: cerebral-api image: mcr.microsoft.com/jumpstart/agora/cerebral_api:1.0.0 ports: - containerPort: 5003 env: - name: AZURE_OPENAI_API_KEY value: "replaceme" - name: CHATGPT_MODEL value: "gpt-35-turbo" - name: AZURE_OPENAI_ENDPOINT value: "" - name: OPENAI_API_VERSION value: "2024-03-01-preview" - name: INFLUXDB_URL value: "http://influxdb.contoso-hypermarket.svc.cluster.local:8086" - name: INFLUXDB_BUCKET value: "hypermarket" - name: INFLUXDB_TOKEN value: "secret-token" - name: INFLUXDB_ORG value: "InfluxData" - name: REDIS_URL value: "redis://redis-service.contoso-hypermarket.svc.cluster.local:6379" - name: SQL_DATABASENAME value: "RetailDB" - name: SQL_SERVER value: "mssql-service" - name: SQL_USERNAME value: "SA" - name: SQL_PASSWORD value: "ArcPassword123!!" - name: WHISPER_MODEL_PATH value: "" - name: AZURE_AI_SPEECH_KEY value: "" - name: AZURE_AI_SPEECH_REGION value: "" - name: USE_LOCAL_LLM value: "false" - name: MODEL_PATH value: "/app/models" - name: CHROMA_HOST value: "chroma-db-service.contoso-hypermarket.svc.cluster.local" - name: CHROMA_PORT value: "8040" - name: CHROMA_COLLECTION value: "documents" volumes: - name: cerebral-docs persistentVolumeClaim: claimName: cerebral-docs - name: cerebral-slm-model persistentVolumeClaim: claimName: cerebral-slm-model --- apiVersion: v1 kind: Service metadata: name: cerebral-api-service namespace: contoso-hypermarket spec: type: LoadBalancer selector: app: cerebral-api ports: - protocol: TCP port: 5003 targetPort: 5003