diff --git a/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna-guardrails.yaml b/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna-guardrails.yaml index 70aa65bd6..7265ebff5 100644 --- a/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna-guardrails.yaml +++ b/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna-guardrails.yaml @@ -554,7 +554,7 @@ spec: securityContext: {} image: "opea/chatqna-ui:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: ui containerPort: 5173 @@ -612,7 +612,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/dataprep-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: data-prep containerPort: 6007 @@ -687,7 +687,7 @@ spec: seccompProfile: type: RuntimeDefault image: "redis/redis-stack:7.2.0-v9" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: data-volume @@ -762,7 +762,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/guardrails-tgi:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: guardrails-usvc containerPort: 9090 @@ -840,7 +840,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/retriever-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: retriever-usvc containerPort: 7000 @@ -919,7 +919,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -1010,7 +1010,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -1101,7 +1101,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: model-volume @@ -1181,7 +1181,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: model-volume @@ -1273,7 +1273,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/chatqna-guardrails:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /tmp name: tmp @@ -1314,7 +1314,7 @@ spec: spec: containers: - image: nginx:1.27.1 - imagePullPolicy: IfNotPresent + imagePullPolicy: Always name: nginx volumeMounts: - mountPath: /etc/nginx/conf.d diff --git a/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna.yaml b/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna.yaml index 744f09591..26813816e 100644 --- a/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna.yaml +++ b/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna.yaml @@ -454,7 +454,7 @@ spec: securityContext: {} image: "opea/chatqna-ui:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: ui containerPort: 5173 @@ -512,7 +512,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/dataprep-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: data-prep containerPort: 6007 @@ -587,7 +587,7 @@ spec: seccompProfile: type: RuntimeDefault image: "redis/redis-stack:7.2.0-v9" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: data-volume @@ -662,7 +662,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/retriever-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: retriever-usvc containerPort: 7000 @@ -741,7 +741,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -832,7 +832,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -923,7 +923,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: model-volume @@ -1011,7 +1011,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/chatqna:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /tmp name: tmp @@ -1052,7 +1052,7 @@ spec: spec: containers: - image: nginx:1.27.1 - imagePullPolicy: IfNotPresent + imagePullPolicy: Always name: nginx volumeMounts: - mountPath: /etc/nginx/conf.d diff --git a/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna_bf16.yaml b/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna_bf16.yaml index b18285117..aac57140b 100644 --- a/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna_bf16.yaml +++ b/ChatQnA/kubernetes/intel/cpu/xeon/manifest/chatqna_bf16.yaml @@ -455,7 +455,7 @@ spec: securityContext: {} image: "opea/chatqna-ui:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: ui containerPort: 5173 @@ -513,7 +513,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/dataprep-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: data-prep containerPort: 6007 @@ -588,7 +588,7 @@ spec: seccompProfile: type: RuntimeDefault image: "redis/redis-stack:7.2.0-v9" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: data-volume @@ -663,7 +663,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/retriever-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: retriever-usvc containerPort: 7000 @@ -742,7 +742,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -833,7 +833,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -926,7 +926,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: model-volume @@ -1014,7 +1014,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/chatqna:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /tmp name: tmp @@ -1055,7 +1055,7 @@ spec: spec: containers: - image: nginx:1.27.1 - imagePullPolicy: IfNotPresent + imagePullPolicy: Always name: nginx volumeMounts: - mountPath: /etc/nginx/conf.d diff --git a/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna-guardrails.yaml b/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna-guardrails.yaml index 54b35912b..cd40efed1 100644 --- a/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna-guardrails.yaml +++ b/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna-guardrails.yaml @@ -556,7 +556,7 @@ spec: securityContext: {} image: "opea/chatqna-ui:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: ui containerPort: 5173 @@ -614,7 +614,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/dataprep-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: data-prep containerPort: 6007 @@ -692,7 +692,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/guardrails-tgi:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: guardrails-usvc containerPort: 9090 @@ -767,7 +767,7 @@ spec: seccompProfile: type: RuntimeDefault image: "redis/redis-stack:7.2.0-v9" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: data-volume @@ -842,7 +842,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/retriever-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: retriever-usvc containerPort: 7000 @@ -921,7 +921,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/tei-gaudi:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -1013,7 +1013,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -1104,7 +1104,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/tgi-gaudi:2.0.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: model-volume @@ -1185,7 +1185,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/tgi-gaudi:2.0.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: model-volume @@ -1278,7 +1278,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/chatqna-guardrails:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /tmp name: tmp @@ -1319,7 +1319,7 @@ spec: spec: containers: - image: nginx:1.27.1 - imagePullPolicy: IfNotPresent + imagePullPolicy: Always name: nginx volumeMounts: - mountPath: /etc/nginx/conf.d diff --git a/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna-vllm.yaml b/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna-vllm.yaml index 988f48ca2..2ca62a504 100644 --- a/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna-vllm.yaml +++ b/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna-vllm.yaml @@ -592,7 +592,7 @@ spec: securityContext: {} image: "opea/chatqna-ui:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: ui containerPort: 5173 @@ -650,7 +650,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/dataprep-redis:v0.9" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: data-prep containerPort: 6007 @@ -728,7 +728,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/embedding-tei:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: embedding-usvc containerPort: 6000 @@ -806,7 +806,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/llm-vllm:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: llm-uservice containerPort: 9000 @@ -881,7 +881,7 @@ spec: seccompProfile: type: RuntimeDefault image: "redis/redis-stack:7.2.0-v9" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: data-volume @@ -956,7 +956,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/reranking-tei:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: reranking-usvc containerPort: 8000 @@ -1034,7 +1034,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/retriever-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: retriever-usvc containerPort: 7000 @@ -1107,7 +1107,7 @@ spec: capabilities: add: ["SYS_NICE"] image: "ghcr.io/huggingface/tei-gaudi:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -1193,7 +1193,7 @@ spec: securityContext: {} image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -1281,7 +1281,7 @@ spec: - | export VLLM_CPU_KVCACHE_SPACE=40 && \ python3 -m vllm.entrypoints.openai.api_server --enforce-eager --gpu-memory-utilization 0.5 --dtype auto --model $MODEL_ID --port 2080 --tensor-parallel-size 8 --block-size 128 --max-num-seqs 256 --max-seq_len-to-capture 2048 - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: model-volume @@ -1363,7 +1363,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/chatqna:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /tmp name: tmp @@ -1404,7 +1404,7 @@ spec: spec: containers: - image: nginx:1.27.1 - imagePullPolicy: IfNotPresent + imagePullPolicy: Always name: nginx volumeMounts: - mountPath: /etc/nginx/conf.d diff --git a/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna.yaml b/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna.yaml index 6bde1a104..1c80ca5af 100644 --- a/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna.yaml +++ b/ChatQnA/kubernetes/intel/hpu/gaudi/manifest/chatqna.yaml @@ -455,7 +455,7 @@ spec: securityContext: {} image: "opea/chatqna-ui:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: ui containerPort: 5173 @@ -513,7 +513,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/dataprep-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: data-prep containerPort: 6007 @@ -588,7 +588,7 @@ spec: seccompProfile: type: RuntimeDefault image: "redis/redis-stack:7.2.0-v9" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: data-volume @@ -663,7 +663,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/retriever-redis:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always ports: - name: retriever-usvc containerPort: 7000 @@ -742,7 +742,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/tei-gaudi:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -834,7 +834,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always args: - "--auto-truncate" volumeMounts: @@ -925,7 +925,7 @@ spec: seccompProfile: type: RuntimeDefault image: "ghcr.io/huggingface/tgi-gaudi:2.0.5" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /data name: model-volume @@ -1014,7 +1014,7 @@ spec: seccompProfile: type: RuntimeDefault image: "opea/chatqna:latest" - imagePullPolicy: IfNotPresent + imagePullPolicy: Always volumeMounts: - mountPath: /tmp name: tmp @@ -1055,7 +1055,7 @@ spec: spec: containers: - image: nginx:1.27.1 - imagePullPolicy: IfNotPresent + imagePullPolicy: Always name: nginx volumeMounts: - mountPath: /etc/nginx/conf.d