Skip to content

Commit c681522

Browse files
committed
Updates to remove hacks and add default values file
1 parent 21555e8 commit c681522

8 files changed

+361
-44
lines changed

charts/model-engine/templates/_helpers.tpl

+2-6
Original file line numberDiff line numberDiff line change
@@ -341,15 +341,11 @@ env:
341341
value: "true"
342342
- name: LAUNCH_SERVICE_TEMPLATE_FOLDER
343343
value: "/workspace/model-engine/model_engine_server/infra/gateways/resources/templates"
344-
{{- if .Values.redis.auth}}
345-
- name: REDIS_AUTH_TOKEN
346-
value: {{ .Values.redis.auth }}
347-
{{- end }}
348-
{{- if .Values.redis.authSecret }}
344+
{{- if .Values.secrets.kubernetesRedisSecretName }}
349345
- name: REDIS_AUTH_TOKEN
350346
valueFrom:
351347
secretKeyRef:
352-
name: {{ .Values.redis.authSecret }}
348+
name: {{ .Values.secrets.kubernetesRedisSecretName }}
353349
key: auth_token
354350
{{- end }}
355351
{{- if .Values.azure}}

charts/model-engine/templates/inference_framework_config.yaml

+3-3
Original file line numberDiff line numberDiff line change
@@ -12,8 +12,8 @@ metadata:
1212
data:
1313
deepspeed: "latest"
1414
text_generation_inference: "latest"
15-
vllm: "{{ .Values.vllmTag }}"
16-
vllm_batch: "{{ .Values.vllmTag }}"
17-
vllm_batch_v2: "{{ .Values.vllmTag }}"
15+
vllm: "{{ .Values.vLLM.primaryTag }}"
16+
vllm_batch: "{{ .Values.vLLM.batchTag }}"
17+
vllm_batch_v2: "{{ .Values.vLLM.batchV2Tag }}"
1818
lightllm: "latest"
1919
tensorrt_llm: "latest"

charts/model-engine/templates/istio-virtualservice.yaml

+2-2
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,12 @@
1-
{{- if .Values.virtualservice.enabled -}}
1+
{{- /* Render the Istio VirtualService only when virtualService.enabled is set. Helm's built-in values object is `.Values` (capital V); lookups are case-sensitive. */ -}}
{{- if .Values.virtualService.enabled -}}
22
{{- $fullName := include "modelEngine.fullname" . -}}
33
apiVersion: networking.istio.io/v1alpha3
44
kind: VirtualService
55
metadata:
66
name: {{ $fullName }}
77
labels:
88
{{- include "modelEngine.labels" . | nindent 4 }}
9-
{{- with .Values.virtualservice.annotations }}
9+
{{- with .Values.virtualService.annotations }}
1010
annotations:
1111
{{- toYaml . | nindent 4 }}
1212
{{- end }}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
{{- /*
Inference ServiceAccount.
Rendered only when serviceTemplate.createInferenceServiceAccount,
serviceTemplate.serviceAccountAnnotations, serviceTemplate.serviceAccountName and
config.values.launch.endpoint_namespace are all set.
When .Values.azure is set, the azure.workload.identity/client-id annotation and an
imagePullSecrets entry are added as well.
*/ -}}
{{- if and (.Values.serviceTemplate) (.Values.serviceTemplate.createInferenceServiceAccount) (.Values.serviceTemplate.serviceAccountAnnotations) (.Values.serviceTemplate.serviceAccountName) (.Values.config.values.launch.endpoint_namespace)}}
2+
{{- $annotations := .Values.serviceTemplate.serviceAccountAnnotations }}
3+
{{- $inferenceServiceAccountName := .Values.serviceTemplate.serviceAccountName }}
4+
{{- $inferenceServiceAccountNamespace := .Values.config.values.launch.endpoint_namespace }}
5+
{{- $labels := include "modelEngine.labels" . }}
6+
apiVersion: v1
7+
kind: ServiceAccount
8+
metadata:
9+
name: {{ $inferenceServiceAccountName | quote }}
10+
namespace: {{ $inferenceServiceAccountNamespace | quote }}
11+
labels:
12+
{{- $labels | nindent 4 }}
13+
{{- with $annotations }}
14+
annotations:
15+
{{- toYaml . | nindent 4 }}
16+
{{- if $.Values.azure }}
17+
azure.workload.identity/client-id: {{ $.Values.azure.client_id | quote }}
18+
{{- end }}
19+
{{- end }}
20+
{{- if $.Values.azure }}
21+
imagePullSecrets:
22+
- name: egp-ecr-regcred
23+
{{- end }}
24+
---
25+
{{- end }}

charts/model-engine/templates/service_config_map.yaml

+7-7
Original file line numberDiff line numberDiff line change
@@ -64,11 +64,11 @@ data:
6464
6565
sqs_queue_tag_template: |-
6666
{
67-
"infra.scale.com/product": "{{ .Values.productTag }}",
68-
"infra.scale.com/team": "${team}",
69-
"infra.scale.com/contact": "{{ .Values.contactEmail }}",
70-
"infra.scale.com/customer": "AllCustomers",
71-
"infra.scale.com/financialOwner": "{{ .Values.contactEmail}}",
67+
"{{ .Values.tagging.organization }}/product": "{{ .Values.tagging.productTag }}",
68+
"{{ .Values.tagging.organization }}/team": "${team}",
69+
"{{ .Values.tagging.organization }}/contact": "{{ .Values.tagging.contactEmail }}",
70+
"{{ .Values.tagging.organization }}/customer": "AllCustomers",
71+
"{{ .Values.tagging.organization }}/financialOwner": "{{ .Values.tagging.contactEmail }}",
7272
"Launch-Endpoint-Id": "${endpoint_id}",
7373
"Launch-Endpoint-Name": "${endpoint_name}",
7474
"Launch-Endpoint-Created-By": "${endpoint_created_by}"
@@ -101,8 +101,8 @@ data:
101101
env: {{ .Values.context | quote }}
102102
cloud_provider: "aws"
103103
env: "prod"
104-
k8s_cluster_name: "usgw1-prod"
105-
dns_host_domain: "model-engine.ml-serving.{{ $.Values.global.networking.internalDomain }}"
104+
k8s_cluster_name: "{{ .Values.clusterName }}"
105+
dns_host_domain: "model-engine.{{ $.Values.global.networking.internalDomain }}"
106106
default_region: "{{ .Values.aws.region }}"
107107
ml_account_id: "{{ .Values.aws.accountId }}"
108108
docker_repo_prefix: "{{ .Values.aws.accountId }}.dkr.ecr.{{ .Values.aws.region }}.amazonaws.com"

charts/model-engine/templates/service_template_config_map.yaml

+9-15
Original file line numberDiff line numberDiff line change
@@ -95,17 +95,14 @@ data:
9595
{{- toYaml . | nindent 12 }}
9696
{{- end }}
9797
{{- if eq $device "gpu" }}
98-
# {{- if empty $node_selector }}
99-
# nodeSelector:
100-
# {{- end }}
101-
# k8s.amazonaws.com/accelerator: ${GPU_TYPE}
98+
{{- if empty $node_selector }}
99+
nodeSelector:
100+
{{- end }}
101+
k8s.amazonaws.com/accelerator: ${GPU_TYPE}
102102
tolerations:
103103
- key: "nvidia.com/gpu"
104104
operator: "Exists"
105105
effect: "NoSchedule"
106-
- key: "gpu_a100_multi"
107-
operator: "Exists"
108-
effect: "NoSchedule"
109106
{{- end }}
110107
priorityClassName: ${PRIORITY}
111108
containers:
@@ -489,7 +486,7 @@ data:
489486
protocol: TCP
490487
name: http
491488
${NODE_PORT_DICT}
492-
{{- if .Values.virtualservice.enabled }}
489+
{{- /* Emit the virtual-service.yaml template entry only when virtualService.enabled is set; the values object is `.Values` (case-sensitive). */}}
{{- if .Values.virtualService.enabled }}
493490
virtual-service.yaml: |-
494491
apiVersion: networking.istio.io/v1alpha3
495492
kind: VirtualService
@@ -680,17 +677,14 @@ data:
680677
{{- toYaml . | nindent 12 }}
681678
{{- end }}
682679
{{- if eq $device "gpu" }}
683-
# {{- if empty $node_selector }}
684-
# nodeSelector:
685-
# {{- end }}
686-
# k8s.amazonaws.com/accelerator: ${GPU_TYPE}
680+
{{- if empty $node_selector }}
681+
nodeSelector:
682+
{{- end }}
683+
k8s.amazonaws.com/accelerator: ${GPU_TYPE}
687684
tolerations:
688685
- key: "nvidia.com/gpu"
689686
operator: "Exists"
690687
effect: "NoSchedule"
691-
- key: "gpu_a100_multi"
692-
operator: "Exists"
693-
effect: "NoSchedule"
694688
{{- end }}
695689
{{- if $service_template_service_account_name }}
696690
serviceAccountName: {{ $service_template_service_account_name }}

0 commit comments

Comments
 (0)