Skip to content

Commit

Permalink
Merge pull request #55 from graphistry/cuda-worker-args-hotfix
Browse files: browse the repository at this point in the history
  • Loading branch information
webcoderz authored Aug 20, 2023
2 parents 7d646bf + fe33391 commit 0a86de8
Show file tree
Hide file tree
Showing 8 changed files with 19 additions and 13 deletions.
2 changes: 1 addition & 1 deletion .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -150,4 +150,4 @@ cluster-config/cluster-config.yaml
charts/graphistry-helm/templates/postgres/pg-sts.yaml


chart-bundle
charts-aux-bundled
9 changes: 6 additions & 3 deletions charts/graphistry-helm/templates/dask/dask-cluster.yml
Original file line number Diff line number Diff line change
Expand Up @@ -29,17 +29,20 @@ spec:
image: {{.Values.global.containerregistry.name}}/{{.Values.graphistry}}:{{.Values.daskcudaworker.repository}}-{{.Values.global.tag}}-{{.Values.cuda.version}}
imagePullPolicy: {{.Values.global.imagePullPolicy }}
args:
- dask-cuda-worker
- dask cuda worker
- --interface
- eth0
- --dashboard-address localhost:8787
#- --resources GPU=10
#- dask-scheduler:8786
- --resources GPU=10,PROCESS=2
- --nthreads 2
- {{.Values.daskscheduler.location | quote }}
command:
- /entrypoints/rapids-entrypoint.sh
env:
- name: GRAPHISTRY_CPU_MODE
value: {{.Values.graphistryCPUMode | quote }}
- name: SKIP_SERVER
value: "1"
{{- range .Values.env }}
- name: {{ .name }}
value: {{ .value | quote }}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -41,17 +41,20 @@ spec:
- "nexus"
containers:
- args:
- dask-cuda-worker
- dask cuda worker
- --interface
- eth0
- --dashboard-address localhost:8787
#- --resources GPU=10
- dask-scheduler:8786
- --resources GPU=10,PROCESS=2
- --nthreads 2
- {{.Values.daskscheduler.location | quote }}
command:
- /entrypoints/rapids-entrypoint.sh
env:
- name: GRAPHISTRY_CPU_MODE
value: {{.Values.graphistryCPUMode | quote }}
- name: SKIP_SERVER
value: "1"
{{- range .Values.env }}
- name: {{ .name }}
value: {{ .value | quote }}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -97,7 +97,7 @@ spec:
command:
- sh
- -c
- "curl -f http://localhost:8080/cudfhealth && curl -f http://localhost:8080/blazinghealth"
- "curl -f http://localhost:8080/cudfhealth && curl -f http://localhost:8080/dasksqlhealth"
failureThreshold: 3
initialDelaySeconds: 180
periodSeconds: 120
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -207,7 +207,7 @@ spec:
- name: PROMETHEUS_PORT
value: "4040"
{{- if eq .Values.global.containerregistry.name "docker.io/graphistry" }}
image: quay.io/martinhelmich/prometheus-nginxlog-exporter:v1.9.2 #DockerHub
image: ghcr.io/martin-helmich/prometheus-nginxlog-exporter/exporter:v1.9.2 #DockerHub
{{ else }}
image: {{.Values.global.containerregistry.name}}/prometheus-nginxlog-exporter:v1.9.2
{{- end }}
Expand Down
2 changes: 1 addition & 1 deletion charts/graphistry-helm/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -406,7 +406,7 @@ dask:
#dask-scheduler repository name
daskscheduler:
repository: etl-server-python #dask-scheduler repository name
location: "dask-scheduler:8786" #dask-scheduler location
location: dask-scheduler:8786 #dask-scheduler location

vgpu: false #enables vgpu mode for bigger than memory workloads on VGPU

Expand Down
4 changes: 2 additions & 2 deletions charts/postgres-cluster/templates/postgres-cluster.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -48,11 +48,11 @@ spec:
{{- if eq .Values.global.multiNode true }}
accessModes:
- "ReadWriteMany"
storageClassName: postgres-longhorn-{{ .Release.Namespace }}
storageClassName: postgres-longhorn
{{- else }}
accessModes:
- "ReadWriteOnce"
storageClassName: retain-sc-{{ .Release.Namespace }}
storageClassName: retain-sc
{{- end }}
resources:
requests:
Expand Down
2 changes: 1 addition & 1 deletion charts/values-overrides/internal/eks-dev-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@ k8sDashboard:

global:
provisioner: ebs.csi.aws.com
tag: v2.40.3
tag: v2.40.27
nodeSelector: {"accelerator": "nvidia"}
#change log levels
#logs:
Expand Down

0 comments on commit 0a86de8

Please sign in to comment.