-
Notifications
You must be signed in to change notification settings - Fork 716
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
1 parent
1332e8a
commit c6622d2
Showing
6 changed files
with
117 additions
and
53 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,26 @@ | ||
# In this file you can specify a custom configuration for TfJob, such as specific driver mounts | ||
# and environment variables. | ||
# Note that configurations for GCE and Azure (ACS, acs-engine, AKS) are already available: simply set cloud=gce | ||
# or cloud=azure in values.yaml | ||
# | ||
# The ConfigMap below carries a single key, controller_config_file.yaml, whose value is an embedded | ||
# YAML document (literal block scalar). Everything after that key is string content, so edits there | ||
# change the configuration text itself. | ||
# NOTE(review): in the lines visible here the embedded document ends with an empty `envVars:` key; | ||
# add entries (e.g. LD_LIBRARY_PATH) or confirm that the consumer accepts an empty value. | ||
apiVersion: v1 | ||
kind: ConfigMap | ||
metadata: | ||
name: tf-job-operator-config | ||
namespace: default | ||
data: | ||
controller_config_file.yaml: | | ||
grpcServerFilePath: /opt/mlkube/grpc_tensorflow_server/grpc_tensorflow_server.py | ||
accelerators: | ||
alpha.kubernetes.io/nvidia-gpu: | ||
# These are all the Volumes and VolumeMounts that should be added to any pod requesting | ||
# a resource of type "alpha.kubernetes.io/nvidia-gpu" | ||
volumes: | ||
- name: nvidia-libraries | ||
mountPath: /usr/local/nvidia/lib64 # This path is special; it is expected to be present in `/etc/ld.so.conf` inside the container image. | ||
hostPath: /home/kubernetes/bin/nvidia/lib | ||
- name: nvidia-debug-tools # optional | ||
mountPath: /usr/local/bin/nvidia | ||
hostPath: /home/kubernetes/bin/nvidia/bin | ||
# These are all the environment variables that should be added to any pod requesting | ||
# a resource of type "alpha.kubernetes.io/nvidia-gpu", such as LD_LIBRARY_PATH | ||
envVars: |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,47 @@ | ||
{{- $cloud := .Values.cloud | default "" -}} | ||
|
||
{{ if eq $cloud "azure" }} | ||
# cloud=azure: the embedded controller config sets LD_LIBRARY_PATH and declares three volumes | ||
# (lib, bin, libcuda) whose host paths point at /usr/lib/nvidia-384 and libcuda.so.1. | ||
apiVersion: v1 | ||
kind: ConfigMap | ||
metadata: | ||
name: tf-job-operator-config | ||
namespace: default | ||
data: | ||
controller_config_file.yaml: | | ||
grpcServerFilePath: /opt/mlkube/grpc_tensorflow_server/grpc_tensorflow_server.py | ||
accelerators: | ||
alpha.kubernetes.io/nvidia-gpu: | ||
envVars: | ||
- name: LD_LIBRARY_PATH | ||
value: /usr/lib/nvidia:/usr/lib/x86_64-linux-gnu | ||
volumes: | ||
- name: lib | ||
mountPath: /usr/lib/nvidia | ||
hostPath: /usr/lib/nvidia-384 | ||
- name: bin | ||
mountPath: /usr/local/nvidia/bin | ||
hostPath: /usr/lib/nvidia-384/bin | ||
- name: libcuda | ||
mountPath: /usr/lib/x86_64-linux-gnu/libcuda.so.1 | ||
hostPath: /usr/lib/x86_64-linux-gnu/libcuda.so.1 | ||
{{ else if eq $cloud "gce" }} | ||
# cloud=gce: the embedded controller config declares two volumes with host paths under | ||
# /home/kubernetes/bin/nvidia and defines no envVars. | ||
apiVersion: v1 | ||
kind: ConfigMap | ||
metadata: | ||
name: tf-job-operator-config | ||
namespace: default | ||
data: | ||
controller_config_file.yaml: | | ||
grpcServerFilePath: /opt/mlkube/grpc_tensorflow_server/grpc_tensorflow_server.py | ||
accelerators: | ||
alpha.kubernetes.io/nvidia-gpu: | ||
volumes: | ||
- name: nvidia-libraries | ||
mountPath: /usr/local/nvidia/lib64 # This path is special; it is expected to be present in `/etc/ld.so.conf` inside the container image. | ||
hostPath: /home/kubernetes/bin/nvidia/lib | ||
- name: nvidia-debug-tools # optional | ||
mountPath: /usr/local/bin/nvidia | ||
hostPath: /home/kubernetes/bin/nvidia/bin | ||
{{ else if eq $cloud ""}} | ||
# cloud unset or empty: the contents of custom-config.yaml are emitted verbatim. | ||
# Any other cloud value matches no branch of this chain, so no ConfigMap is rendered. | ||
{{ .Files.Get "custom-config.yaml"}} | ||
{{ end }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters