You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
# Head group template and specs (perhaps 'group' is not needed in the name).
headGroupSpec:
  # Kubernetes Service type; valid values are 'ClusterIP', 'NodePort' and 'LoadBalancer'.
  serviceType: ClusterIP
  # logical group name, for this called head-group, also can be functional
  # pod type head or worker
  # rayNodeType: head # Not needed since it is under the headgroup
  # The following params are used to complete the ray start command:
  #   ray start --head --block ...
  # Values are quoted so they stay strings rather than being typed by the parser.
  rayStartParams:
    # Flag "no-monitor" will be automatically set when autoscaling is enabled.
    dashboard-host: '0.0.0.0'
    block: 'true'
    # num-cpus: '1' # can be auto-completed from the limits
    # Use `resources` to optionally specify custom resource annotations for the Ray node.
    # The value of `resources` is a string-integer mapping.
    # Currently, `resources` must be provided in the specific format demonstrated below:
    # resources: '"{\"Custom1\": 1, \"Custom2\": 5}"'
  # Pod template
  template:
    spec:
      containers:
        # The Ray head pod
        - name: ray-head
          image: rayproject/ray:2.0.0
          imagePullPolicy: Always
          ports:
            - containerPort: 6379
              name: gcs
            - containerPort: 8265
              name: dashboard
            - containerPort: 10001
              name: client
          lifecycle:
            # Run `ray stop` through the container's preStop hook.
            preStop:
              exec:
                command: ["/bin/sh", "-c", "ray stop"]
          resources:
            limits:
              cpu: "1"
              memory: "1G"
            requests:
              cpu: "500m"
              memory: "512Mi"
108
+
workerGroupSpecs:
109
+
# the number of pod replicas in this worker group
110
+
- replicas: 1
111
+
minReplicas: 1
112
+
maxReplicas: 300
113
+
# logical group name, for this called small-group, also can be functional
114
+
groupName: small-group
115
+
# if worker pods need to be added, we can simply increment the replicas
116
+
# if worker pods need to be removed, we decrement the replicas, and populate the podsToDelete list
117
+
# the operator will remove pods from the list until the number of replicas is satisfied
118
+
# when a pod is confirmed to be deleted, its name will be removed from the list below
119
+
#scaleStrategy:
120
+
# workersToDelete:
121
+
# - raycluster-complete-worker-small-group-bdtwh
122
+
# - raycluster-complete-worker-small-group-hv457
123
+
# - raycluster-complete-worker-small-group-k8tj7
124
+
# the following params are used to complete the ray start: ray start --block ...
125
+
rayStartParams:
126
+
block: 'true'
127
+
#pod template
128
+
template:
129
+
metadata:
130
+
labels:
131
+
key: value
132
+
# annotations for pod
133
+
annotations:
134
+
key: value
135
+
spec:
136
+
initContainers:
137
+
# the env var $RAY_IP is set by the operator if missing, with the value of the head service name
138
+
- name: init-myservice
139
+
image: busybox:1.28
140
+
command: ['sh', '-c', "until nslookup $RAY_IP.$(cat /var/run/secrets/kubernetes.io/serviceaccount/namespace).svc.cluster.local; do echo waiting for myservice; sleep 2; done"]
141
+
containers:
142
+
- name: machine-learning # must consist of lower case alphanumeric characters or '-', and must start and end with an alphanumeric character (e.g. 'my-name', or '123-abc'
143
+
image: rayproject/ray:2.0.0
144
+
# Environment variables to set in the container. Optional.
145
+
# Refer to https://kubernetes.io/docs/tasks/inject-data-application/define-environment-variable-container/
0 commit comments