Skip to content

Commit 5ed5e81

Browse files
committed
Upgrade ray version; shrink worker resource allocation
1 parent d871347 commit 5ed5e81

File tree

1 file changed

+18
-22
lines changed

1 file changed

+18
-22
lines changed

modules/kuberay-cluster/kuberay-autopilot-values.yaml

Lines changed: 18 additions & 22 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
# Copyright 2023 Google LLC
1+
# Copyright 2024 Google LLC
22
#
33
# Licensed under the Apache License, Version 2.0 (the "License");
44
# you may not use this file except in compliance with the License.
@@ -22,7 +22,7 @@
2222
image:
2323
# Replace this with your own image if needed.
2424
repository: rayproject/ray
25-
tag: 2.6.1-py310-gpu
25+
tag: 2.9.3-py310-gpu
2626
pullPolicy: IfNotPresent
2727

2828
nameOverride: "kuberay"
@@ -64,8 +64,6 @@ head:
6464
# containerEnv specifies environment variables for the Ray container,
6565
# Follows standard K8s container env schema.
6666
containerEnv:
67-
# - name: EXAMPLE_ENV
68-
# value: "1"
6967
- name: RAY_memory_monitor_refresh_ms
7068
value: "0"
7169
- name: RAY_GRAFANA_IFRAME_HOST
@@ -90,18 +88,18 @@ head:
9088
# for further guidance.
9189
resources:
9290
limits:
93-
cpu: "8"
91+
cpu: "1"
9492
# To avoid out-of-memory issues, never allocate less than 2G memory for the Ray head.
95-
memory: "20G"
93+
memory: "8G"
9694
ephemeral-storage: 20Gi
9795
requests:
98-
cpu: "8"
99-
memory: "20G"
96+
cpu: "1"
97+
memory: "8G"
10098
ephemeral-storage: 20Gi
10199
annotations:
102100
gke-gcsfuse/volumes: "true"
103-
gke-gcsfuse/cpu-limit: "2"
104-
gke-gcsfuse/memory-limit: 20Gi
101+
gke-gcsfuse/cpu-limit: "1"
102+
gke-gcsfuse/memory-limit: 2Gi
105103
gke-gcsfuse/ephemeral-storage-limit: 20Gi
106104
nodeSelector:
107105
cloud.google.com/compute-class: "Performance"
@@ -158,8 +156,6 @@ worker:
158156
disabled: true
159157

160158
# The map's key is used as the groupName.
161-
# For example, key:small-group in the map below
162-
# will be used as the groupName
163159
additionalWorkerGroups:
164160
cpuGroup:
165161
# Disabled by default
@@ -194,16 +190,16 @@ additionalWorkerGroups:
194190
resources:
195191
limits:
196192
cpu: 4
197-
memory: "20G"
193+
memory: "16G"
198194
ephemeral-storage: 20Gi
199195
requests:
200196
cpu: 4
201-
memory: "20G"
197+
memory: "16G"
202198
ephemeral-storage: 20Gi
203199
annotations:
204200
gke-gcsfuse/volumes: "true"
205201
gke-gcsfuse/cpu-limit: "2"
206-
gke-gcsfuse/memory-limit: 20Gi
202+
gke-gcsfuse/memory-limit: 10Gi
207203
gke-gcsfuse/ephemeral-storage-limit: 20Gi
208204
nodeSelector:
209205
cloud.google.com/compute-class: "Performance"
@@ -287,19 +283,19 @@ additionalWorkerGroups:
287283
# for further guidance.
288284
resources:
289285
limits:
290-
cpu: "8"
291-
nvidia.com/gpu: "2"
292-
memory: "40G"
286+
cpu: "4"
287+
nvidia.com/gpu: "1"
288+
memory: "16G"
293289
ephemeral-storage: 20Gi
294290
requests:
295-
cpu: "8"
296-
nvidia.com/gpu: "2"
297-
memory: "40G"
291+
cpu: "4"
292+
nvidia.com/gpu: "1"
293+
memory: "16G"
298294
ephemeral-storage: 20Gi
299295
annotations:
300296
gke-gcsfuse/volumes: "true"
301297
gke-gcsfuse/cpu-limit: "2"
302-
gke-gcsfuse/memory-limit: 20Gi
298+
gke-gcsfuse/memory-limit: 10Gi
303299
gke-gcsfuse/ephemeral-storage-limit: 20Gi
304300
nodeSelector:
305301
cloud.google.com/compute-class: "Accelerator"

0 commit comments

Comments
 (0)