Skip to content

Commit 8e3c26b

Browse files
committed
update worker-config
Signed-off-by: pandyamarut <[email protected]>
1 parent 66ea8b1 commit 8e3c26b

File tree

1 file changed

+13
-12
lines changed

1 file changed

+13
-12
lines changed

worker-config.json

+13 -12
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
{
22
"versions": {
3-
"0.6.4": {
4-
"imageName": "runpod/worker-v1-vllm:v1.7.0stable-cuda12.1.0",
3+
"0.6.6": {
4+
"imageName": "runpod/worker-v1-vllm:v1.8.0stable-cuda12.1.0",
55
"minimumCudaVersion": "12.1",
66
"categories": [
77
{
@@ -61,8 +61,8 @@
6161
}
6262
]
6363
},
64-
"0.6.3": {
65-
"imageName": "runpod/worker-v1-vllm:v1.6.0stable-cuda12.1.0",
64+
"0.6.4": {
65+
"imageName": "runpod/worker-v1-vllm:v1.7.0stable-cuda12.1.0",
6666
"minimumCudaVersion": "12.1",
6767
"categories": [
6868
{
@@ -122,8 +122,8 @@
122122
}
123123
]
124124
},
125-
"0.6.2": {
126-
"imageName": "runpod/worker-v1-vllm:v1.5.0stable-cuda12.1.0",
125+
"0.6.3": {
126+
"imageName": "runpod/worker-v1-vllm:v1.6.0stable-cuda12.1.0",
127127
"minimumCudaVersion": "12.1",
128128
"categories": [
129129
{
@@ -134,7 +134,7 @@
134134
"MAX_MODEL_LEN", "GUIDED_DECODING_BACKEND", "DISTRIBUTED_EXECUTOR_BACKEND",
135135
"WORKER_USE_RAY", "RAY_WORKERS_USE_NSIGHT", "PIPELINE_PARALLEL_SIZE",
136136
"TENSOR_PARALLEL_SIZE", "MAX_PARALLEL_LOADING_WORKERS", "ENABLE_PREFIX_CACHING",
137-
"DISABLE_SLIDING_WINDOW", "USE_V2_BLOCK_MANAGER", "NUM_LOOKAHEAD_SLOTS",
137+
"DISABLE_SLIDING_WINDOW", "NUM_LOOKAHEAD_SLOTS",
138138
"SEED", "NUM_GPU_BLOCKS_OVERRIDE", "MAX_NUM_BATCHED_TOKENS", "MAX_NUM_SEQS",
139139
"MAX_LOGPROBS", "DISABLE_LOG_STATS", "QUANTIZATION", "ROPE_SCALING", "ROPE_THETA",
140140
"TOKENIZER_POOL_SIZE", "TOKENIZER_POOL_TYPE", "TOKENIZER_POOL_EXTRA_CONFIG",
@@ -146,7 +146,8 @@
146146
"NGRAM_PROMPT_LOOKUP_MAX", "NGRAM_PROMPT_LOOKUP_MIN", "SPEC_DECODING_ACCEPTANCE_METHOD",
147147
"TYPICAL_ACCEPTANCE_SAMPLER_POSTERIOR_THRESHOLD", "TYPICAL_ACCEPTANCE_SAMPLER_POSTERIOR_ALPHA",
148148
"MODEL_LOADER_EXTRA_CONFIG", "PREEMPTION_MODE", "PREEMPTION_CHECK_PERIOD",
149-
"PREEMPTION_CPU_CAPACITY", "MAX_LOG_LEN", "DISABLE_LOGGING_REQUEST"
149+
"PREEMPTION_CPU_CAPACITY", "MAX_LOG_LEN", "DISABLE_LOGGING_REQUEST",
150+
"ENABLE_AUTO_TOOL_CHOICE", "TOOL_CALL_PARSER"
150151
]
151152
},
152153
{
@@ -182,8 +183,8 @@
182183
}
183184
]
184185
},
185-
"0.6.1": {
186-
"imageName": "runpod/worker-v1-vllm:v1.4.0stable-cuda12.1.0",
186+
"0.6.2": {
187+
"imageName": "runpod/worker-v1-vllm:v1.5.0stable-cuda12.1.0",
187188
"minimumCudaVersion": "12.1",
188189
"categories": [
189190
{
@@ -242,8 +243,8 @@
242243
}
243244
]
244245
},
245-
"0.5.5": {
246-
"imageName": "runpod/worker-v1-vllm:v1.3.1stable-cuda12.1.0",
246+
"0.6.1": {
247+
"imageName": "runpod/worker-v1-vllm:v1.4.0stable-cuda12.1.0",
247248
"minimumCudaVersion": "12.1",
248249
"categories": [
249250
{

0 commit comments

Comments (0)