From 8e3c26be14109bcfcbff1b98a89b68c8f17b97f9 Mon Sep 17 00:00:00 2001 From: pandyamarut Date: Mon, 30 Dec 2024 17:41:10 -0800 Subject: [PATCH] update worker-config Signed-off-by: pandyamarut --- worker-config.json | 25 +++++++++++++------------ 1 file changed, 13 insertions(+), 12 deletions(-) diff --git a/worker-config.json b/worker-config.json index c150314..7845882 100644 --- a/worker-config.json +++ b/worker-config.json @@ -1,7 +1,7 @@ { "versions": { - "0.6.4": { - "imageName": "runpod/worker-v1-vllm:v1.7.0stable-cuda12.1.0", + "0.6.6": { + "imageName": "runpod/worker-v1-vllm:v1.8.0stable-cuda12.1.0", "minimumCudaVersion": "12.1", "categories": [ { @@ -61,8 +61,8 @@ } ] }, - "0.6.3": { - "imageName": "runpod/worker-v1-vllm:v1.6.0stable-cuda12.1.0", + "0.6.4": { + "imageName": "runpod/worker-v1-vllm:v1.7.0stable-cuda12.1.0", "minimumCudaVersion": "12.1", "categories": [ { @@ -122,8 +122,8 @@ } ] }, - "0.6.2": { - "imageName": "runpod/worker-v1-vllm:v1.5.0stable-cuda12.1.0", + "0.6.3": { + "imageName": "runpod/worker-v1-vllm:v1.6.0stable-cuda12.1.0", "minimumCudaVersion": "12.1", "categories": [ { @@ -134,7 +134,7 @@ "MAX_MODEL_LEN", "GUIDED_DECODING_BACKEND", "DISTRIBUTED_EXECUTOR_BACKEND", "WORKER_USE_RAY", "RAY_WORKERS_USE_NSIGHT", "PIPELINE_PARALLEL_SIZE", "TENSOR_PARALLEL_SIZE", "MAX_PARALLEL_LOADING_WORKERS", "ENABLE_PREFIX_CACHING", - "DISABLE_SLIDING_WINDOW", "USE_V2_BLOCK_MANAGER", "NUM_LOOKAHEAD_SLOTS", + "DISABLE_SLIDING_WINDOW", "NUM_LOOKAHEAD_SLOTS", "SEED", "NUM_GPU_BLOCKS_OVERRIDE", "MAX_NUM_BATCHED_TOKENS", "MAX_NUM_SEQS", "MAX_LOGPROBS", "DISABLE_LOG_STATS", "QUANTIZATION", "ROPE_SCALING", "ROPE_THETA", "TOKENIZER_POOL_SIZE", "TOKENIZER_POOL_TYPE", "TOKENIZER_POOL_EXTRA_CONFIG", @@ -146,7 +146,8 @@ "NGRAM_PROMPT_LOOKUP_MAX", "NGRAM_PROMPT_LOOKUP_MIN", "SPEC_DECODING_ACCEPTANCE_METHOD", "TYPICAL_ACCEPTANCE_SAMPLER_POSTERIOR_THRESHOLD", "TYPICAL_ACCEPTANCE_SAMPLER_POSTERIOR_ALPHA", "MODEL_LOADER_EXTRA_CONFIG", "PREEMPTION_MODE", "PREEMPTION_CHECK_PERIOD", - "PREEMPTION_CPU_CAPACITY", "MAX_LOG_LEN", "DISABLE_LOGGING_REQUEST" + "PREEMPTION_CPU_CAPACITY", "MAX_LOG_LEN", "DISABLE_LOGGING_REQUEST", + "ENABLE_AUTO_TOOL_CHOICE", "TOOL_CALL_PARSER" ] }, { @@ -182,8 +183,8 @@ } ] }, - "0.6.1": { - "imageName": "runpod/worker-v1-vllm:v1.4.0stable-cuda12.1.0", + "0.6.2": { + "imageName": "runpod/worker-v1-vllm:v1.5.0stable-cuda12.1.0", "minimumCudaVersion": "12.1", "categories": [ { @@ -242,8 +243,8 @@ } ] }, - "0.5.5": { - "imageName": "runpod/worker-v1-vllm:v1.3.1stable-cuda12.1.0", + "0.6.1": { + "imageName": "runpod/worker-v1-vllm:v1.4.0stable-cuda12.1.0", "minimumCudaVersion": "12.1", "categories": [ {