From a657cd5be64fbae4a50786b1c828dad55d907fa2 Mon Sep 17 00:00:00 2001
From: Sam Stoelinga
Date: Wed, 20 Nov 2024 11:34:40 -0800
Subject: [PATCH] revert back 125m model changes

---
 manifests/models/opt-125m-cpu.yaml | 7 -------
 1 file changed, 7 deletions(-)

diff --git a/manifests/models/opt-125m-cpu.yaml b/manifests/models/opt-125m-cpu.yaml
index d5320244..9fb87e57 100644
--- a/manifests/models/opt-125m-cpu.yaml
+++ b/manifests/models/opt-125m-cpu.yaml
@@ -5,13 +5,6 @@ metadata:
   name: opt-125m-cpu
 spec:
   features: [TextGeneration]
-  env:
-    VLLM_WORKER_MULTIPROC_METHOD: spawn
-    # VLLM_RPC_TIMEOUT: "10000"
-    # VLLM_CPU_KVCACHE_SPACE: "1"
-  args:
-    - --disable-frontend-multiprocessing
-    - --max-num-seqs=1
   owner: facebook
   url: hf://facebook/opt-125m
   engine: VLLM