Skip to content

Commit 9b9f288

Browse files
committed
updated LoRA adapters
Signed-off-by: Nir Rozenbaum <[email protected]>
1 parent 7cfd036 commit 9b9f288

File tree

1 file changed

+2 additions, -18 deletions (lines changed)

1 file changed

+2 additions, -18 deletions (lines changed)

config/manifests/vllm/cpu-deployment.yaml

Lines changed: 2 additions & 18 deletions
Original file line number | Diff line number | Diff line change
@@ -26,8 +26,8 @@ spec:
2626
- "--max-loras"
2727
- "4"
2828
- "--lora-modules"
29-
- '{"name": "tweet-summary-0", "path": "/adapters/ai-blond/Qwen-Qwen2.5-Coder-1.5B-Instruct-lora_0"}'
30-
- '{"name": "tweet-summary-1", "path": "/adapters/ai-blond/Qwen-Qwen2.5-Coder-1.5B-Instruct-lora_1"}'
29+
- '{"name": "tweet-summary-0", "path": "SriSanth2345/Qwen-1.5B-Tweet-Generations", "base_model_name": "Qwen/Qwen2.5-1.5B"}'
30+
- '{"name": "tweet-summary-1", "path": "SriSanth2345/Qwen-1.5B-Tweet-Generations", "base_model_name": "Qwen/Qwen2.5-1.5B"}'
3131
env:
3232
- name: PORT
3333
value: "8000"
@@ -73,22 +73,6 @@ spec:
7373
name: shm
7474
- name: adapters
7575
mountPath: "/adapters"
76-
initContainers:
77-
- name: adapter-loader
78-
image: ghcr.io/tomatillo-and-multiverse/adapter-puller:demo
79-
command: ["python"]
80-
args:
81-
- ./pull_adapters.py
82-
- --adapter
83-
- ai-blond/Qwen-Qwen2.5-Coder-1.5B-Instruct-lora
84-
- --duplicate-count
85-
- "4"
86-
env:
87-
- name: HF_HOME
88-
value: /adapters
89-
volumeMounts:
90-
- name: adapters
91-
mountPath: "/adapters"
9276
restartPolicy: Always
9377
schedulerName: default-scheduler
9478
terminationGracePeriodSeconds: 30

0 commit comments

Comments (0)