# compose.yaml
---
# Docker Compose definition for the prompt-compression service.
#
# Every `${NAME:-default}` value below is resolved by Compose variable
# interpolation: the variable is read from the shell environment or an
# `.env` file, and the text after `:-` is used when it is unset or empty.
services:
  prompt-compression:
    # Build the image from the directory containing this file and tag the
    # result so it can be referenced as `prompt-compression:local`.
    build:
      context: .
    image: prompt-compression:local
    # host:container mapping; kept quoted so YAML always reads it as a string.
    ports:
      - "8080:8080"
    environment:
      # Model identifier handed to the service (looks like a Hugging Face
      # Hub repo id -- confirm against the application code).
      COMPRESSOR_MODEL: ${COMPRESSOR_MODEL:-microsoft/llmlingua-2-bert-base-multilingual-cased-meetingbank}
      COMPRESSOR_MIN_RATE: ${COMPRESSOR_MIN_RATE:-0.45}
      COMPRESSOR_DEVICE: ${COMPRESSOR_DEVICE:-cpu}
      # Semicolon-separated `name=path` pairs; presumably adapter slots
      # resolved by the service at startup -- TODO confirm the path base.
      COMPRESSOR_ADAPTER_SLOTS: ${COMPRESSOR_ADAPTER_SLOTS:-tenant_lora_probe=models/tenant_lora_probe;tenant_rick_probe=models/tenant_rick_probe}
      # Semicolon-separated slot names; the default lists `base` plus the
      # two slot names declared in COMPRESSOR_ADAPTER_SLOTS above.
      COMPRESSOR_PRELOAD_SLOTS: ${COMPRESSOR_PRELOAD_SLOTS:-base;tenant_lora_probe;tenant_rick_probe}
      # Both cache variables point at the mounted volume path below.
      # NOTE(review): recent `transformers` releases deprecate
      # TRANSFORMERS_CACHE in favour of HF_HOME; it is kept here because
      # dropping it would move where model files land inside the volume.
      HF_HOME: /cache/huggingface
      TRANSFORMERS_CACHE: /cache/huggingface
    # Named volume mounted at the cache path so downloaded files outlive
    # container re-creation.
    volumes:
      - huggingface-cache:/cache/huggingface
    restart: unless-stopped

# Named volumes referenced by the services above (default driver/options).
volumes:
  huggingface-cache: