Add Docker Compose file for Qwen2.5-1.5B-Instruct
This commit is contained in:
commit
434a7e0f29
32
docker-compose-qwen.yml
Normal file
32
docker-compose-qwen.yml
Normal file
@ -0,0 +1,32 @@
---
# Docker Compose stack that runs the vllm/vllm-openai image with the
# Qwen/Qwen2.5-1.5B-Instruct model and exposes it through Traefik labels
# under the /qwen path prefix.

networks:
  # Declared external, so Compose attaches to an already existing network
  # named "traefik-exposed" instead of creating one.
  traefik-exposed:
    name: traefik-exposed
    external: true

services:
  qwen:
    image: vllm/vllm-openai:latest
    runtime: nvidia
    restart: always
    networks:
      - traefik-exposed
    # Reserve a GPU-capable device for the container.
    deploy:
      resources:
        reservations:
          devices:
            - capabilities: [gpu]
    volumes:
      # Bind-mounts the host user's Hugging Face cache into the container
      # (presumably so downloaded weights are reused between runs).
      - ~/.cache/huggingface:/root/.cache/huggingface
    ports:
      # Must stay in sync with "--port" in `command` and with the Traefik
      # loadbalancer port label below; all three use 5432.
      - "5432:5432"
    command: --model Qwen/Qwen2.5-1.5B-Instruct --port 5432 --quantization bitsandbytes
    labels:
      - "traefik.enable=true"
      # Match requests for odin.capgemini.com whose path starts with /qwen.
      - "traefik.http.routers.qwen.rule=Host(`odin.capgemini.com`) && PathPrefix(`/qwen`)"
      - "traefik.http.routers.qwen.entrypoints=web"
      - "traefik.http.services.qwen.loadbalancer.server.port=5432"
      # Attach the strip-prefix middleware, configured on the next label to
      # remove the /qwen prefix.
      - "traefik.http.routers.qwen.middlewares=qwen-stripprefix"
      - "traefik.http.middlewares.qwen-stripprefix.stripprefix.prefixes=/qwen"
      # HTTPS is currently not supported on odin.
      # - "traefik.http.routers.http-catchall.middlewares=redirect-to-https"
      # - "traefik.http.middlewares.redirect-to-https.redirectscheme.scheme=https"
Loading…
Reference in New Issue
Block a user