add docker compose for qwen 5b
This commit is contained in:
commit
434a7e0f29
32
docker-compose-qwen.yml
Normal file
32
docker-compose-qwen.yml
Normal file
@ -0,0 +1,32 @@
|
||||
# Docker Compose definition that runs the vllm/vllm-openai image with the
# Qwen/Qwen2.5-1.5B-Instruct model and registers it with Traefik under /qwen.

networks:
  # Declared external: this file attaches to the network but does not create
  # it, so it must already exist before `docker compose up`.
  traefik-exposed:
    name: traefik-exposed
    external: true

services:
  qwen:
    image: vllm/vllm-openai:latest
    runtime: nvidia
    restart: always
    networks:
      - traefik-exposed
    deploy:
      resources:
        reservations:
          # Reserve GPU-capable device(s) for this container.
          devices:
            - capabilities: [gpu]
    volumes:
      # Mount the host user's Hugging Face cache directory into the container.
      - ~/.cache/huggingface:/root/.cache/huggingface
    ports:
      # Published directly on the host in addition to the Traefik route below.
      # Keep in sync with `--port` in `command` and the loadbalancer port label.
      - "5432:5432"
    # Folded scalar: the lines below are joined with single spaces into one
    # argument string.
    command: >-
      --model Qwen/Qwen2.5-1.5B-Instruct
      --port 5432
      --quantization bitsandbytes
    labels:
      - "traefik.enable=true"
      # Match requests for odin.capgemini.com whose path starts with /qwen.
      - "traefik.http.routers.qwen.rule=Host(`odin.capgemini.com`) && PathPrefix(`/qwen`)"
      - "traefik.http.routers.qwen.entrypoints=web"
      - "traefik.http.services.qwen.loadbalancer.server.port=5432"
      # Remove the /qwen prefix from the path before forwarding to the service.
      - "traefik.http.routers.qwen.middlewares=qwen-stripprefix"
      - "traefik.http.middlewares.qwen-stripprefix.stripprefix.prefixes=/qwen"
      # HTTPS is currently not supported on odin.
      # - "traefik.http.routers.http-catchall.middlewares=redirect-to-https"
      # - "traefik.http.middlewares.redirect-to-https.redirectscheme.scheme=https"
|
||||
Loading…
Reference in New Issue
Block a user