mirror of
https://github.com/runyanjake/olomana.git
synced 2026-06-25 08:04:52 -07:00
Update organization of software
This commit is contained in:
parent
e45d794be6
commit
29e5b9a199
@ -1,38 +0,0 @@
|
|||||||
services:
  # llama.cpp HTTP server (CUDA image), published through the external
  # Traefik network.
  llama-cpp:
    image: ghcr.io/ggml-org/llama.cpp:server-cuda
    container_name: llama-cpp
    restart: unless-stopped
    networks:
      - traefik
    volumes:
      # Host model directory, mounted at /models inside the container.
      - /pwspool/software/llama-cpp/models:/models
    # Server settings are passed as command-line flags (instead of
    # environment variables) to guarantee they are applied.
    command:
      - "--model"
      - "/models/Qwen3.5-35B-A3B-UD-IQ2_XXS.gguf"
      - "--host"
      - "0.0.0.0"
      - "--port"
      - "8080"
      - "--n-gpu-layers"
      - "99"
      - "--ctx-size"
      - "8192"
    deploy:
      resources:
        reservations:
          # Reserve every NVIDIA GPU on the host for this container.
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]
    labels:
      # Traefik routing: llm.whitney.rip on the websecure entrypoint,
      # forwarded to the server port given in `command` (8080).
      - "traefik.enable=true"
      - "traefik.http.routers.llama.rule=Host(`llm.whitney.rip`)"
      - "traefik.http.routers.llama.entrypoints=websecure"
      - "traefik.http.routers.llama.tls.certresolver=lets-encrypt"
      - "traefik.http.services.llama.loadbalancer.server.port=8080"
|
|
||||||
|
|
||||||
# The traefik network is created outside this Compose project; Compose
# attaches to it rather than creating it.
networks:
  traefik:
    external: true
|
|
||||||
Loading…
x
Reference in New Issue
Block a user