# Docker Compose definition for a single GPUStack container with NVIDIA GPU
# access.
services:
  gpustack:
    image: gpustack/gpustack:v0.6.2-cuda12.8
    container_name: gpustack
    restart: unless-stopped
    ports:
      # Format is "host:container"; quoted so the mapping is always a string.
      - "4080:80"
      - "10150:10150"
    environment:
      TZ: Asia/Shanghai
      # Hugging Face mirror endpoint.
      HF_ENDPOINT: https://hf-mirror.com
    volumes:
      # Data directory mount.
      - ./data:/var/lib/gpustack
      # Front-end (UI) pages, overlaid on the packaged UI directory.
      - ./data/ui:/usr/local/lib/python3.10/dist-packages/gpustack/ui
    # IP address of the Docker host; adjust to match the machine running this.
    command: ["--worker-ip", "192.168.1.10"]
    deploy:
      resources:
        limits:
          cpus: '4.0'
          memory: 8G
        reservations:
          cpus: '2'
          memory: 4G
          # GPU device reservation (NVIDIA driver).
          devices:
            - driver: nvidia
              # To restrict the container to specific GPUs, use instead:
              # device_ids: ['0', '1']
              # Use all GPUs.
              device_ids: ['all']
              capabilities: [gpu]

#### /etc/docker/daemon.json must register the nvidia-container-runtime, e.g.:
#"runtimes": {
#        "nvidia": {
#            "args": [],
#            "path": "nvidia-container-runtime"
#        }
#    }
####