Blame view

third-party/xinference/docker-compose.yml 634 Bytes
b401ef94   tangwang   third-party/xinfe...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
  # Single-service Compose stack that runs an Xinference server with access
  # to the host's NVIDIA GPUs.
  version: "3.8"

  services:
    xinference:
      container_name: xinference
      # NOTE(review): `latest` is a floating tag; pin a release tag if
      # reproducible deployments are required.
      image: xprobe/xinference:latest
      # Bind to all interfaces so the published ports below are reachable
      # from outside the container (presumably `-H` is the listen host —
      # confirm against the Xinference CLI help).
      command: xinference-local -H 0.0.0.0
      restart: unless-stopped

      # Host:container port mappings. 9997 is the HTTP endpoint probed by
      # the healthcheck; the role of 9998 is not visible in this file.
      ports:
        - "9997:9997"
        - "9998:9998"

      # XINFERENCE_HOME points at /data, which is backed by the host
      # directory ./models through the bind mount below.
      environment:
        XINFERENCE_HOME: /data
      volumes:
        - ./models:/data

      # Reserve every NVIDIA GPU device on the host for this container.
      deploy:
        resources:
          reservations:
            devices:
              - driver: nvidia
                count: all
                capabilities:
                  - gpu

      # The container is healthy when the model-listing endpoint answers
      # without an HTTP error (`curl -f` exits non-zero on error statuses).
      # NOTE(review): assumes `curl` is present in the image — confirm.
      healthcheck:
        test:
          - CMD
          - curl
          - -f
          - http://localhost:9997/v1/models
        start_period: 40s
        interval: 30s
        timeout: 10s
        retries: 3