version: '3.8'
services:
  # TabbyAPI container, built from the Dockerfile referenced below.
  tabbyapi:
    build:
      # Build context is the parent directory of the one holding this file.
      context: ..
      dockerfile: ./docker/Dockerfile
      args:
        # Build argument forwarded to the Dockerfile.
        # NOTE(review): presumably toggles fetching the latest sources during
        # the image build - confirm against the Dockerfile.
        - DO_PULL=true
    ports:
      # host:container. Kept quoted so the mapping is always read as a string.
      - "5000:5000"
    environment:
      - NAME=TabbyAPI
      # Expose every host GPU to the container via the NVIDIA runtime.
      - NVIDIA_VISIBLE_DEVICES=all
    # Bind mounts are optional and disabled by default. To enable them,
    # uncomment `volumes:` TOGETHER WITH at least one entry below and replace
    # the host-side path. Do not leave `volumes:` uncommented with no entries:
    # a bare key parses as null instead of a list.
    # volumes:
    #   - /path/to/models:/app/models                       # Change me
    #   - /path/to/config.yml:/app/config.yml               # Change me
    #   - /path/to/api_tokens.yml:/app/api_tokens.yml       # Change me
    deploy:
      resources:
        reservations:
          devices:
            # Reserve all NVIDIA GPUs on the host for this service.
            - driver: nvidia
              count: all
              capabilities: [gpu]