# localgenai/pyinfra/framework/compose/whisper.yml

# Wyoming Whisper — speech-to-text over the Wyoming protocol.
# https://github.com/rhasspy/wyoming-whisper
#
# Wyoming is the voice protocol used by Home Assistant, but any Wyoming
# client can connect to this server. There is no web UI — it is a
# protocol server listening on TCP :10300.
#
# Model selection: `tiny-int8` is the smallest viable model (~75 MB),
# fast and good enough for command-style transcription. Bump to
# `base-int8` (140 MB) or `small-int8` (480 MB) for general dictation.
# Models are downloaded into /srv/docker/whisper/data on first start.
services:
  # The single Wyoming speech-to-text service defined by this file.
  whisper:
    container_name: wyoming-whisper
    image: rhasspy/wyoming-whisper:latest
    # Restart automatically unless the container was stopped on purpose.
    restart: unless-stopped
    # Command-line arguments for the container; each flag is followed by
    # its value as a separate list item.
    command:
      # Model to load.
      - --model
      - tiny-int8
      # Language setting passed to the server.
      - --language
      - en
      # Beam size; quoted so it is passed as a string, not an integer.
      - --beam-size
      - "1"
    # Host directory mounted at /data inside the container.
    volumes:
      - /srv/docker/whisper/data:/data
    # Publish container port 10300 on the same host port.
    ports:
      - "10300:10300"