# voice/.env.example
# Local TTS pipeline configuration example
# Copy this file to .env and adjust values.

# Network and logging settings.
# NOTE(review): presumably the bind address/port of the TTS service and its
# log verbosity — confirm against the code that loads this file.
HOST=0.0.0.0
PORT=8765
LOG_LEVEL=INFO

# Available backends:
#   dummy       — sine-wave test (no GPU, no deps)
#   s2          — Fish Audio S2-Pro INT4 (requires the S2 API server on port 8081; see S2_API_URL)
#   fish_speech — Fish Speech 1.5 (requires a fish-speech checkpoint)
#   f5_tts      — F5-TTS v1 (experimental)
#   xtts_v2     — XTTS-v2 by Coqui (auto-download, ~2 GB VRAM)
TTS_BACKEND=s2

# Paths for Fish Speech / XTTS backends
TTS_MODEL_PATH=models/fishaudio_fish-speech-1.5
TTS_VOCAB_PATH=models/fish-speech
TTS_MODEL_NAME=tts_models/multilingual/multi-dataset/xtts_v2
# NOTE(review): units are not stated in this file — presumably Hz for the
# sample rate and a speaking-rate multiplier for the speed; confirm.
TTS_SAMPLE_RATE=44100
TTS_SPEED=1.5

# Fish Speech tuning
# NOTE(review): FISH_USE_MEMORY_CACHE is spelled on/off while the other flags
# in this file (FISH_COMPILE, WARMUP) use true/false — confirm which spellings
# the loader accepts before normalizing.
FISH_COMPILE=false
FISH_CHUNK_LENGTH=300
FISH_USE_MEMORY_CACHE=on
# Sampling parameters.
FISH_TOP_P=0.7
FISH_TEMPERATURE=0.7
FISH_REPETITION_PENALTY=1.2
# NOTE(review): 0 presumably disables these two settings — confirm.
FISH_TAIL_SILENCE_THRESHOLD=0
FISH_LOWPASS_CUTOFF=0

# Voice reference assets.
# NOTE(review): DEFAULT_REF_TEXT is presumably the transcript of
# DEFAULT_VOICE_REF — confirm. Whether the surrounding quotes of "" are
# stripped depends on the .env parser in use.
VOICES_DIR=voices
DEFAULT_VOICE_REF=voices/default_ref.wav
DEFAULT_REF_TEXT=""

# Segmentation (progressive threshold: the first segment is shorter)
# NOTE(review): segment lengths are presumably measured in characters and
# MAX_BUFFER_WAIT_MS in milliseconds (per its suffix) — confirm.
MIN_SEGMENT_LENGTH=30
MAX_SEGMENT_LENGTH=500
MAX_BUFFER_WAIT_MS=500
FAST_START_INITIAL=12
FAST_START_COUNT=3

# Compute device and numeric precision.
# NOTE(review): presumably forwarded to the model framework; which backends
# honor these values is not visible here — confirm.
DEVICE=cuda
DTYPE=bfloat16

# Warm-up settings.
# NOTE(review): presumably WARMUP_TEXT is synthesized once at startup when
# WARMUP=true — confirm. The sample text is Russian for
# "Hello. This is a test phrase."
WARMUP=true
WARMUP_TEXT="Привет. Это тестовая фраза."

# S2 API server URL (the s2 backend requires this server; the port matches
# the 8081 mentioned in the backend list)
S2_API_URL=http://127.0.0.1:8081