2026-05-29 07:16:02 +00:00
|
|
|
|
# Конфигурация пайплайна транскрибации совещаний
|
|
|
|
|
|
|
|
|
|
|
|
# Профили оборудования
|
|
|
|
|
|
profiles:
|
|
|
|
|
|
# Текущий: MacBook Air M4, 16GB RAM
|
|
|
|
|
|
mac_m4:
|
|
|
|
|
|
device: cpu # MPS на Mac может быть медленнее/багован; CPU + int8 стабильнее
|
|
|
|
|
|
compute_type: int8
|
2026-05-29 09:42:07 +00:00
|
|
|
|
batch_size: 2 # Оптимум для CPU (1.2-1.3x быстрее, RAM ~4.5 GB)
|
2026-05-29 07:16:02 +00:00
|
|
|
|
model: large-v3
|
|
|
|
|
|
language: ru
|
|
|
|
|
|
diarize: true
|
|
|
|
|
|
|
|
|
|
|
|
# Будущий: GPU с 8GB VRAM
|
|
|
|
|
|
gpu_8gb:
|
|
|
|
|
|
device: cuda
|
|
|
|
|
|
compute_type: float16 # или int8 если не хватает памяти
|
|
|
|
|
|
batch_size: 1 # large-v3 + alignment + diarization в ~8GB
|
|
|
|
|
|
model: large-v3
|
|
|
|
|
|
language: ru
|
|
|
|
|
|
diarize: true
|
|
|
|
|
|
|
|
|
|
|
|
# Универсальный CPU (без GPU)
|
|
|
|
|
|
cpu_best:
|
|
|
|
|
|
device: cpu
|
|
|
|
|
|
compute_type: int8
|
|
|
|
|
|
batch_size: 1
|
|
|
|
|
|
model: large-v3
|
|
|
|
|
|
language: ru
|
|
|
|
|
|
diarize: true
|
|
|
|
|
|
|
|
|
|
|
|
# Активный профиль (можно переопределить через CLI: --profile gpu_8gb)
|
|
|
|
|
|
active_profile: mac_m4
|
|
|
|
|
|
|
|
|
|
|
|
# Настройки диаризации
|
|
|
|
|
|
hf_token: null # HuggingFace токен для pyannote. Установите через env: HF_TOKEN
|
|
|
|
|
|
|
|
|
|
|
|
# Настройки выходного документа
|
|
|
|
|
|
output:
|
2026-05-29 08:39:13 +00:00
|
|
|
|
formats: [docx, md] # Список форматов: docx, md, txt. Можно указать один или несколько.
|
2026-05-29 07:16:02 +00:00
|
|
|
|
include_timestamps: true
|
|
|
|
|
|
speaker_label_style: name # name | id | none
|
|
|
|
|
|
paragraph_pause_sec: 2.0 # новый абзац, если пауза > N секунд
|
|
|
|
|
|
|
2026-06-01 14:40:58 +00:00
|
|
|
|
# Настройки RAG (LightRAG для протоколов совещаний)
|
|
|
|
|
|
rag:
|
|
|
|
|
|
enabled: true
|
|
|
|
|
|
auto_index: true
|
|
|
|
|
|
sections:
|
|
|
|
|
|
- Планировка
|
|
|
|
|
|
- Конструкции
|
|
|
|
|
|
- MEP
|
|
|
|
|
|
- Отделка
|
|
|
|
|
|
- Общие вопросы
|
|
|
|
|
|
- Согласование
|
|
|
|
|
|
- Контроль качества
|
|
|
|
|
|
index_backend: opencode
|
|
|
|
|
|
index_model: mimo-v2.5-free
|
|
|
|
|
|
chat_backend: opencode
|
|
|
|
|
|
chat_model: deepseek-v4-flash-free
|
|
|
|
|
|
summary_auto: true
|
|
|
|
|
|
summary_model: deepseek-v4-flash-free
|
|
|
|
|
|
summary_chunk_size: 10000
|
|
|
|
|
|
classify_chunk_size: 7000
|
2026-06-01 14:41:31 +00:00
|
|
|
|
opencode_api_key: "sk-4jJBUMS7WJyBOtZZAexsSy6aT4NKOYp2gA19WLlaux8jHMw0HvyCl1V45Jf8SONz" # Или через env: OPENCODE_API_KEY
|
2026-06-01 14:40:58 +00:00
|
|
|
|
opencode_url: "https://opencode.ai/zen/v1"
|
|
|
|
|
|
project_index_dir: ./processed/lightrag_caches
|
|
|
|
|
|
|
|
|
|
|
|
# Очередь обработки
|
|
|
|
|
|
queue:
|
|
|
|
|
|
transcribe_workers: 2
|
|
|
|
|
|
postprocess_workers: 1
|
|
|
|
|
|
|
2026-06-01 15:54:25 +00:00
|
|
|
|
# Авторизация и multi-tenant (org + projects)
|
|
|
|
|
|
auth:
|
|
|
|
|
|
jwt_secret: "" # Обязательно задайте JWT_SECRET в .env для production
|
|
|
|
|
|
jwt_expire_hours: 168
|
|
|
|
|
|
database_path: ./data/transcriba.db
|
|
|
|
|
|
bootstrap:
|
|
|
|
|
|
org_slug: merakom
|
|
|
|
|
|
org_name: "МЕРАКОМ"
|
|
|
|
|
|
admin_username: admin
|
|
|
|
|
|
admin_password: "admin123" # Смените после первого входа; или AUTH_ADMIN_PASSWORD в .env
|
|
|
|
|
|
default_projects:
|
|
|
|
|
|
- slug: "2026"
|
|
|
|
|
|
name: "2026"
|
|
|
|
|
|
- slug: "gp-merakom"
|
|
|
|
|
|
name: "ГП МЕРАКОМ"
|
|
|
|
|
|
|
2026-05-29 07:16:02 +00:00
|
|
|
|
# Пути
|
|
|
|
|
|
paths:
|
|
|
|
|
|
output_dir: ./output
|
|
|
|
|
|
temp_dir: ./tmp
|