summaryrefslogtreecommitdiff
path: root/config.yaml.example
blob: 39880356de9c8ddabc6abffbde44bf46f0b65bd9 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
# TotalRecall Configuration Example
# Copy this to ~/.totalrecall.yaml or ./.totalrecall.yaml

# Audio configuration
audio:
  # Audio is generated using OpenAI TTS.
  # There is no provider field: OpenAI is the only option.

  # Audio output format
  format: mp3

  # OpenAI TTS settings
  # API key placeholder; quoted so the templated value is always a string.
  # NOTE(review): presumably the key can instead be supplied through the
  # OPENAI_API_KEY environment variable - confirm against the loader.
  openai_key: "${OPENAI_API_KEY}"
  openai_model: gpt-4o-mini-tts  # Options: tts-1, tts-1-hd, gpt-4o-mini-tts
  openai_speed: 0.9  # Range: 0.25 to 4.0 (may be ignored by gpt-4o-mini models)

  # Voice instructions for the gpt-4o-mini-tts model.
  # This allows you to customize how the AI speaks.
  # Written as a folded scalar (>-): the lines below are joined with single
  # spaces into one string, with no trailing newline.
  openai_instruction: >-
    You are speaking Bulgarian language (български език).
    Pronounce the Bulgarian text with authentic Bulgarian phonetics,
    not Russian.
    Speak slowly and clearly for language learners.

  # Alternative instruction examples (uncomment one and remove the value above):
  # openai_instruction: "Speak in Bulgarian (not Russian!). Use native Bulgarian pronunciation with clear articulation for each syllable."
  # openai_instruction: "You are a Bulgarian language teacher. Pronounce the Bulgarian words slowly with authentic Bulgarian accent and phonetics."
  # openai_instruction: "Speak Bulgarian text with proper Bulgarian pronunciation. Avoid Russian accent. Speak clearly at a pace suitable for beginners."

# Image configuration
image:
  # Image generation backend. Only "openai" is supported at the moment.
  provider: openai

  # --- OpenAI DALL-E settings ---

  # Model to use. Options: dall-e-2, dall-e-3
  openai_model: dall-e-3

  # Image dimensions. Available options vary by model.
  openai_size: '1024x1024'

  # Rendering quality. Options: standard, hd (dall-e-3 only)
  openai_quality: standard

  # Rendering style. Options: natural, vivid (dall-e-3 only)
  openai_style: natural

# Output configuration
output:
  # Directory setting for output.
  # NOTE(review): the leading "~" is presumably expanded to the user's home
  # directory by the application - confirm. Quoted so it is always a string.
  directory: '~/Downloads'