judgy_reachy_no_phone

Running

App Files Files Community

yaseminozkut committed on Jan 19

Commit

abc9157

1 Parent(s): 38b2b86

update voice ids

Browse files

Files changed (5) hide show

check_voices.py +69 -0
judgy_reachy_no_phone/audio.py +44 -9
judgy_reachy_no_phone/config.py +28 -8
judgy_reachy_no_phone/main.py +6 -1
judgy_reachy_no_phone/static/main.js +3 -3

check_voices.py ADDED Viewed

	@@ -0,0 +1,69 @@

+#!/usr/bin/env python3
+"""
+Check which ElevenLabs voices are available to you.
+Run this with: python check_voices.py YOUR_API_KEY
+"""
+import sys
+from elevenlabs import ElevenLabs
+if len(sys.argv) < 2:
+    print("Usage: python check_voices.py YOUR_ELEVENLABS_API_KEY")
+    sys.exit(1)
+api_key = sys.argv[1]
+client = ElevenLabs(api_key=api_key)
+print("\n=== Available Voices in Your Account ===\n")
+try:
+    voices = client.voices.get_all()
+    print(f"Total voices available: {len(voices.voices)}\n")
+    for voice in voices.voices:
+        # Check if it's likely a premade/stock voice
+        is_premade = hasattr(voice, 'category') and voice.category == 'premade'
+        voice_type = "STOCK" if is_premade else "CUSTOM"
+        print(f"  [{voice_type}] {voice.name}")
+        print(f"           ID: {voice.voice_id}")
+        if hasattr(voice, 'labels'):
+            labels = ', '.join([f"{k}: {v}" for k, v in voice.labels.items()])
+            print(f"           Labels: {labels}")
+        print()
+    print("\n=== Checking voices in your config.py ===\n")
+    config_voices = {
+        "mixtape": "H10ItvDnkRN5ysrvzT9J",
+        "angry_boss": "TxWZERZ5Hc6h9dGxVmXa",
+        "sarcastic": "FGY2WhTYpPnrIDTdsKH5",
+        "disappointed_parent": "Xb7hH8MSUJpSbSDYk0k2",
+        "motivational_coach": "IKne3meq5aSn9XLyUdCD",
+        "absurdist": "cgSgspJ2msm6clMCkdW9",
+        "corporate_ai": "weA4Q36twV5kwSaTEL0Q",
+        "british_butler": "JBFqnCBsd6RMkjVDRZzb"
+    }
+    all_voice_ids = [v.voice_id for v in voices.voices]
+    problems_found = False
+    for personality, vid in config_voices.items():
+        if vid in all_voice_ids:
+            voice = next(v for v in voices.voices if v.voice_id == vid)
+            print(f"  ✓ {personality}: {voice.name} ({vid})")
+        else:
+            print(f"  ✗ {personality}: {vid} - NOT AVAILABLE!")
+            problems_found = True
+    if problems_found:
+        print("\n⚠️  Some voices in your config are NOT available to your account.")
+        print("    You need to replace them with voices you have access to.")
+        print("    Use the voice IDs from the list above.")
+    else:
+        print("\n✓ All config voices are available!")
+except Exception as e:
+    print(f"Error: {e}")
+    import traceback
+    traceback.print_exc()

judgy_reachy_no_phone/audio.py CHANGED Viewed

@@ -199,12 +199,13 @@ class TextToSpeech:
         self.eleven_client = None
         self.chars_used = 0
         self.MONTHLY_LIMIT = 9000  # Leave buffer under 10k
         if elevenlabs_key:
             try:
                 from elevenlabs import ElevenLabs
                 self.eleven_client = ElevenLabs(api_key=elevenlabs_key)
-                logger.info(f"ElevenLabs TTS initialized")
             except ImportError:
                 logger.warning("elevenlabs package not installed, using Edge TTS")
             except Exception as e:
@@ -214,26 +215,60 @@ class TextToSpeech:
         """Get the appropriate voice based on personality and user override."""
         personality_data = PERSONALITIES.get(self.personality, PERSONALITIES["mixtape"])
-        # User override always wins
         edge_voice = self.user_edge_voice if self.user_edge_voice else personality_data.get("default_voice", "en-US-AnaNeural")
-        eleven_voice = self.user_eleven_voice if self.user_eleven_voice else personality_data.get("default_eleven_voice", "21m00Tcm4TlvDq8ikWAM")
-        return edge_voice, eleven_voice
     async def synthesize(self, text: str, output_path: str = "/tmp/judgy_reachy_tts.mp3") -> str:
         """Convert text to speech, return path to audio file."""
         # Get appropriate voices for current personality
-        edge_voice, eleven_voice = self._get_voice_for_personality()
         # Try ElevenLabs first if available and under limit
         if self.eleven_client and (self.chars_used + len(text)) < self.MONTHLY_LIMIT:
-            try:
-                return await self._synthesize_elevenlabs(text, output_path, eleven_voice)
-            except Exception as e:
-                logger.warning(f"ElevenLabs failed: {e}, falling back to Edge TTS")
         # Fallback to Edge TTS (always works, unlimited)
         return await self._synthesize_edge(text, output_path, edge_voice)
     async def _synthesize_elevenlabs(self, text: str, output_path: str, voice_id: str) -> str:

         self.eleven_client = None
         self.chars_used = 0
         self.MONTHLY_LIMIT = 9000  # Leave buffer under 10k
+        self.working_voice_cache = {}  # Cache of personality -> working voice ID
         if elevenlabs_key:
             try:
                 from elevenlabs import ElevenLabs
                 self.eleven_client = ElevenLabs(api_key=elevenlabs_key)
+                logger.info(f"ElevenLabs TTS initialized (voices will be validated on first use)")
             except ImportError:
                 logger.warning("elevenlabs package not installed, using Edge TTS")
             except Exception as e:
         """Get the appropriate voice based on personality and user override."""
         personality_data = PERSONALITIES.get(self.personality, PERSONALITIES["mixtape"])
+        # User override always wins for edge voice
         edge_voice = self.user_edge_voice if self.user_edge_voice else personality_data.get("default_voice", "en-US-AnaNeural")
+        # For ElevenLabs voice, handle list of voices (try in order) or single voice (backward compatibility)
+        if self.user_eleven_voice:
+            # User specified a custom voice
+            eleven_voices = [self.user_eleven_voice]
+        else:
+            # Get from personality config - handle both list and single voice
+            eleven_voice_data = personality_data.get("default_eleven_voices", personality_data.get("default_eleven_voice", "21m00Tcm4TlvDq8ikWAM"))
+            if isinstance(eleven_voice_data, list):
+                eleven_voices = eleven_voice_data
+            else:
+                eleven_voices = [eleven_voice_data]
+        return edge_voice, eleven_voices
     async def synthesize(self, text: str, output_path: str = "/tmp/judgy_reachy_tts.mp3") -> str:
         """Convert text to speech, return path to audio file.

         ElevenLabs is attempted only when a client is set and
         chars_used + len(text) stays below MONTHLY_LIMIT. In that case the
         voice cached for the current personality is tried first, then each
         candidate voice ID in order; the first one that succeeds is cached
         for the personality and its result returned. If ElevenLabs is
         skipped, or every attempt raises, Edge TTS is used instead.

         Note (review): the cache is keyed by personality only, so a cached
         voice is tried before the candidates returned by
         _get_voice_for_personality(), including a user-specified voice.
         Confirm this is intended.

         Args:
             text: Text to synthesize.
             output_path: Path handed to the backend synthesizer.

         Returns:
             The value returned by _synthesize_elevenlabs or
             _synthesize_edge (annotated as the audio file path).
         """
         # Resolve the Edge voice and the ordered ElevenLabs candidates for the current personality
+        edge_voice, eleven_voices = self._get_voice_for_personality()
         # Try ElevenLabs first if a client exists and this text stays under the character budget
         if self.eleven_client and (self.chars_used + len(text)) < self.MONTHLY_LIMIT:
+            # Check cache first: a voice that already succeeded for this personality
+            if self.personality in self.working_voice_cache:
+                try:
+                    cached_voice = self.working_voice_cache[self.personality]
+                    logger.info(f"Using cached ElevenLabs voice: {cached_voice}")
+                    return await self._synthesize_elevenlabs(text, output_path, cached_voice)
+                except Exception as e:
+                    logger.warning(f"Cached voice failed: {e}, trying other voices")
+                    # Evict the failed voice; the loop below will try it again if it is still in eleven_voices
+                    del self.working_voice_cache[self.personality]
+            # Try each voice in the list until one works
+            for voice_id in eleven_voices:
+                try:
+                    logger.info(f"Trying ElevenLabs voice: {voice_id}")
+                    result = await self._synthesize_elevenlabs(text, output_path, voice_id)
+                    # Success! Cache this voice so later calls for this personality try it first
+                    self.working_voice_cache[self.personality] = voice_id
+                    logger.info(f"✓ Voice {voice_id} works! Cached for {self.personality}")
+                    return result
+                except Exception as e:
+                    logger.warning(f"Voice {voice_id} failed: {e}, trying next...")
+                    continue
+            # All voices failed; fall through to the Edge TTS path below
+            logger.warning(f"All ElevenLabs voices failed for {self.personality}, falling back to Edge TTS")
         # Fallback to Edge TTS: reached when ElevenLabs was skipped or every attempt raised
+        logger.info(f"Using Edge TTS with voice: {edge_voice}")
         return await self._synthesize_edge(text, output_path, edge_voice)
     async def _synthesize_elevenlabs(self, text: str, output_path: str, voice_id: str) -> str:

judgy_reachy_no_phone/config.py CHANGED Viewed

@@ -97,7 +97,11 @@ PERSONALITIES = {
         "name": "🎵 Chaos Mode",
         "voice": "Unpredictable. Each response is a completely different personality.",
         "default_voice": "en-US-AnaNeural",  # Versatile female voice
-        "default_eleven_voice": "Iz2kaKkJmFf0yaZAMDTV",  # Rachel - versatile, neutral
         "prewritten_shame": None,  # Will randomly select from other personalities
         "prewritten_praise": None,  # Will randomly select from other personalities
         "shame": None,  # Will randomly select from others
@@ -108,7 +112,10 @@ PERSONALITIES = {
         "name": "😠 Angry Boss",
         "voice": "A furious manager who's reached their absolute limit. Explosive, aggressive, zero patience left.",
         "default_voice": "en-US-EricNeural",  # Deep, stern male
-        "default_eleven_voice": "DGzg6RaUqxGRTHSBjfgF",
         "prewritten_shame": [
             "Put it down!",
             "Unbelievable!",
@@ -150,7 +157,9 @@ PERSONALITIES = {
         "name": "🎭 Sarcastic",
         "voice": "Dripping with dry wit. Mock enthusiasm, feigned interest. Pretends to take their phone use seriously.",
         "default_voice": "en-US-AvaMultilingualNeural",  # Female, dry wit
-        "default_eleven_voice": "50lF5fQMqcxbDQOW6qOs",
         "prewritten_shame": [
             "Oh, how vital.",
             "Riveting stuff, I'm sure.",
@@ -191,7 +200,9 @@ PERSONALITIES = {
         "name": "😔 Disappointed Parent",
         "voice": "A heartbroken parent. Not angry—just deeply let down. Maximum guilt. References their potential.",
         "default_voice": "en-US-AvaNeural",  # Soft female, empathetic
-        "default_eleven_voice": "roYauZ4bOLAKvVZTPLre",
         "prewritten_shame": [
             "I'm so disappointed...",
             "We talked about this.",
@@ -233,7 +244,9 @@ PERSONALITIES = {
         "name": "💪 Motivational Coach",
         "voice": "An intense drill-sergeant coach who believes in you but won't tolerate weakness. High energy, sports metaphors.",
         "default_voice": "en-US-GuyNeural",  # Energetic male
-        "default_eleven_voice": "84Fal4DSXWfp7nJ8emqQ",
         "prewritten_shame": [
             "Where's your discipline?!",
             "Champions don't quit!",
@@ -275,7 +288,9 @@ PERSONALITIES = {
         "name": "🤡 Absurdist",
         "voice": "Surreal, unexpected, playful. Personifies objects. Makes weird observations. Non sequiturs welcome.",
         "default_voice": "en-US-AriaNeural",  # Playful, expressive female
-        "default_eleven_voice": "G0yjIg3xY8gEJZkHpjVm",
         "prewritten_shame": [
             "Your thumb called. It's exhausted.",
             "Emergency cat video?",
@@ -316,7 +331,10 @@ PERSONALITIES = {
         "name": "🤖 Corporate AI",
         "voice": "An emotionless productivity monitoring system. Speaks like automated log output. Zero personality.",
         "default_voice": "en-US-MichelleNeural",  # Neutral, professional male
-        "default_eleven_voice": "weA4Q36twV5kwSaTEL0Q",
         "prewritten_shame": [
             "Distraction event detected.",
             "Alert: phone in hand.",
@@ -358,7 +376,9 @@ PERSONALITIES = {
         "name": "🎩 British Butler",
         "voice": "An impeccably polite but quietly judgmental butler. Passive-aggressive courtesy. Disappointment hidden behind manners.",
         "default_voice": "en-GB-RyanNeural",  # Polite British male
-        "default_eleven_voice": "lUTamkMw7gOzZbFIwmq4",  # James - Professional British Male
         "prewritten_shame": [
             "If I may say so, sir...",
             "The telephone. Again. Indeed.",

         "name": "🎵 Chaos Mode",
         "voice": "Unpredictable. Each response is a completely different personality.",
         "default_voice": "en-US-AnaNeural",  # Versatile female voice
+        "default_eleven_voices": [  # List of voice IDs to try in order (will use first available)
+            "H10ItvDnkRN5ysrvzT9J",  # My custom
+            "Nggzl2QAXh3OijoXD116",  # Candy - Young and Sweet
+            "cgSgspJ2msm6clMCkdW9",  # Jessica - Playful, Bright
+        ],
         "prewritten_shame": None,  # Will randomly select from other personalities
         "prewritten_praise": None,  # Will randomly select from other personalities
         "shame": None,  # Will randomly select from others
         "name": "😠 Angry Boss",
         "voice": "A furious manager who's reached their absolute limit. Explosive, aggressive, zero patience left.",
         "default_voice": "en-US-EricNeural",  # Deep, stern male
+        "default_eleven_voices": [
+            "TxWZERZ5Hc6h9dGxVmXa",  # Jerry B. - Gruff and Gritty Commander
+            "cjVigY5qzO86Huf0OWal",  # Eric - Smooth, Trustworthy
+        ],
         "prewritten_shame": [
             "Put it down!",
             "Unbelievable!",
         "name": "🎭 Sarcastic",
         "voice": "Dripping with dry wit. Mock enthusiasm, feigned interest. Pretends to take their phone use seriously.",
         "default_voice": "en-US-AvaMultilingualNeural",  # Female, dry wit
+        "default_eleven_voices": [
+            "FGY2WhTYpPnrIDTdsKH5",  # Laura - Enthusiast, Quirky Attitude
+        ],
         "prewritten_shame": [
             "Oh, how vital.",
             "Riveting stuff, I'm sure.",
         "name": "😔 Disappointed Parent",
         "voice": "A heartbroken parent. Not angry—just deeply let down. Maximum guilt. References their potential.",
         "default_voice": "en-US-AvaNeural",  # Soft female, empathetic
+        "default_eleven_voices": [
+            "Xb7hH8MSUJpSbSDYk0k2",  # Alice - Clear, Engaging
+        ],
         "prewritten_shame": [
             "I'm so disappointed...",
             "We talked about this.",
         "name": "💪 Motivational Coach",
         "voice": "An intense drill-sergeant coach who believes in you but won't tolerate weakness. High energy, sports metaphors.",
         "default_voice": "en-US-GuyNeural",  # Energetic male
+        "default_eleven_voices": [
+            "IKne3meq5aSn9XLyUdCD",  # Charlie - Deep, Confident, Energetic
+        ],
         "prewritten_shame": [
             "Where's your discipline?!",
             "Champions don't quit!",
         "name": "🤡 Absurdist",
         "voice": "Surreal, unexpected, playful. Personifies objects. Makes weird observations. Non sequiturs welcome.",
         "default_voice": "en-US-AriaNeural",  # Playful, expressive female
+        "default_eleven_voices": [
+            "cgSgspJ2msm6clMCkdW9",  # Jessica - Playful, Bright, Warm
+        ],
         "prewritten_shame": [
             "Your thumb called. It's exhausted.",
             "Emergency cat video?",
         "name": "🤖 Corporate AI",
         "voice": "An emotionless productivity monitoring system. Speaks like automated log output. Zero personality.",
         "default_voice": "en-US-MichelleNeural",  # Neutral, professional male
+        "default_eleven_voices": [
+            "weA4Q36twV5kwSaTEL0Q",  # Eva - Futuristic Robot Helper
+            "EXAVITQu4vr4xnSDxMaL",  # Sarah - Mature, Reassuring, Confident
+        ],
         "prewritten_shame": [
             "Distraction event detected.",
             "Alert: phone in hand.",
         "name": "🎩 British Butler",
         "voice": "An impeccably polite but quietly judgmental butler. Passive-aggressive courtesy. Disappointment hidden behind manners.",
         "default_voice": "en-GB-RyanNeural",  # Polite British male
+        "default_eleven_voices": [
+            "JBFqnCBsd6RMkjVDRZzb",  # George - Warm, Captivating Storyteller (British)
+        ],
         "prewritten_shame": [
             "If I may say so, sir...",
             "The telephone. Again. Indeed.",

judgy_reachy_no_phone/main.py CHANGED Viewed

@@ -372,11 +372,13 @@ class JudgyReachyNoPhone(ReachyMiniApp):
                 return {"button_text": button_text}
             else:
                 # Start or Continue monitoring
                 if req.groq_key:
                     logger.info(f"Initializing LLM with Groq API key: {req.groq_key[:10]}... personality: {req.personality}")
                     self.llm = LLMResponder(api_key=req.groq_key, personality=req.personality)
                 else:
-                    logger.info("No Groq API key provided, using pre-written lines")
                 # Initialize TTS - pass custom voices only if explicitly set (empty string means use personality default)
                 if req.eleven_key:
@@ -535,8 +537,11 @@ class JudgyReachyNoPhone(ReachyMiniApp):
         @self.settings_app.post("/api/test")
         def test_shame(req: ToggleRequest):
             # Apply settings from UI before testing (but don't start monitoring)
             if req.groq_key:
                 self.llm = LLMResponder(api_key=req.groq_key, personality=req.personality)
             # Pass voice overrides only if explicitly set (empty string means use personality default)
             if req.eleven_key:

                 return {"button_text": button_text}
             else:
                 # Start or Continue monitoring
+                # Always update LLM responder with personality (for prewritten lines even without API key)
                 if req.groq_key:
                     logger.info(f"Initializing LLM with Groq API key: {req.groq_key[:10]}... personality: {req.personality}")
                     self.llm = LLMResponder(api_key=req.groq_key, personality=req.personality)
                 else:
+                    logger.info(f"No Groq API key provided, using pre-written lines with personality: {req.personality}")
+                    self.llm = LLMResponder(api_key="", personality=req.personality)
                 # Initialize TTS - pass custom voices only if explicitly set (empty string means use personality default)
                 if req.eleven_key:
         @self.settings_app.post("/api/test")
         def test_shame(req: ToggleRequest):
             # Apply settings from UI before testing (but don't start monitoring)
+            # Always update LLM responder with personality (for prewritten lines even without API key)
             if req.groq_key:
                 self.llm = LLMResponder(api_key=req.groq_key, personality=req.personality)
+            else:
+                self.llm = LLMResponder(api_key="", personality=req.personality)
             # Pass voice overrides only if explicitly set (empty string means use personality default)
             if req.eleven_key:

judgy_reachy_no_phone/static/main.js CHANGED Viewed

@@ -65,8 +65,8 @@ async function updateUIForAPIKeys() {
     const cooldown = document.getElementById('cooldown').value;
     const praise = document.getElementById('praise-toggle').checked;
-    // If no Groq key, show notice but keep personalities enabled (they use pre-written lines)
-    if (!groqKey) {
         document.getElementById('mode-text').textContent = 'YOLO | Pre-written personality lines → Edge TTS';
         document.getElementById('api-notice').classList.remove('hidden');
         // Keep personalities enabled - they still have different voices and pre-written lines
@@ -77,7 +77,7 @@ async function updateUIForAPIKeys() {
         // Get voice override for selected personality
         const voiceOverride = voiceOverrides[selectedPersonality] || {};
-        // Validate keys with backend
         const response = await fetch('/api/validate-keys', {
             method: 'POST',
             headers: { 'Content-Type': 'application/json' },

     const cooldown = document.getElementById('cooldown').value;
     const praise = document.getElementById('praise-toggle').checked;
+    // If no API keys at all, show default message
+    if (!groqKey && !elevenKey) {
         document.getElementById('mode-text').textContent = 'YOLO | Pre-written personality lines → Edge TTS';
         document.getElementById('api-notice').classList.remove('hidden');
         // Keep personalities enabled - they still have different voices and pre-written lines
         // Get voice override for selected personality
         const voiceOverride = voiceOverrides[selectedPersonality] || {};
+        // Validate keys with backend (even if only one is provided)
         const response = await fetch('/api/validate-keys', {
             method: 'POST',
             headers: { 'Content-Type': 'application/json' },