Streaming working

2025-09-15 13:35:38 -07:00 · 2025-09-15 13:35:38 -07:00 · 7a06bfc102
commit 7a06bfc102
parent 3c7584eadb
4 changed files with 260 additions and 153 deletions
--- a/voicebot/ai_providers.py
+++ b/voicebot/ai_providers.py
@ -380,16 +380,32 @@ class LocalProvider(AIProvider):
                    "num_predict": self.config.max_tokens
                }
            }
-            
+            logger.info(f"LocalProvider generate payload: {payload}")
            try:
                async with session.post(
-                    f"{self.base_url}/api/chat",
+                    f"{self.base_url}/chat/completions",
                    json=payload,
                    timeout=aiohttp.ClientTimeout(total=self.config.timeout)
                ) as resp:
                    if resp.status == 200:
                        result = await resp.json()
-                        response_text = result["message"]["content"]
+                        
+                        # Handle OpenAI-compatible format
+                        if "choices" in result and len(result["choices"]) > 0:
+                            choice = result["choices"][0]
+                            if "message" in choice and "content" in choice["message"]:
+                                response_text = choice["message"]["content"]
+                            elif "text" in choice:
+                                # Some APIs use "text" instead of "message.content"
+                                response_text = choice["text"]
+                            else:
+                                raise Exception(f"Unexpected response format: {result}")
+                        # Fallback to original format for backward compatibility
+                        elif "message" in result and "content" in result["message"]:
+                            response_text = result["message"]["content"]
+                        else:
+                            raise Exception(f"Unexpected response format: {result}")
+                            
                        context.add_message(MessageRole.ASSISTANT, response_text)
                        return response_text
                    else:
@ -411,25 +427,51 @@ class LocalProvider(AIProvider):
                "messages": context.get_context_messages(),
                "stream": True
            }
-            
+            logger.info(f"LocalProvider stream payload: {self.base_url} {payload}")
+
            try:
                async with session.post(
-                    f"{self.base_url}/api/chat",
+                    f"{self.base_url}/chat/completions",
                    json=payload,
                    timeout=aiohttp.ClientTimeout(total=self.config.timeout)
                ) as resp:
                    if resp.status == 200:
                        full_response = ""
+                        import json
                        async for line in resp.content:
                            if line:
-                                import json
                                try:
-                                    data = json.loads(line.decode())
-                                    if "message" in data and "content" in data["message"]:
-                                        content = data["message"]["content"]
-                                        full_response += content
-                                        yield content
-                                except json.JSONDecodeError:
+                                    # Decode the line
+                                    line_str = line.decode('utf-8').strip()
+                                    
+                                    # Skip empty lines
+                                    if not line_str:
+                                        continue
+                                    
+                                    # Handle Server-Sent Events format
+                                    if line_str.startswith('data: '):
+                                        line_str = line_str[6:]  # Remove 'data: ' prefix
+                                    
+                                    # Skip end-of-stream marker
+                                    if line_str == '[DONE]':
+                                        break
+                                    
+                                    data = json.loads(line_str)
+                                    
+                                    # Handle OpenAI-compatible format
+                                    if "choices" in data and len(data["choices"]) > 0:
+                                        choice = data["choices"][0]
+                                        if "delta" in choice and "content" in choice["delta"]:
+                                            content = choice["delta"]["content"]
+                                            if content:  # Only yield non-empty content
+                                                full_response += content
+                                                yield content
+                                    
+                                except (UnicodeDecodeError, json.JSONDecodeError) as e:
+                                    logger.debug(f"Skipping invalid line: {line} (error: {e})")
+                                    continue
+                                except Exception as e:
+                                    logger.warning(f"Unexpected error processing line: {e}")
                                    continue
                        
                        context.add_message(MessageRole.ASSISTANT, full_response)
@ -437,7 +479,7 @@ class LocalProvider(AIProvider):
                        raise Exception(f"Local API returned status {resp.status}")
                        
            except Exception as e:
-                logger.error(f"Local provider streaming failed: {e}")
+                logger.error(f"Local provider streaming failed {self.base_url}: {e}")
                raise
    
    async def health_check(self) -> bool:
@ -479,8 +521,8 @@ class AIProviderManager:
            ),
            AIProviderType.LOCAL: AIProviderConfig(
                provider_type=AIProviderType.LOCAL,
-                base_url=os.getenv("LOCAL_MODEL_URL", "http://localhost:11434"),
-                model=os.getenv("LOCAL_MODEL_NAME", "llama2"),
+                base_url=os.getenv("OPENAI_BASE_URL", "http://localhost:11434"),
+                model=os.getenv("OPENAI_MODEL", "llama2"),
                max_tokens=int(os.getenv("LOCAL_MAX_TOKENS", "1000")),
                temperature=float(os.getenv("LOCAL_TEMPERATURE", "0.7"))
            )
--- a/voicebot/bots/init.py
+++ b/voicebot/bots/init.py
@ -2,6 +2,5 @@

 from . import synthetic_media
 from . import whisper
-from . import chatbot

-__all__ = ["synthetic_media", "whisper", "chatbot"]
+__all__ = ["synthetic_media", "whisper"]
--- a/voicebot/bots/ai_chatbot.py
+++ b/voicebot/bots/ai_chatbot.py
@ -10,7 +10,8 @@ This bot demonstrates the advanced capabilities including:
 import os
 import time
 import uuid
-from typing import Dict, Optional, Callable, Awaitable, Any, Union
+import secrets
+from typing import Dict, Optional, Callable, Awaitable, Any, Union, AsyncGenerator
 from aiortc import MediaStreamTrack

 # Import system modules
@ -85,6 +86,15 @@ class EnhancedAIChatbot:
        self.conversation_context = None
        self.initialized = False
        
+        # Instance configuration variables
+        self.bot_personality = BOT_PERSONALITY
+        self.bot_ai_provider = BOT_AI_PROVIDER
+        self.bot_streaming = BOT_STREAMING
+        self.bot_memory_enabled = BOT_MEMORY_ENABLED
+        
+        # Per-lobby configurations
+        self.lobby_configs: Dict[str, Dict[str, Any]] = {}
+        
        # Initialize advanced features if available
        if AI_PROVIDERS_AVAILABLE:
            self._initialize_ai_features()
@ -95,18 +105,18 @@ class EnhancedAIChatbot:
        """Initialize AI provider, personality, and context management."""
        try:
            # Initialize personality
-            self.personality = personality_manager.create_personality_from_template(BOT_PERSONALITY)
+            self.personality = personality_manager.create_personality_from_template(self.bot_personality)
            if not self.personality:
-                logger.warning(f"Personality template '{BOT_PERSONALITY}' not found, using default")
+                logger.warning(f"Personality template '{self.bot_personality}' not found, using default")
                self.personality = personality_manager.create_personality_from_template("helpful_assistant")
            
            # Initialize AI provider
-            provider_type = AIProviderType(BOT_AI_PROVIDER)
+            provider_type = AIProviderType(self.bot_ai_provider)
            self.ai_provider = ai_provider_manager.create_provider(provider_type)
            ai_provider_manager.register_provider(f"{AGENT_NAME}_{self.session_id}", self.ai_provider)
            
            # Initialize conversation context if memory is enabled
-            if BOT_MEMORY_ENABLED:
+            if self.bot_memory_enabled:
                self.conversation_context = context_manager.get_or_create_context(
                    session_id=self.session_id,
                    bot_name=AGENT_NAME,
@ -114,7 +124,7 @@ class EnhancedAIChatbot:
                )
            
            self.initialized = True
-            logger.info(f"Enhanced AI chatbot initialized: provider={BOT_AI_PROVIDER}, personality={BOT_PERSONALITY}, memory={BOT_MEMORY_ENABLED}")
+            logger.info(f"Enhanced AI chatbot initialized: provider={self.bot_ai_provider}, personality={self.bot_personality}, memory={self.bot_memory_enabled}")
            
        except Exception as e:
            logger.error(f"Failed to initialize AI features: {e}")
@ -153,7 +163,7 @@ class EnhancedAIChatbot:
                    ai_context.add_message(MessageRole.SYSTEM, self.personality.generate_system_prompt())
            
            # Generate response
-            if BOT_STREAMING:
+            if self.bot_streaming:
                # For streaming, collect the full response
                response_parts = []
                async for chunk in self.ai_provider.stream_response(ai_context, message):
@ -168,8 +178,8 @@ class EnhancedAIChatbot:
                    conversation_id=self.conversation_context.conversation_id,
                    user_message=message,
                    bot_response=response,
-                    context_used={"ai_provider": BOT_AI_PROVIDER, "personality": BOT_PERSONALITY},
-                    metadata={"timestamp": time.time(), "streaming": BOT_STREAMING}
+                    context_used={"ai_provider": self.bot_ai_provider, "personality": self.bot_personality},
+                    metadata={"timestamp": time.time(), "streaming": self.bot_streaming}
                )
            
            return response
@ -226,6 +236,63 @@ class EnhancedAIChatbot:
            health["context_summary"] = self.conversation_context.get_conversation_summary()
        
        return health
+    
+    async def generate_streaming_response(self, message: str) -> AsyncGenerator[str, None]:
+        """Generate a streaming response, yielding partial responses as chunks arrive."""
+        if not self.initialized or not self.ai_provider:
+            yield self._get_fallback_response(message)
+            return
+        
+        try:
+            # Prepare conversation context (same as generate_response)
+            if self.conversation_context:
+                # Create a new AI conversation context with personality
+                ai_context = ConversationContext(
+                    session_id=self.session_id,
+                    bot_name=AGENT_NAME,
+                    personality_prompt=self.personality.generate_system_prompt() if self.personality else None
+                )
+                
+                # Add personality system message
+                if self.personality:
+                    ai_context.add_message(MessageRole.SYSTEM, self.personality.generate_system_prompt())
+                
+                # Add conversation history context
+                context_summary = context_manager.get_context_for_response(self.conversation_context.conversation_id)
+                if context_summary:
+                    ai_context.add_message(MessageRole.SYSTEM, f"Conversation context: {context_summary}")
+            else:
+                # Simple context without memory
+                ai_context = ConversationContext(
+                    session_id=self.session_id,
+                    bot_name=AGENT_NAME
+                )
+                if self.personality:
+                    ai_context.add_message(MessageRole.SYSTEM, self.personality.generate_system_prompt())
+            
+            # Stream the response
+            accumulated_response = ""
+            chunk_count = 0
+            async for chunk in self.ai_provider.stream_response(ai_context, message):
+                accumulated_response += chunk
+                chunk_count += 1
+                logger.info(f"AI provider yielded chunk {chunk_count}: '{chunk}' (accumulated: {len(accumulated_response)} chars)")
+                yield accumulated_response
+            
+            # Store conversation turn in context manager after streaming is complete
+            if self.conversation_context:
+                context_manager.add_conversation_turn(
+                    conversation_id=self.conversation_context.conversation_id,
+                    user_message=message,
+                    bot_response=accumulated_response,
+                    context_used={"ai_provider": self.bot_ai_provider, "personality": self.bot_personality},
+                    metadata={"timestamp": time.time(), "streaming": True}
+                )
+            
+        except Exception as e:
+            logger.error(f"AI streaming response generation failed: {e}")
+            yield self._get_fallback_response(message, error=True)
+    


 # Global bot instance
@ -268,15 +335,21 @@ async def handle_chat_message(
            _bot_instance = EnhancedAIChatbot(chat_message.sender_name)
            logger.info(f"Initialized enhanced AI chatbot for session: {chat_message.sender_name}")
        
-        # Generate response
-        response = await _bot_instance.generate_response(chat_message.message)
-        
-        # Send response
-        if response:
-            await send_message_func(response)
-            logger.info(f"AI Chatbot responded to {chat_message.sender_name}: {response[:100]}...")
-        
-        return response
+        if _bot_instance.bot_streaming:
+            # Handle streaming response
+            logger.info(f"Using streaming response path, bot_streaming={_bot_instance.bot_streaming}")
+            return await _handle_streaming_response(chat_message, send_message_func)
+        else:
+            # Generate non-streaming response
+            logger.info(f"Using non-streaming response path, bot_streaming={_bot_instance.bot_streaming}")
+            response = await _bot_instance.generate_response(chat_message.message)
+            
+            # Send response
+            if response:
+                await send_message_func(response)
+                logger.info(f"AI Chatbot responded to {chat_message.sender_name}: {response[:100]}...")
+            
+            return response
        
    except Exception as e:
        logger.error(f"Error in AI chatbot: {e}")
@ -285,6 +358,94 @@ async def handle_chat_message(
        return error_response


+async def _handle_streaming_response(
+    chat_message: ChatMessageModel,
+    send_message_func: Callable[[Union[str, ChatMessageModel]], Awaitable[None]]
+) -> Optional[str]:
+    """Handle streaming response by sending updates as chunks arrive."""
+    global _bot_instance
+    
+    logger.info("Starting _handle_streaming_response")
+    message_id = None
+    try:
+        # Generate a unique message ID for this streaming response
+        message_id = secrets.token_hex(8)
+        
+        # Get the client's session_id from the bound method
+        client = getattr(send_message_func, '__self__', None)
+        client_session_id = client.session_id if client else chat_message.sender_session_id
+        
+        # Send initial empty message to establish the message in the chat
+        initial_message = ChatMessageModel(
+            id=str(message_id),
+            message="",
+            sender_name=_bot_instance.session_name if _bot_instance else "AI Chatbot",
+            sender_session_id=client_session_id,
+            timestamp=time.time(),
+            lobby_id=chat_message.lobby_id,
+        )
+        await send_message_func(initial_message)
+        logger.info(f"Started streaming response with message ID: {message_id}")
+        
+        # Check if bot instance exists
+        if not _bot_instance:
+            error_msg = "Bot instance not available for streaming"
+            update_message = ChatMessageModel(
+                id=str(message_id),
+                message=error_msg,
+                sender_name="AI Chatbot",
+                sender_session_id=client_session_id,
+                timestamp=time.time(),
+                lobby_id=chat_message.lobby_id,
+            )
+            await send_message_func(update_message)
+            return error_msg
+        
+        # Stream the response
+        final_response = ""
+        chunk_count = 0
+        async for partial_response in _bot_instance.generate_streaming_response(chat_message.message):
+            final_response = partial_response
+            chunk_count += 1
+            logger.info(f"Sending streaming chunk {chunk_count}: {partial_response[:50]}...")
+            
+            update_message = ChatMessageModel(
+                id=str(message_id),
+                message=partial_response,
+                sender_name=_bot_instance.session_name,
+                sender_session_id=client_session_id,
+                timestamp=time.time(),
+                lobby_id=chat_message.lobby_id,
+            )
+            await send_message_func(update_message)
+        
+        logger.info(f"Completed streaming response to {chat_message.sender_name}: {final_response[:100]}...")
+        return final_response
+        
+    except Exception as e:
+        logger.error(f"Error in streaming response: {e}")
+        error_response = "I apologize, but I encountered an error. Please try again."
+        
+        # Try to update the existing message with the error, or send a new one
+        try:
+            client = getattr(send_message_func, '__self__', None)
+            client_session_id = client.session_id if client else chat_message.sender_session_id
+            error_message = ChatMessageModel(
+                id=str(message_id),
+                message=error_response,
+                sender_name=_bot_instance.session_name if _bot_instance else "AI Chatbot",
+                sender_session_id=client_session_id,
+                timestamp=time.time(),
+                lobby_id=chat_message.lobby_id,
+            )
+            await send_message_func(error_message)
+        except (NameError, TypeError, AttributeError):
+            # If message_id is not defined or other issues, send as string
+            await send_message_func(error_response)
+        
+        return error_response
+
+
 async def get_bot_status() -> Dict[str, Any]:
    """Get detailed bot status and health information."""
    global _bot_instance
@ -323,17 +484,17 @@ async def get_bot_status() -> Dict[str, Any]:


 # Additional helper functions for advanced features
-async def switch_personality(personality_id: str) -> bool:
+async def switch_personality(bot_instance: EnhancedAIChatbot, personality_id: str) -> bool:
    """Switch bot personality at runtime."""
-    global _bot_instance
    
-    if not AI_PROVIDERS_AVAILABLE or not _bot_instance:
+    if not AI_PROVIDERS_AVAILABLE or not bot_instance:
        return False
    
    try:
        new_personality = personality_manager.create_personality_from_template(personality_id)
        if new_personality:
-            _bot_instance.personality = new_personality
+            bot_instance.personality = new_personality
+            bot_instance.bot_personality = personality_id
            logger.info(f"Switched to personality: {personality_id}")
            return True
    except Exception as e:
@ -342,9 +503,8 @@ async def switch_personality(personality_id: str) -> bool:
    return False


-async def switch_ai_provider(provider_type: str) -> bool:
+async def switch_ai_provider(bot_instance: EnhancedAIChatbot, provider_type: str) -> bool:
    """Switch AI provider at runtime."""
-    global _bot_instance, BOT_AI_PROVIDER
    
    logger.info(f"Switching AI provider to: {provider_type}")
    
@ -353,17 +513,13 @@ async def switch_ai_provider(provider_type: str) -> bool:
        return False
    
    try:
-        # Always update the global default first
-        old_provider = BOT_AI_PROVIDER
-        BOT_AI_PROVIDER = provider_type
-        logger.info(f"Updated global BOT_AI_PROVIDER from {old_provider} to {provider_type}")
-        
        # If instance exists, switch its provider
-        if _bot_instance:
+        if bot_instance:
            logger.info("Switching existing bot instance provider")
            provider_enum = AIProviderType(provider_type)
            new_provider = ai_provider_manager.create_provider(provider_enum)
-            _bot_instance.ai_provider = new_provider
+            bot_instance.ai_provider = new_provider
+            bot_instance.bot_ai_provider = provider_type
            logger.info(f"Switched existing instance to AI provider: {provider_type}")
        else:
            logger.info("No existing bot instance to switch")
@ -371,8 +527,6 @@ async def switch_ai_provider(provider_type: str) -> bool:
        return True
    except Exception as e:
        logger.error(f"Failed to switch AI provider to {provider_type}: {e}")
-        # Revert the global change on failure
-        BOT_AI_PROVIDER = old_provider
        return False


@ -481,17 +635,21 @@ async def handle_config_update(lobby_id: str, config_values: Dict[str, Any]) ->
    try:
        logger.info(f"Updating config for lobby {lobby_id}: {config_values}")
        
+        # Get the bot instance (create if doesn't exist)
+        if _bot_instance is None:
+            _bot_instance = EnhancedAIChatbot("AI Chatbot")
+        
        # Apply configuration changes
        config_applied = False
        
        if "personality" in config_values:
-            success = await switch_personality(config_values["personality"])
+            success = await switch_personality(_bot_instance, config_values["personality"])
            if success:
                config_applied = True
                logger.info(f"Applied personality: {config_values['personality']}")
        
        if "ai_provider" in config_values:
-            success = await switch_ai_provider(config_values["ai_provider"])
+            success = await switch_ai_provider(_bot_instance, config_values["ai_provider"])
            if success:
                config_applied = True
                logger.info(f"Applied AI provider: {config_values['ai_provider']}")
@ -499,24 +657,21 @@ async def handle_config_update(lobby_id: str, config_values: Dict[str, Any]) ->
                logger.warning(f"Failed to apply AI provider: {config_values['ai_provider']}")
        
        if "streaming" in config_values:
-            global BOT_STREAMING
-            BOT_STREAMING = bool(config_values["streaming"])
+            _bot_instance.bot_streaming = bool(config_values["streaming"])
            config_applied = True
-            logger.info(f"Applied streaming: {BOT_STREAMING}")
+            logger.info(f"Applied streaming: {_bot_instance.bot_streaming}")
        
        if "memory_enabled" in config_values:
-            global BOT_MEMORY_ENABLED
-            BOT_MEMORY_ENABLED = bool(config_values["memory_enabled"])
+            _bot_instance.bot_memory_enabled = bool(config_values["memory_enabled"])
            config_applied = True
-            logger.info(f"Applied memory: {BOT_MEMORY_ENABLED}")
+            logger.info(f"Applied memory: {_bot_instance.bot_memory_enabled}")
        
        # Store other configuration values for use in response generation
-        if _bot_instance:
-            if not hasattr(_bot_instance, 'lobby_configs'):
-                _bot_instance.lobby_configs = {}
-            
-            _bot_instance.lobby_configs[lobby_id] = config_values
-            config_applied = True
+        if not hasattr(_bot_instance, 'lobby_configs'):
+            _bot_instance.lobby_configs = {}
+        
+        _bot_instance.lobby_configs[lobby_id] = config_values
+        config_applied = True
        
        return config_applied
        
--- a/voicebot/bots/chatbot.py
+++ b/voicebot/bots/chatbot.py
@ -1,89 +0,0 @@
-"""Simple chatbot agent that demonstrates chat message handling.
-
-This bot shows how to create an agent that primarily uses chat functionality
-rather than media streams.
-"""
-
-from typing import Dict, Optional, Callable, Awaitable, Union
-import time
-import random
-from shared.logger import logger
-from aiortc import MediaStreamTrack
-
-# Import shared models for chat functionality
-import sys
-import os
-sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))
-from shared.models import ChatMessageModel
-
-
-AGENT_NAME = "chatbot"
-AGENT_DESCRIPTION = "Simple chatbot that responds to chat messages"
-
-# Simple response database
-RESPONSES = {
-    "hello": ["Hello!", "Hi there!", "Hey!", "Greetings!"],
-    "how are you": ["I'm doing well, thank you!", "Great, thanks for asking!", "I'm fine!"],
-    "goodbye": ["Goodbye!", "See you later!", "Bye!", "Take care!"],
-    "help": ["I can respond to simple greetings and questions. Try saying hello, asking how I am, or say goodbye!"],
-    "time": ["Let me check... it's currently {time}"],
-    "joke": [
-        "Why don't scientists trust atoms? Because they make up everything!",
-        "I told my wife she was drawing her eyebrows too high. She seemed surprised.",
-        "What do you call a fish wearing a crown? A king fish!",
-        "Why don't eggs tell jokes? They'd crack each other up!"
-    ]
-}
-
-
-def agent_info() -> Dict[str, str]:
-    return {"name": AGENT_NAME, "description": AGENT_DESCRIPTION, "has_media": "false"}
-
-
-def create_agent_tracks(session_name: str) -> dict[str, MediaStreamTrack]:
-    """Chatbot doesn't provide media tracks - it's chat-only."""
-    return {}
-
-
-async def handle_chat_message(chat_message: ChatMessageModel, send_message_func: Callable[[Union[str, ChatMessageModel]], Awaitable[None]]) -> Optional[str]:
-    """Handle incoming chat messages and provide responses.
-    
-    Args:
-        chat_message: The received chat message
-        send_message_func: Function to send messages back to the lobby
-    
-    Returns:
-        Optional response message to send back to the lobby
-    """
-    message_lower = chat_message.message.lower().strip()
-    sender = chat_message.sender_name
-    
-    logger.info(f"Chatbot received message from {sender}: {chat_message.message}")
-    
-    # Skip messages from ourselves
-    if sender.lower() == AGENT_NAME.lower():
-        return None
-    
-    # Look for keywords in the message
-    for keyword, responses in RESPONSES.items():
-        if keyword in message_lower:
-            response = random.choice(responses)
-            # Handle special formatting
-            if "{time}" in response:
-                current_time = time.strftime("%Y-%m-%d %H:%M:%S")
-                response = response.format(time=current_time)
-            
-            logger.info(f"Chatbot responding with: {response}")
-            return response
-    
-    # If we get a direct mention or question, provide a generic response
-    if any(word in message_lower for word in ["bot", "chatbot", "?"]):
-        responses = [
-            f"Hi {sender}! I'm a simple chatbot. Say 'help' to see what I can do!",
-            f"Hello {sender}! I heard you mention me. How can I help?",
-            "I'm here and listening! Try asking me about the time or tell me a greeting!"
-        ]
-        return random.choice(responses)
-    
-    # Default: don't respond to unrecognized messages
-    return None