Spaces:

MCP-1st-Birthday
/

vibe-reader

Running

App Files Files Community

carolinacc commited on 11 days ago

Commit

96ce57f

verified ·

1 Parent(s): b777cd2

Update app.py

Browse files

Files changed (1) hide show

app.py +301 -301

app.py CHANGED Viewed

@@ -1,302 +1,302 @@
-import gradio as gr
-from typing import List, Optional, Tuple, Dict, Any
-import uuid
-import os
-import sys
-import traceback
-from agent import run_agent
-# ============================================================================
-# CONSTANTS
-# ============================================================================
-# Example images hosted online (replace with your own URLs)
-EXAMPLE_IMAGE_URLS = [
-    "https://64.media.tumblr.com/456e9e6d8f42e677581f7d7994554600/03546756eb18cebb-2e/s400x600/7cd50d0a76327cf08cc75d17e540a11212b56a3b.jpg",
-    "https://64.media.tumblr.com/97e808fda7863d31729da77de9f03285/03546756eb18cebb-2b/s400x600/7fc1a84a8d3f5922ca1f24fd6cc453d45ba88f7f.jpg",
-    "https://64.media.tumblr.com/380d1592fa32f1e2290531879cfdd329/03546756eb18cebb-61/s400x600/e9d78c4467fa3a8dc6223667e236b922bb943775.jpg",
-]
-# ============================================================================
-# UI HELPER FUNCTIONS
-# ============================================================================
-def get_session_id():
-    """Generate a unique session ID for the user"""
-    return str(uuid.uuid4())
-def format_books_html(books: List[dict]) -> str:
-    """Format final books as HTML for display in a 3-column layout with larger covers"""
-    html = "<div style='width: 100%;'>"
-    html += "<h2 style='color: #667eea; margin-bottom: 20px;'>📚 Your Personalized Recommendations</h2>"
-    html += "<div style='display: grid; grid-template-columns: repeat(3, 1fr); gap: 20px; align-items: start;'>"
-    for i, book in enumerate(books, 1):
-        desc = book.get("description", "")
-        html += f"""
-        <div style='padding: 16px; background: white;
-                    border-radius: 12px; border-left: 4px solid #667eea; box-shadow: 0 2px 8px rgba(0,0,0,0.08);'>
-            <div style='display: flex; gap: 16px; align-items: flex-start;'>
-                <img src='{book.get("cover_url", "")}'
-                     style='width: 120px; min-width: 120px; height: 180px; object-fit: cover; border-radius: 8px; box-shadow: 0 4px 12px rgba(0,0,0,0.15);'
-                     onerror='this.style.display="none"' />
-                <div style='flex: 1; min-width: 0;'>
-                    <h3 style='margin: 0 0 8px 0; color: #667eea; font-size: 1.1em; line-height: 1.3;'>{i}. {book["title"]}</h3>
-                    <p style='margin: 0; color: #666; font-style: italic; font-size: 0.9em;'>by {book["author"]}</p>
-                </div>
-            </div>
-            <p style='margin: 16px 0 0 0; color: #555; line-height: 1.6; font-size: 0.9em;'>{desc}</p>
-        </div>
-        """
-    html += "</div></div>"
-    return html
-def load_example_images():
-    """Load example images from URLs"""
-    return EXAMPLE_IMAGE_URLS
-# REMOVED: messages_to_chatbot_format - using agent's List[Dict] directly
-# ============================================================================
-# EVENT HANDLERS
-# ============================================================================
-def process_upload(images: List, session_id: str, progress=gr.Progress()):
-    """Handle image upload and start the agent workflow"""
-    if not images:
-        # Return empty list for the Chatbot component
-        yield [], "Please upload images.", "", None, gr.update(visible=True), ""
-        return
-    # Process image paths
-    image_paths = []
-    for img in images:
-        if hasattr(img, 'name'): image_paths.append(img.name)
-        # Added safety checks for common Gradio formats
-        elif isinstance(img, dict) and 'path' in img: image_paths.append(img['path'])
-        elif isinstance(img, str) and img.startswith('http'): image_paths.append(img)  # URLs
-        elif isinstance(img, str) and os.path.isfile(img): image_paths.append(img)
-        elif isinstance(img, tuple): image_paths.append(img[0])
-    if not image_paths:
-        yield [], "Error processing images.", "", None, gr.update(visible=True), ""
-        return
-    try:
-        # Show loading status
-        yield [], "", "", None, gr.update(visible=False), "🎨 Analyzing your vibe images..."
-        # Run agent with session_id acting as the thread_id
-        result = run_agent(images=image_paths, thread_id=session_id)
-        # CRUCIAL FIX: Use the agent's List[Dict] messages directly
-        chat_history = result["messages"]
-        reasoning = "\n".join(result.get("reasoning", []))
-        # Outputs: [chatbot, reasoning, recommendations, soundtrack, start_btn, status]
-        yield chat_history, reasoning, "", None, gr.update(visible=False), "✨ Vibe analysis complete!"
-    except Exception as e:
-        yield [], f"Error: {e}\n{traceback.format_exc()}", "", None, gr.update(visible=True), "❌ Error occurred"
-def add_user_message(user_message: str, history: List[Dict[str, str]]):
-    """
-    Step 1 of Chat: Add user message to history in the new Chatbot format.
-    """
-    if not user_message.strip():
-        return history, ""
-    # Append the new message in the List[Dict] format
-    new_message = {"role": "user", "content": user_message}
-    return history + [new_message], ""
-def generate_bot_response(history: List[Dict[str, str]], session_id: str):
-    """
-    Step 2 of Chat: Call agent and update history with response.
-    Uses yield to show loading status.
-    """
-    print(f"[DEBUG] generate_bot_response called with session_id={session_id}")
-    print(f"[DEBUG] history has {len(history) if history else 0} messages")
-    # Get the last user message from the List[Dict] history
-    if not history or history[-1]["role"] != "user":
-        # Should not happen in normal flow, but safety check
-        print("[DEBUG] No user message found in history")
-        yield history, "No message to process", "", None, ""
-        return
-    # The user message is already in history, we only need the content to resume the agent
-    user_content = history[-1]["content"]
-    # Gradio 6 may return content as a list of dicts with 'text' key
-    if isinstance(user_content, list):
-        user_message = " ".join(item.get("text", str(item)) for item in user_content if isinstance(item, dict))
-    else:
-        user_message = str(user_content)
-    print(f"[DEBUG] Resuming agent with user_message: {user_message[:50]}...")
-    try:
-        # Show loading status
-        yield history, "", "", None, "🔄 Processing your response..."
-        # Resume agent execution using the session_id
-        result = run_agent(images=[], user_message=user_message, thread_id=session_id)
-        print(f"[DEBUG] run_agent returned: {type(result)}")
-        if result:
-            print(f"[DEBUG] result keys: {result.keys() if isinstance(result, dict) else 'N/A'}")
-        if result is None:
-            print("[DEBUG] result is None - agent may not have resumed properly")
-            history.append({"role": "assistant", "content": "Error: Agent did not return a response."})
-            yield history, "Agent returned None", "", None, "❌ Agent error"
-            return
-        # CRUCIAL FIX: The agent returns the full updated history in the List[Dict] format
-        updated_history = result["messages"]
-        reasoning = "\n".join(result.get("reasoning", []))
-        print(f"[DEBUG] updated_history has {len(updated_history)} messages")
-        # Check for final results
-        books_html = ""
-        if result.get("final_books"):
-            books_html = format_books_html(result["final_books"])
-        soundtrack = result.get("soundtrack_url", "") or None
-        # Determine status based on what happened
-        if result.get("final_books"):
-            status = "✅ Recommendations ready!"
-        elif "retrieved_books" in result and result["retrieved_books"]:
-            status = "📚 Books retrieved, refining..."
-        else:
-            status = "💭 Awaiting your input..."
-        # Outputs: [chatbot, reasoning, recommendations, soundtrack, status]
-        yield updated_history, reasoning, books_html, soundtrack, status
-    except Exception as e:
-        # Append error to chat by updating the last user message's response
-        error_msg = f"Agent Error: {str(e)}"
-        print(f"[DEBUG] Exception in generate_bot_response: {e}")
-        traceback.print_exc()
-        # Append assistant error message
-        history.append({"role": "assistant", "content": error_msg})
-        yield history, f"Error trace: {traceback.format_exc()}", "", None, "❌ Error occurred"
-def reset_app():
-    """Reset the session"""
-    new_id = get_session_id()
-    # Returns: [session_id, chatbot, reasoning, books, soundtrack, input, images, start_btn, status]
-    return new_id, [], "", "", None, "", None, gr.update(visible=True), "Ready to analyze your vibe!"
-# ============================================================================
-# LAYOUT
-# ============================================================================
-with gr.Blocks() as demo:
-    # State management for multi-user support
-    session_id = gr.State(get_session_id())
-    gr.Markdown("# 📚 The Vibe Reader", elem_id='main-title')
-    gr.Markdown("""
-**How it works:**
-- 🎨 **Vision AI** extracts mood, themes, and aesthetic keywords from your images
-- 📚 **Semantic search** queries a vector DB of 50k+ book recs from r/BooksThatFeelLikeThis
-- 💬 **Conversational refinement** asks targeted questions to narrow down preferences
-- 📖 **Google Books MCP** enriches results with covers, descriptions, and metadata
-- 🎵 **ElevenLabs AI** generates a custom soundtrack that matches your reading vibe
-""", elem_id='subtitle')
-    with gr.Row():
-        # Left: Inputs
-        with gr.Column(scale=1):
-            gr.Markdown("### 1. Upload Your Vibe")
-            image_input = gr.Gallery(label="Visual Inspiration", columns=3, height="300px")
-            load_examples_btn = gr.Button("📷 Load Example Images (Credits: @thegorgonist)", variant="secondary", size="md")
-            start_btn = gr.Button("🔮 Analyze Vibe", variant="primary", size="lg")
-            status_display = gr.Textbox(label="Status", value="Ready to analyze your vibe!", interactive=False, elem_id="status-display")
-            reset_btn = gr.Button("🔄 Start Over", variant="secondary")
-        # Right: Chat
-        with gr.Column(scale=1):
-            gr.Markdown("### 2. Refine & Discover")
-            # Chatbot now uses the new List[Dict] format
-            chatbot = gr.Chatbot(height=500, label="Agent Conversation")
-            with gr.Row():
-                msg_input = gr.Textbox(
-                    show_label=False,
-                    placeholder="Type your response here...",
-                    scale=4,
-                    container=False
-                )
-                submit_btn = gr.Button("Send", variant="primary", scale=1)
-    # Outputs - Recommendations first, then reasoning
-    recommendations_output = gr.HTML(label="Recommendations")
-    soundtrack_player = gr.Audio(label="Vibe Soundtrack", type="filepath", interactive=False)
-    with gr.Accordion("🔍 Internal Reasoning", open=True):
-        reasoning_display = gr.Textbox(label="Agent Thoughts", lines=10, interactive=False)
-    # ============================================================================
-    # INTERACTION LOGIC
-    # ============================================================================
-    # 0. Load Example Images
-    load_examples_btn.click(
-        fn=load_example_images,
-        inputs=[],
-        outputs=[image_input]
-    )
-    # 1. Start Analysis
-    start_btn.click(
-        fn=process_upload,
-        inputs=[image_input, session_id],
-        outputs=[chatbot, reasoning_display, recommendations_output, soundtrack_player, start_btn, status_display]
-    )
-    # 2. Chat Interaction (User enters text -> History updates -> Bot responds)
-    # User adds message to history optimistically and clears input
-    user_event = msg_input.submit(
-        fn=add_user_message,
-        inputs=[msg_input, chatbot],
-        outputs=[chatbot, msg_input],
-        queue=False
-    )
-    # Bot generates response and updates the full history
-    user_event.then(
-        fn=generate_bot_response,
-        inputs=[chatbot, session_id],
-        outputs=[chatbot, reasoning_display, recommendations_output, soundtrack_player, status_display]
-    )
-    submit_btn.click(
-        fn=add_user_message,
-        inputs=[msg_input, chatbot],
-        outputs=[chatbot, msg_input],
-        queue=False
-    ).then(
-        fn=generate_bot_response,
-        inputs=[chatbot, session_id],
-        outputs=[chatbot, reasoning_display, recommendations_output, soundtrack_player, status_display]
-    )
-    # 3. Reset
-    reset_btn.click(
-        fn=reset_app,
-        inputs=[],
-        outputs=[session_id, chatbot, reasoning_display, recommendations_output, soundtrack_player, msg_input, image_input, start_btn, status_display]
-    )
-if __name__ == "__main__":
     demo.queue().launch(theme=gr.themes.Monochrome(), css_paths='app/custom.css')

+import gradio as gr
+from typing import List, Optional, Tuple, Dict, Any
+import uuid
+import os
+import sys
+import traceback
+from app.agent import run_agent
+# ============================================================================
+# CONSTANTS
+# ============================================================================
+# Example images hosted online (replace with your own URLs)
+EXAMPLE_IMAGE_URLS = [
+    "https://64.media.tumblr.com/456e9e6d8f42e677581f7d7994554600/03546756eb18cebb-2e/s400x600/7cd50d0a76327cf08cc75d17e540a11212b56a3b.jpg",
+    "https://64.media.tumblr.com/97e808fda7863d31729da77de9f03285/03546756eb18cebb-2b/s400x600/7fc1a84a8d3f5922ca1f24fd6cc453d45ba88f7f.jpg",
+    "https://64.media.tumblr.com/380d1592fa32f1e2290531879cfdd329/03546756eb18cebb-61/s400x600/e9d78c4467fa3a8dc6223667e236b922bb943775.jpg",
+]
+# ============================================================================
+# UI HELPER FUNCTIONS
+# ============================================================================
+def get_session_id():
+    """Generate a unique session ID for the user"""
+    return str(uuid.uuid4())
+def format_books_html(books: List[dict]) -> str:
+    """Format final books as HTML for display in a 3-column layout with larger covers"""
+    html = "<div style='width: 100%;'>"
+    html += "<h2 style='color: #667eea; margin-bottom: 20px;'>📚 Your Personalized Recommendations</h2>"
+    html += "<div style='display: grid; grid-template-columns: repeat(3, 1fr); gap: 20px; align-items: start;'>"
+    for i, book in enumerate(books, 1):
+        desc = book.get("description", "")
+        html += f"""
+        <div style='padding: 16px; background: white;
+                    border-radius: 12px; border-left: 4px solid #667eea; box-shadow: 0 2px 8px rgba(0,0,0,0.08);'>
+            <div style='display: flex; gap: 16px; align-items: flex-start;'>
+                <img src='{book.get("cover_url", "")}'
+                     style='width: 120px; min-width: 120px; height: 180px; object-fit: cover; border-radius: 8px; box-shadow: 0 4px 12px rgba(0,0,0,0.15);'
+                     onerror='this.style.display="none"' />
+                <div style='flex: 1; min-width: 0;'>
+                    <h3 style='margin: 0 0 8px 0; color: #667eea; font-size: 1.1em; line-height: 1.3;'>{i}. {book["title"]}</h3>
+                    <p style='margin: 0; color: #666; font-style: italic; font-size: 0.9em;'>by {book["author"]}</p>
+                </div>
+            </div>
+            <p style='margin: 16px 0 0 0; color: #555; line-height: 1.6; font-size: 0.9em;'>{desc}</p>
+        </div>
+        """
+    html += "</div></div>"
+    return html
+def load_example_images():
+    """Load example images from URLs"""
+    return EXAMPLE_IMAGE_URLS
+# REMOVED: messages_to_chatbot_format - using agent's List[Dict] directly
+# ============================================================================
+# EVENT HANDLERS
+# ============================================================================
+def process_upload(images: List, session_id: str, progress=gr.Progress()):
+    """Handle image upload and start the agent workflow"""
+    if not images:
+        # Return empty list for the Chatbot component
+        yield [], "Please upload images.", "", None, gr.update(visible=True), ""
+        return
+    # Process image paths
+    image_paths = []
+    for img in images:
+        if hasattr(img, 'name'): image_paths.append(img.name)
+        # Added safety checks for common Gradio formats
+        elif isinstance(img, dict) and 'path' in img: image_paths.append(img['path'])
+        elif isinstance(img, str) and img.startswith('http'): image_paths.append(img)  # URLs
+        elif isinstance(img, str) and os.path.isfile(img): image_paths.append(img)
+        elif isinstance(img, tuple): image_paths.append(img[0])
+    if not image_paths:
+        yield [], "Error processing images.", "", None, gr.update(visible=True), ""
+        return
+    try:
+        # Show loading status
+        yield [], "", "", None, gr.update(visible=False), "🎨 Analyzing your vibe images..."
+        # Run agent with session_id acting as the thread_id
+        result = run_agent(images=image_paths, thread_id=session_id)
+        # CRUCIAL FIX: Use the agent's List[Dict] messages directly
+        chat_history = result["messages"]
+        reasoning = "\n".join(result.get("reasoning", []))
+        # Outputs: [chatbot, reasoning, recommendations, soundtrack, start_btn, status]
+        yield chat_history, reasoning, "", None, gr.update(visible=False), "✨ Vibe analysis complete!"
+    except Exception as e:
+        yield [], f"Error: {e}\n{traceback.format_exc()}", "", None, gr.update(visible=True), "❌ Error occurred"
+def add_user_message(user_message: str, history: List[Dict[str, str]]):
+    """
+    Step 1 of Chat: Add user message to history in the new Chatbot format.
+    """
+    if not user_message.strip():
+        return history, ""
+    # Append the new message in the List[Dict] format
+    new_message = {"role": "user", "content": user_message}
+    return history + [new_message], ""
+def generate_bot_response(history: List[Dict[str, str]], session_id: str):
+    """
+    Step 2 of Chat: Call agent and update history with response.
+    Uses yield to show loading status.
+    """
+    print(f"[DEBUG] generate_bot_response called with session_id={session_id}")
+    print(f"[DEBUG] history has {len(history) if history else 0} messages")
+    # Get the last user message from the List[Dict] history
+    if not history or history[-1]["role"] != "user":
+        # Should not happen in normal flow, but safety check
+        print("[DEBUG] No user message found in history")
+        yield history, "No message to process", "", None, ""
+        return
+    # The user message is already in history, we only need the content to resume the agent
+    user_content = history[-1]["content"]
+    # Gradio 6 may return content as a list of dicts with 'text' key
+    if isinstance(user_content, list):
+        user_message = " ".join(item.get("text", str(item)) for item in user_content if isinstance(item, dict))
+    else:
+        user_message = str(user_content)
+    print(f"[DEBUG] Resuming agent with user_message: {user_message[:50]}...")
+    try:
+        # Show loading status
+        yield history, "", "", None, "🔄 Processing your response..."
+        # Resume agent execution using the session_id
+        result = run_agent(images=[], user_message=user_message, thread_id=session_id)
+        print(f"[DEBUG] run_agent returned: {type(result)}")
+        if result:
+            print(f"[DEBUG] result keys: {result.keys() if isinstance(result, dict) else 'N/A'}")
+        if result is None:
+            print("[DEBUG] result is None - agent may not have resumed properly")
+            history.append({"role": "assistant", "content": "Error: Agent did not return a response."})
+            yield history, "Agent returned None", "", None, "❌ Agent error"
+            return
+        # CRUCIAL FIX: The agent returns the full updated history in the List[Dict] format
+        updated_history = result["messages"]
+        reasoning = "\n".join(result.get("reasoning", []))
+        print(f"[DEBUG] updated_history has {len(updated_history)} messages")
+        # Check for final results
+        books_html = ""
+        if result.get("final_books"):
+            books_html = format_books_html(result["final_books"])
+        soundtrack = result.get("soundtrack_url", "") or None
+        # Determine status based on what happened
+        if result.get("final_books"):
+            status = "✅ Recommendations ready!"
+        elif "retrieved_books" in result and result["retrieved_books"]:
+            status = "📚 Books retrieved, refining..."
+        else:
+            status = "💭 Awaiting your input..."
+        # Outputs: [chatbot, reasoning, recommendations, soundtrack, status]
+        yield updated_history, reasoning, books_html, soundtrack, status
+    except Exception as e:
+        # Append error to chat by updating the last user message's response
+        error_msg = f"Agent Error: {str(e)}"
+        print(f"[DEBUG] Exception in generate_bot_response: {e}")
+        traceback.print_exc()
+        # Append assistant error message
+        history.append({"role": "assistant", "content": error_msg})
+        yield history, f"Error trace: {traceback.format_exc()}", "", None, "❌ Error occurred"
+def reset_app():
+    """Reset the session"""
+    new_id = get_session_id()
+    # Returns: [session_id, chatbot, reasoning, books, soundtrack, input, images, start_btn, status]
+    return new_id, [], "", "", None, "", None, gr.update(visible=True), "Ready to analyze your vibe!"
+# ============================================================================
+# LAYOUT
+# ============================================================================
+with gr.Blocks() as demo:
+    # State management for multi-user support
+    session_id = gr.State(get_session_id())
+    gr.Markdown("# 📚 The Vibe Reader", elem_id='main-title')
+    gr.Markdown("""
+**How it works:**
+- 🎨 **Vision AI** extracts mood, themes, and aesthetic keywords from your images
+- 📚 **Semantic search** queries a vector DB of 50k+ book recs from r/BooksThatFeelLikeThis
+- 💬 **Conversational refinement** asks targeted questions to narrow down preferences
+- 📖 **Google Books MCP** enriches results with covers, descriptions, and metadata
+- 🎵 **ElevenLabs AI** generates a custom soundtrack that matches your reading vibe
+""", elem_id='subtitle')
+    with gr.Row():
+        # Left: Inputs
+        with gr.Column(scale=1):
+            gr.Markdown("### 1. Upload Your Vibe")
+            image_input = gr.Gallery(label="Visual Inspiration", columns=3, height="300px")
+            load_examples_btn = gr.Button("📷 Load Example Images (Credits: @thegorgonist)", variant="secondary", size="md")
+            start_btn = gr.Button("🔮 Analyze Vibe", variant="primary", size="lg")
+            status_display = gr.Textbox(label="Status", value="Ready to analyze your vibe!", interactive=False, elem_id="status-display")
+            reset_btn = gr.Button("🔄 Start Over", variant="secondary")
+        # Right: Chat
+        with gr.Column(scale=1):
+            gr.Markdown("### 2. Refine & Discover")
+            # Chatbot now uses the new List[Dict] format
+            chatbot = gr.Chatbot(height=500, label="Agent Conversation")
+            with gr.Row():
+                msg_input = gr.Textbox(
+                    show_label=False,
+                    placeholder="Type your response here...",
+                    scale=4,
+                    container=False
+                )
+                submit_btn = gr.Button("Send", variant="primary", scale=1)
+    # Outputs - Recommendations first, then reasoning
+    recommendations_output = gr.HTML(label="Recommendations")
+    soundtrack_player = gr.Audio(label="Vibe Soundtrack", type="filepath", interactive=False)
+    with gr.Accordion("🔍 Internal Reasoning", open=True):
+        reasoning_display = gr.Textbox(label="Agent Thoughts", lines=10, interactive=False)
+    # ============================================================================
+    # INTERACTION LOGIC
+    # ============================================================================
+    # 0. Load Example Images
+    load_examples_btn.click(
+        fn=load_example_images,
+        inputs=[],
+        outputs=[image_input]
+    )
+    # 1. Start Analysis
+    start_btn.click(
+        fn=process_upload,
+        inputs=[image_input, session_id],
+        outputs=[chatbot, reasoning_display, recommendations_output, soundtrack_player, start_btn, status_display]
+    )
+    # 2. Chat Interaction (User enters text -> History updates -> Bot responds)
+    # User adds message to history optimistically and clears input
+    user_event = msg_input.submit(
+        fn=add_user_message,
+        inputs=[msg_input, chatbot],
+        outputs=[chatbot, msg_input],
+        queue=False
+    )
+    # Bot generates response and updates the full history
+    user_event.then(
+        fn=generate_bot_response,
+        inputs=[chatbot, session_id],
+        outputs=[chatbot, reasoning_display, recommendations_output, soundtrack_player, status_display]
+    )
+    submit_btn.click(
+        fn=add_user_message,
+        inputs=[msg_input, chatbot],
+        outputs=[chatbot, msg_input],
+        queue=False
+    ).then(
+        fn=generate_bot_response,
+        inputs=[chatbot, session_id],
+        outputs=[chatbot, reasoning_display, recommendations_output, soundtrack_player, status_display]
+    )
+    # 3. Reset
+    reset_btn.click(
+        fn=reset_app,
+        inputs=[],
+        outputs=[session_id, chatbot, reasoning_display, recommendations_output, soundtrack_player, msg_input, image_input, start_btn, status_display]
+    )
+if __name__ == "__main__":
     demo.queue().launch(theme=gr.themes.Monochrome(), css_paths='app/custom.css')