Spaces:

Pixeltable
/

Call-Analysis-AI-Tool

Running

App Files Files Community

PierreBrunelle committed on Oct 16, 2024

Commit

f7689c9

verified ·

1 Parent(s): b24fd86

Create app.py

Browse files

Files changed (1) hide show

app.py +258 -0

app.py ADDED Viewed

	@@ -0,0 +1,258 @@

+import gradio as gr
+import pixeltable as pxt
+from pixeltable.iterators import FrameIterator, StringSplitter
+from pixeltable.functions.video import extract_audio
+from pixeltable.functions.audio import get_metadata
+from pixeltable.functions import openai
+import os
+import getpass
+import numpy as np
+from pixeltable.functions.huggingface import sentence_transformer
+# Store OpenAI API Key
+if 'OPENAI_API_KEY' not in os.environ:
+    os.environ['OPENAI_API_KEY'] = getpass.getpass('Enter your OpenAI API key:')
+MAX_VIDEO_SIZE_MB = 35
+def process_video(video_file, progress=gr.Progress()):
+    progress(0, desc="Initializing...")
+    try:
+        # Create a Table, a View, and Computed Columns
+        pxt.drop_dir('gong_demo', force=True)
+        pxt.create_dir('gong_demo')
+        calls_table = pxt.create_table(
+            'gong_demo.calls', {
+            "video": pxt.VideoType(nullable=True),
+            }
+        )
+        frames_view = pxt.create_view(
+            "gong_demo.frames",
+            calls_table,
+            iterator=FrameIterator.create(video=calls_table.video, fps=1)
+        )
+        # Create computed columns to store transformations and persist outputs
+        calls_table['audio'] = extract_audio(calls_table.video, format='mp3')
+        calls_table['metadata'] = get_metadata(calls_table.audio)
+        calls_table['transcription'] = openai.transcriptions(audio=calls_table.audio, model='whisper-1')
+        calls_table['transcription_text'] = calls_table.transcription.text.astype(pxt.StringType())
+        sentences_view = pxt.create_view(
+            'gong_demo.sentences',
+            calls_table,
+            iterator=StringSplitter.create(
+                text=calls_table.transcription_text,
+                separators='sentence'
+            )
+        )
+        @pxt.expr_udf
+        def e5_embed(text: str) -> np.ndarray:
+            return sentence_transformer(text, model_id='intfloat/e5-large-v2')
+        sentences_view.add_embedding_index('text', string_embed=e5_embed)
+        progress(0.2, desc="Creating UDFs...")
+        # Custom User-Defined Function (UDF) for Generating Insights
+        @pxt.udf
+        def generate_insights(transcription: str) -> list[dict]:
+            system_msg = 'You are an AI assistant that analyzes call transcriptions. Analyze the following call transcription and provide insights on: 1. Main topics discussed 2. Action items 3. Sentiment analysis 4. Key questions asked'
+            user_msg = f'Transcription: "{transcription}"'
+            return [
+                {'role': 'system', 'content': system_msg},
+                {'role': 'user', 'content': user_msg}
+            ]
+        # Apply the UDF to create a new column
+        calls_table['insights_prompt'] = generate_insights(calls_table.transcription_text)
+        progress(0.4, desc="Generating insights...")
+        # Generate insights using OpenAI's chat completion API
+        calls_table['insights_response'] = openai.chat_completions(messages=calls_table.insights_prompt, model='gpt-3.5-turbo', max_tokens=500)
+        # Extract the content of the response
+        calls_table['insights'] = calls_table.insights_response.choices[0].message.content
+        if not video_file:
+            return "Please upload a video file.", ""
+        # Check video file size
+        video_size = os.path.getsize(video_file) / (1024 * 1024)  # Convert to MB
+        if video_size > MAX_VIDEO_SIZE_MB:
+            return f"The video file is larger than {MAX_VIDEO_SIZE_MB} MB. Please upload a smaller file.", ""
+        progress(0.6, desc="Processing video...")
+        # Insert a video into the table
+        calls_table.insert([{"video": video_file}])
+        progress(0.8, desc="Retrieving results...")
+        # Retrieve transcription and insights
+        result = calls_table.select(calls_table.transcription_text, calls_table.insights).tail(1)
+        transcription = result['transcription_text'][0]
+        insights = result['insights'][0]
+        progress(1.0, desc="Processing complete")
+        return transcription, insights, "Processing complete"
+    except Exception as e:
+        return f"An error occurred during video processing: {str(e)}", ""
+# Perform similarity search
+def similarity_search(query, num_results, progress=gr.Progress()):
+    sentences_view  = pxt.get_table('gong_demo.sentences')
+    progress(0.5, desc="Performing search...")
+    sim = sentences_view.text.similarity(query)
+    results = sentences_view.order_by(sim, asc=False).limit(num_results).select(sentences_view.text, sim=sim).collect().to_pandas()
+    return results
+    progress(1.0, desc="Search complete")
+def chatbot_response(message, chat_history):
+    @pxt.udf
+    def create_chatbot_prompt(context: str, question: str) -> list[dict]:
+        system_message = "You are an AI assistant that answers questions about a call based on the provided context. If the answer cannot be found in the context, say that you don't know."
+        user_message = f"Context:\n{context}\n\nQuestion: {question}"
+        return [
+            {"role": "system", "content": system_message},
+            {"role": "user", "content": user_message}
+        ]
+    try:
+        sentences_view = pxt.get_table('gong_demo.sentences')
+        # Perform similarity search to get relevant context
+        sim = sentences_view.text.similarity(message)
+        context = sentences_view.order_by(sim, asc=False).limit(5).select(sentences_view.text, sim=sim).collect()
+        # Prepare the context for the prompt
+        context_text = "\n".join([row['text'] for row in context])
+        # Create a temporary table for the chatbot interaction
+        temp_table = pxt.create_table('gong_demo.temp_chatbot', {'question': pxt.StringType()})
+        temp_table.insert([{'question': message}])
+        # Create computed columns for the prompt and response
+        temp_table['chatbot_prompt'] = create_chatbot_prompt(context_text, temp_table.question)
+        temp_table['chatbot_response'] = openai.chat_completions(
+            messages=temp_table.chatbot_prompt,
+            model='gpt-3.5-turbo',
+            max_tokens=150
+        )
+        temp_table['answer'] = temp_table.chatbot_response.choices[0].message.content
+        answer = temp_table.select(temp_table.answer).collect()['answer'][0]
+        # Clean up the temporary table
+        pxt.drop_table('gong_demo.temp_chatbot', force=True)
+        chat_history.append((message, answer))
+        return "", chat_history  # Return both expected outputs
+    except Exception as e:
+        error_message = f"An error occurred: {str(e)}"
+        chat_history.append((message, error_message))
+        return "", chat_history  # Return both expec
+# Gradio interface
+with gr.Blocks(theme=gr.themes.Base()) as demo:
+    gr.Markdown(
+        """
+        <div style="text-align: left; margin-bottom: 20px;">
+            <img src="https://raw.githubusercontent.com/pixeltable/pixeltable/main/docs/source/data/pixeltable-logo-large.png" alt="Pixeltable" style="max-width: 150px;" />
+            <h1 style="margin-top: 10px;">Call Analysis AI Tool</h1>
+        </div>
+        """
+    )
+    gr.HTML(
+        """
+        <p style="text-align: left;">
+            Powered by <a href="https://github.com/pixeltable/pixeltable" target="_blank" style="color: #F25022; text-decoration: none; font-weight: bold;">Pixeltable</a>
+            - Analyze calls, extract insights, and interact with AI-powered assistance.
+        </p>
+        """
+    )
+    with gr.Row():
+        with gr.Column():
+            with gr.Accordion("🎯 What does it do?", open=False):
+                gr.Markdown("""
+                - 🎙️ Transcribes call audio to text
+                - 💡 Generates insights and key points
+                - 🔍 Enables content-based similarity search
+                - 🤖 Provides an AI chatbot for in-depth analysis
+                - 📊 Offers summaries of call data
+                """)
+        with gr.Column():
+            with gr.Accordion("🛠️ How does it work?", open=False):
+                gr.Markdown("""
+                1. 📤 Upload your call recording (video)
+                2. ⚙️ AI processes and analyzes the content
+                3. 📝 Review the transcript and generated insights
+                4. 🔎 Use similarity search to explore specific topics
+                5. 💬 Interact with the AI chatbot for deeper understanding
+                """)
+    with gr.Row():
+        with gr.Column(scale=1):
+            video_file = gr.Video(
+                label=f"Upload Call Recording (max {MAX_VIDEO_SIZE_MB} MB)",
+            )
+            process_btn = gr.Button("Analyze Call", variant="primary")
+            status_output = gr.Textbox(label="Status", interactive=False)
+        with gr.Column(scale=2):
+            with gr.Tabs() as tabs:
+                with gr.TabItem("📝 Transcript"):
+                    output_transcription = gr.Textbox(label="Call Transcription", lines=15)
+                with gr.TabItem("💡 Insights"):
+                    output_insights = gr.Textbox(label="Key Takeaways", lines=10)
+                with gr.TabItem("🔍 Similarity Search"):
+                    with gr.Row():
+                        similarity_query = gr.Textbox(label="Search Query", placeholder="Enter a topic or phrase to search for")
+                        num_results = gr.Slider(minimum=1, maximum=20, value=5, step=1, label="Number of Results")
+                    similarity_search_btn = gr.Button("Search", variant="secondary")
+                    similarity_results = gr.DataFrame(
+                        headers=["Relevant Text", "Similarity Score"],
+                        label="Search Results"
+                    )
+                with gr.TabItem("🤖 AI Assistant"):
+                    chatbot = gr.Chatbot(height=400, label="Chat with AI about the call")
+                    with gr.Row():
+                        msg = gr.Textbox(label="Ask a question about the call", placeholder="e.g., What were the main points discussed?", scale=4)
+                        send_btn = gr.Button("Send", variant="secondary", scale=1)
+                    clear = gr.Button("Clear Chat")
+    process_btn.click(
+        process_video,
+        inputs=[video_file],
+        outputs=[output_transcription, output_insights, status_output],
+        show_progress="full"
+    )
+    similarity_search_btn.click(
+        similarity_search,
+        inputs=[similarity_query, num_results],
+        outputs=[similarity_results]
+    )
+    msg.submit(chatbot_response, [msg, chatbot], [msg, chatbot])
+    send_btn.click(chatbot_response, [msg, chatbot], [msg, chatbot])
+    clear.click(lambda: None, None, chatbot, queue=False)
+if __name__ == "__main__":
+    demo.launch(debug=True)