summarizer-tool

Running

App Files Files Community

Chris4K committed 3 days ago

Commit

3ca5125

verified ·

1 Parent(s): 3b1ba42

Update app.py

Browse files

Files changed (1) hide show

app.py +249 -60

app.py CHANGED Viewed

@@ -1,70 +1,259 @@
-from simple_sentiment import SimpleSentimentTool
-# Create an instance of the tool without preloading to avoid startup errors
-sentiment_tool = SimpleSentimentTool(default_model="distilbert", preload=False)
-# Launch the Gradio interface
-if __name__ == "__main__":
-    import gradio as gr
-    with gr.Blocks(title="Sentiment Analysis Tool") as demo:
-        gr.Markdown("# Multi-Model Sentiment Analysis Tool")
-        with gr.Row():
-            with gr.Column():
-                text_input = gr.Textbox(
-                    label="Enter text to analyze",
-                    placeholder="Type your text here...",
-                    lines=5
-                )
-                model_dropdown = gr.Dropdown(
-                    choices=list(sentiment_tool.models.keys()),
-                    value=sentiment_tool.default_model,
-                    label="Select Model"
-                )
-                with gr.Row():
-                    analyze_btn = gr.Button("Analyze Sentiment")
-                    clear_btn = gr.Button("Clear")
-            with gr.Column():
-                output = gr.JSON(label="Sentiment Analysis Results")
-        def analyze_with_model(text, model_key):
-            """Call the tool's forward method directly with appropriate parameters."""
-            if not text:
-                return "{\"error\": \"Please enter some text to analyze\"}"
-            # The tool returns a JSON string now
-            json_str = sentiment_tool.forward(text, model_key)
-            # But we need to parse it for the Gradio JSON component
-            import json
-            try:
-                return json.loads(json_str)
-            except:
-                return {"error": "Failed to parse results"}
-        analyze_btn.click(
-            fn=analyze_with_model,
-            inputs=[text_input, model_dropdown],
-            outputs=output
         )
-        clear_btn.click(
-            fn=lambda: ("", None),
-            inputs=None,
-            outputs=[text_input, output]
-        )
-        gr.Examples(
-            examples=[
-                ["I love this product! It's amazing and works perfectly.", "distilbert"],
-                ["This movie was terrible. I was very disappointed.", "distilbert"],
-                ["The service was okay, but could be improved in several ways.", "distilbert"],
-                ["Ce produit est vraiment excellent!", "multilingual"],
-                ["Dieses Buch ist sehr interessant.", "german"]
-            ],
-            inputs=[text_input, model_dropdown]
-        )
-    demo.launch(share=True)

+import os
+import gradio as gr
+import warnings
+from smolagents import CodeAgent, InferenceClientModel
+import json
+# Suppress unnecessary warnings
+warnings.filterwarnings("ignore")
+# Import our Text Summarizer Tool
+from summarizer_tool import TextSummarizerTool
+# Initialize the Text Summarizer Tool
+summarizer_tool = TextSummarizerTool()
+# Load HuggingFace token from environment variable if available
+hf_token = os.environ.get("HF_TOKEN")
+# Sample texts for quick testing
+sample_texts = {
+    "News Article": """
+    The European Union has approved a landmark artificial intelligence law, establishing comprehensive
+    regulations for AI systems according to their potential risks. The regulation categorizes AI into
+    four risk levels: unacceptable risk, high risk, limited risk, and minimal risk. Systems deemed to
+    pose unacceptable risks, such as those using subliminal manipulation or social scoring, will be
+    banned. High-risk systems, including those used in critical infrastructure, education, employment,
+    and law enforcement, will face strict requirements before market entry. These requirements include
+    risk assessments, high-quality datasets, detailed documentation, human oversight, and transparency.
+    The law aims to ensure AI systems are safe, transparent, traceable, non-discriminatory, and
+    environmentally friendly, while fostering innovation and establishing Europe as a leader in
+    responsible AI development.
+    """,
+    "Scientific Paper Abstract": """
+    Recent advancements in large language models (LLMs) have demonstrated remarkable capabilities
+    across various tasks. However, these models still face challenges with reasoning, factuality,
+    and potential biases. This paper introduces a novel framework for enhancing LLM performance
+    through a multi-stage processing pipeline that integrates retrieval-augmented generation,
+    self-reflection mechanisms, and external knowledge verification. Our approach, which we call
+    RACER (Retrieval-Augmented Chain-of-thought Enhanced Reasoning), demonstrates significant
+    improvements across benchmarks testing reasoning (GSM8K, +12.3%), factuality (FACTOR, +17.8%),
+    and reduced bias (BBQ, -24.5%) compared to base models. Additionally, we show that RACER is
+    complementary to existing techniques like chain-of-thought prompting and can be applied to
+    various model architectures with minimal computational overhead. Through extensive ablation
+    studies, we identify the contribution of each component and provide insights for efficient
+    implementation in real-world applications.
+    """,
+    "Business Report": """
+    Q1 Financial Performance Summary: The company achieved significant growth in the first quarter,
+    with revenue reaching $78.5 million, a 24% increase compared to the same period last year. This
+    growth was primarily driven by our expanded product portfolio and increased market penetration in
+    European and Asian markets. Our flagship product line saw sales increase by 32%, while our new
+    service offerings contributed $12.3 million in revenue. Gross margin improved to 62.8% from 58.4%
+    in the previous year, reflecting our successful cost optimization initiatives and economies of scale.
+    Operating expenses were $28.7 million, up 15% year-over-year, primarily due to increased R&D
+    investments and marketing campaigns for new product launches. Despite these investments, operating
+    profit grew by 42% to $20.5 million, representing a 26.1% operating margin. Our customer base expanded
+    by 15%, with particularly strong growth in the enterprise segment. Looking ahead, we maintain our
+    full-year guidance of $320-340 million in revenue and anticipate continued margin improvement as we
+    scale operations.
+    """
+}
+# Function to directly use the summarizer tool
+def summarize_text(text, model, max_length, min_length, style):
+    """Summarize ``text`` by calling the module-level ``summarizer_tool`` directly.
+
+    Args:
+        text: Text to summarize.
+        model: Model identifier, forwarded to the tool unchanged.
+        max_length: Upper summary-length bound; converted with ``int()``. A falsy
+            value (``None``, ``0``, ``""``) is forwarded as ``None``.
+        min_length: Lower summary-length bound, handled like ``max_length``.
+        style: Summary style, forwarded to the tool unchanged.
+
+    Returns:
+        Whatever ``summarizer_tool`` returns, or a human-readable message string
+        when the input is rejected or the call raises.
+    """
+    try:
+        # Reject empty or whitespace-only input up front instead of sending it
+        # to the tool; agent_summarize applies the same kind of guard.
+        if not text or not text.strip():
+            return "Please provide text to summarize."
+        # Convert max_length and min_length to integers (falsy values become None)
+        max_length = int(max_length) if max_length else None
+        min_length = int(min_length) if min_length else None
+        # The UI sliders overlap (minimum goes up to 100, maximum down to 50),
+        # so an inverted range is reachable; report it instead of forwarding it.
+        if max_length is not None and min_length is not None and min_length > max_length:
+            return (
+                f"Minimum summary length ({min_length}) cannot exceed "
+                f"maximum summary length ({max_length})."
+            )
+        # Call the summarizer tool
+        return summarizer_tool(
+            text=text,
+            model=model,
+            max_length=max_length,
+            min_length=min_length,
+            style=style
+        )
+    except Exception as e:
+        # UI boundary: surface any failure as text in the output box rather than crashing
+        return f"Error summarizing text: {str(e)}"
+# Function to use the summarizer with an agent (if token available)
+def agent_summarize(text, instruction, temperature=0.7):
+    """Summarize ``text`` through a ``CodeAgent`` equipped with ``summarizer_tool``.
+
+    Args:
+        text: Text to summarize.
+        instruction: Free-form guidance placed ahead of the text in the agent prompt.
+        temperature: Sampling temperature; converted with ``float()`` and passed
+            to ``InferenceClientModel``.
+
+    Returns:
+        The value returned by ``agent.run``, or a human-readable message string
+        when the token is missing, an input is blank, or the call raises.
+    """
+    if not hf_token:
+        return "Agent summarization requires a HuggingFace API token. Please set the HF_TOKEN environment variable."
+    # Treat whitespace-only input as missing so a blank box never triggers a model call
+    if not (text and text.strip()) or not (instruction and instruction.strip()):
+        return "Please provide both text and instructions."
+    try:
+        # Initialize model for agent (built per call so the current temperature applies)
+        model = InferenceClientModel(
+            model_id="mistralai/Mistral-7B-Instruct-v0.2",
+            token=hf_token,
+            temperature=float(temperature)
         )
+        # Create the agent with our summarizer tool
+        agent = CodeAgent(tools=[summarizer_tool], model=model)
+        # Format the prompt with the instruction and text
+        prompt = f"Instruction: {instruction}\n\nText to summarize: {text}"
+        # Run the agent and hand its result straight back to the UI
+        return agent.run(prompt)
+    except Exception as e:
+        # UI boundary: surface any failure as text in the output box rather than crashing
+        return f"Error with agent summarization: {str(e)}"
+# Build the Gradio Blocks UI: a direct-tool tab and an agent tab, both fed by one sample-text dropdown
+with gr.Blocks(title="Advanced Text Summarizer") as demo:
+    gr.Markdown("# 📝 Advanced Text Summarizer")
+    gr.Markdown("Summarize text using different models and styles, with optional agent assistance.")
+    with gr.Tabs():
+        # Direct summarization tab: inputs and options in the first column, summary in the second
+        with gr.Tab("Direct Summarization"):
+            with gr.Row():
+                with gr.Column():
+                    # Input section: free-form text passed to summarize_text
+                    direct_text_input = gr.Textbox(
+                        label="Text to Summarize",
+                        placeholder="Enter text to summarize...",
+                        lines=10
+                    )
+                    # Sample texts dropdown: choices are the keys of sample_texts
+                    sample_dropdown = gr.Dropdown(
+                        choices=list(sample_texts.keys()),
+                        label="Or Select a Sample Text"
+                    )
+                    # Configuration options: model and style in one column, length sliders in the other
+                    with gr.Row():
+                        with gr.Column():
+                            model_dropdown = gr.Dropdown(
+                                choices=list(summarizer_tool.available_models.keys()),
+                                value="facebook/bart-large-cnn",  # NOTE(review): assumes this key exists in available_models - confirm
+                                label="Summarization Model"
+                            )
+                            style_dropdown = gr.Dropdown(
+                                choices=["concise", "detailed", "bullet_points"],
+                                value="concise",
+                                label="Summary Style"
+                            )
+                        with gr.Column():
+                            max_length_slider = gr.Slider(
+                                minimum=50,
+                                maximum=250,
+                                value=130,
+                                step=10,
+                                label="Maximum Summary Length"
+                            )
+                            min_length_slider = gr.Slider(
+                                minimum=10,
+                                maximum=100,  # NOTE(review): above max_length_slider's minimum of 50, so min > max is selectable
+                                value=30,
+                                step=5,
+                                label="Minimum Summary Length"
+                            )
+                    direct_summarize_button = gr.Button("Summarize Text")
+                with gr.Column():
+                    # Output section: receives whatever summarize_text returns (summary or error message)
+                    direct_output = gr.Textbox(label="Summary", lines=12)
+        # Agent-assisted summarization tab: text, instruction and temperature are passed to agent_summarize
+        with gr.Tab("Agent-Assisted Summarization"):
+            with gr.Row():
+                with gr.Column():
+                    # Input section: free-form text passed to agent_summarize
+                    agent_text_input = gr.Textbox(
+                        label="Text to Summarize",
+                        placeholder="Enter text to summarize...",
+                        lines=10
+                    )
+                    # Agent instruction, pre-filled with the first example instruction listed below
+                    instruction_input = gr.Textbox(
+                        label="Instructions for the Agent",
+                        placeholder="E.g., 'Summarize this text and highlight the three most important points'",
+                        lines=2,
+                        value="Summarize this text in a professional tone, highlighting key information."
+                    )
+                    # Sample instructions: selecting one copies it into instruction_input
+                    instruction_examples = gr.Dropdown(
+                        choices=[
+                            "Summarize this text in a professional tone, highlighting key information.",
+                            "Create a very concise summary focusing only on actionable items.",
+                            "Summarize this for a high school student, explaining complex terms.",
+                            "Extract the main argument and supporting evidence from this text.",
+                            "Create a summary that focuses on financial implications mentioned in the text."
+                        ],
+                        label="Or Select Example Instructions"
+                    )
+                    # Temperature setting: passed to agent_summarize as its third argument
+                    temperature_slider = gr.Slider(
+                        minimum=0.1,
+                        maximum=1.0,
+                        value=0.7,
+                        step=0.1,
+                        label="Agent Temperature (creativity)"
+                    )
+                    agent_summarize_button = gr.Button("Use Agent to Summarize")
+                with gr.Column():
+                    # Output section: receives whatever agent_summarize returns (result or error message)
+                    agent_output = gr.Textbox(label="Agent Response", lines=15)
+    # Set up event handlers (registered inside the Blocks context)
+    def load_sample(sample_name):
+        return sample_texts.get(sample_name, "")  # a name that is not a key (e.g. None) yields ""
+    def load_instruction(instruction):
+        return instruction  # identity: copies the dropdown value into the instruction box
+    sample_dropdown.change(
+        load_sample,
+        inputs=sample_dropdown,
+        outputs=direct_text_input
+    )
+    instruction_examples.change(
+        load_instruction,
+        inputs=instruction_examples,
+        outputs=instruction_input
+    )
+    direct_summarize_button.click(
+        summarize_text,
+        inputs=[direct_text_input, model_dropdown, max_length_slider, min_length_slider, style_dropdown],
+        outputs=direct_output
+    )
+    agent_summarize_button.click(
+        agent_summarize,
+        inputs=[agent_text_input, instruction_input, temperature_slider],
+        outputs=agent_output
+    )
+    # Second change listener on the same dropdown: the chosen sample also fills the agent tab's text box
+    sample_dropdown.change(
+        load_sample,
+        inputs=sample_dropdown,
+        outputs=agent_text_input
+    )
+# Launch the app only when this file is run as a script
+if __name__ == "__main__":
+    demo.launch()