Spaces:

kingabzpro
/

RegRadar

Sleeping

App Files Files Community

Abid Ali Awan committed on Jun 24

Commit

6598f74

1 Parent(s): 8159b22

Enhance app.py to implement a Gradio interface for the RegRadar AI Regulatory Compliance Assistant, featuring a chatbot, example queries, and a tool information panel. Refactor UIHandler to streamline chat processing and improve regulatory query handling. Update web_tools.py to modularize crawling and searching functionalities, enhancing code readability and maintainability.

Browse files

Files changed (4) hide show

agents/ui_handler.py +75 -174
app.py +118 -1
tools/memory_tools.py +5 -3
tools/web_tools.py +65 -38

agents/ui_handler.py CHANGED Viewed

@@ -6,7 +6,6 @@ import gradio as gr
 from gradio import ChatMessage
 from agents.reg_radar import RegRadarAgent
-from config.settings import AVATAR_IMAGES
 from tools.llm import stream_llm
@@ -37,26 +36,37 @@ class UIHandler:
         is_regulatory = self.agent.is_regulatory_query(message)
         if not is_regulatory:
-            # General chat
-            history.append(
-                ChatMessage(role="assistant", content="💬 Processing general query...")
-            )
-            yield history, "", gr.update(interactive=False), user_id_state
-            # Clear processing message and stream response
-            history.pop()
-            streaming_content = ""
-            history.append(ChatMessage(role="assistant", content=""))
-            for chunk in stream_llm(message):
-                streaming_content += chunk
-                history[-1] = ChatMessage(role="assistant", content=streaming_content)
-                yield history, "", gr.update(interactive=False), user_id_state
-            # Re-enable input box at the end
-            yield history, "", gr.update(interactive=True), user_id_state
-            return
         # Show tool detection
         tool_key, tool_name = self.agent.determine_intended_tool(message)
@@ -102,51 +112,13 @@ class UIHandler:
         # Show collapsible raw results
         if crawl_results["results"]:
-            # Format results for display, remove duplicates by URL
-            seen_urls = set()
-            results_display = []
-            count = 0
-            for result in crawl_results["results"]:
-                url = result["url"]
-                if url in seen_urls:
-                    continue
-                seen_urls.add(url)
-                title = result["title"][:100] if result["title"] else "No Title"
-                count += 1
-                results_display.append(f"""
-**{count}. {result["source"]}**
-- Title: {title}...
-- URL: {url}
-""")
-            if results_display:
-                collapsible_results = f"""
-<details>
-<summary><strong>📋 Raw Regulatory Data</strong> - Click to expand</summary>
-{"".join(results_display)}
-</details>
-"""
-            else:
-                collapsible_results = "<details><summary><strong>📋 Raw Regulatory Data</strong> - Click to expand</summary>\nNo unique regulatory updates found.\n</details>"
             history.append(ChatMessage(role="assistant", content=collapsible_results))
             yield history, "", gr.update(interactive=False), user_id_state
         # Display memory results if available
         if memory_results:
-            top_memories = memory_results[:3]
-            memory_details = ""
-            for i, mem in enumerate(top_memories, 1):
-                memory_text = mem.get("memory", "N/A")
-                memory_details += f"\n**{i}. Memory:** {memory_text[:300]}...\n"
-            memory_msg = f"""
-<details>
-<summary><strong>💾 Related Past Queries</strong> - Click to expand</summary>
-Found {len(memory_results)} similar past queries in memory. Top 3 shown below:
-{memory_details}
-</details>
-"""
             history.append(ChatMessage(role="assistant", content=memory_msg))
             yield history, "", gr.update(interactive=False), user_id_state
@@ -186,124 +158,53 @@ Found {len(memory_results)} similar past queries in memory. Top 3 shown below:
             daemon=True,
         ).start()
-    def delayed_clear(self, user_id_state):
-        time.sleep(0.1)  # 100ms delay to allow generator cancellation
-        return [], "", gr.update(interactive=True), user_id_state
-    def create_ui(self):
-        """Create Gradio interface"""
-        with gr.Blocks(
-            title="RegRadar - AI Regulatory Compliance Assistant",
-            theme=gr.themes.Soft(),
-            css="""
-            .tool-status {
-                background-color: #f0f4f8;
-                padding: 10px;
-                border-radius: 5px;
-                margin: 10px 0;
-            }
-            """,
-        ) as demo:
-            # Header
-            gr.HTML("""
-            <center>
-                <h1>🛡️ RegRadar</h1>
-                AI-powered regulatory compliance assistant that monitors global regulations
-            </center>
-            """)
-            # Main chat interface
-            chatbot = gr.Chatbot(
-                height=400,
-                type="messages",
-                avatar_images=AVATAR_IMAGES,
-                show_copy_button=True,
-            )
-            with gr.Row(equal_height=True):
-                msg = gr.Textbox(
-                    placeholder="Ask about regulatory updates, compliance requirements, or any industry regulations...",
-                    show_label=False,
-                    scale=18,
-                    autofocus=True,
-                )
-                submit = gr.Button("Send", variant="primary", scale=1, min_width=60)
-                stop = gr.Button("Stop", variant="stop", scale=1, min_width=60)
-                clear = gr.Button("Clear", scale=1, min_width=60)
-            # Add user_id_state for session
-            user_id_state = gr.State()
-            # Example queries
-            example_queries = [
-                "Show me the latest SEC regulations for fintech",
-                "What are the new data privacy rules in the EU?",
-                "Any updates on ESG compliance for energy companies?",
-                "Scan for healthcare regulations in the US",
-                "What are the global trends in AI regulation?",
-            ]
-            gr.Examples(examples=example_queries, inputs=msg, label="Example Queries")
-            # Tool information panel
-            with gr.Accordion("🛠️ Available Tools", open=False):
-                gr.Markdown("""
-                ### RegRadar uses these intelligent tools:
-                **🧠 Query Type Detection**
-                - Automatically detects if your message is a regulatory compliance query or a general question
-                - Selects the appropriate tools and response style based on your intent
-                **📩 Information Extraction**
-                - Extracts key details (industry, region, keywords) from your command
-                - Ensures accurate and relevant regulatory analysis
-                **🔍 Regulatory Web Crawler**
-                - Crawls official regulatory websites (SEC, FDA, FTC, etc.)
-                - Searches for recent updates and compliance changes
-                - Focuses on last 30 days of content
-                **🌐 Regulatory Search Engine**
-                - Searches across multiple sources for regulatory updates
-                - Finds industry-specific compliance information
-                - Aggregates results from various regulatory bodies
-                **💾 Memory System**
-                - Remembers past queries and responses
-                - Learns from your compliance interests
-                - Provides context from previous interactions
-                - Each session creates a new user for personalization
-                **🤖 AI Analysis Engine**
-                - Analyzes and summarizes regulatory findings
-                - Generates actionable compliance recommendations
-                - Creates executive summaries and action items
-                """)
-            # Event handlers
-            submit_event = msg.submit(
-                self.streaming_chatbot,
-                [msg, chatbot, user_id_state],
-                [chatbot, msg, msg, user_id_state],
-            )
-            click_event = submit.click(
-                self.streaming_chatbot,
-                [msg, chatbot, user_id_state],
-                [chatbot, msg, msg, user_id_state],
-            )
-            stop.click(None, cancels=[submit_event, click_event])
-            clear.click(
-                self.delayed_clear,
-                inputs=[user_id_state],
-                outputs=[chatbot, msg, msg, user_id_state],
-            )
-            # Footer
-            gr.HTML("""
-            <div style="text-align: center; padding: 20px; color: #666; font-size: 0.9rem;">
-                <p>RegRadar monitors regulatory updates from the SEC, EU Commission, and other leading global authorities.</p>
-                <p>All analyses are AI-generated. Please verify findings with official regulatory sources.</p>
-            </div>
-            """)
-        return demo

 from gradio import ChatMessage
 from agents.reg_radar import RegRadarAgent
 from tools.llm import stream_llm
         is_regulatory = self.agent.is_regulatory_query(message)
         if not is_regulatory:
+            yield from self._handle_general_chat(message, history, user_id_state)
+            return
+        yield from self._handle_regulatory_chat(
+            message, history, user_id_state, user_id, start_time
+        )
+    def _handle_general_chat(self, message, history, user_id_state):
+        """Handle general (non-regulatory) chat flow."""
+        history.append(
+            ChatMessage(role="assistant", content="💬 Processing general query...")
+        )
+        yield history, "", gr.update(interactive=False), user_id_state
+        # Clear processing message and stream response
+        history.pop()
+        streaming_content = ""
+        history.append(ChatMessage(role="assistant", content=""))
+        for chunk in stream_llm(message):
+            streaming_content += chunk
+            history[-1] = ChatMessage(role="assistant", content=streaming_content)
+            yield history, "", gr.update(interactive=False), user_id_state
+        # Re-enable input box at the end
+        yield history, "", gr.update(interactive=True), user_id_state
+    def _handle_regulatory_chat(
+        self, message, history, user_id_state, user_id, start_time
+    ):
+        """Handle regulatory chat flow."""
         # Show tool detection
         tool_key, tool_name = self.agent.determine_intended_tool(message)
         # Show collapsible raw results
         if crawl_results["results"]:
+            collapsible_results = self._format_crawl_results(crawl_results["results"])
             history.append(ChatMessage(role="assistant", content=collapsible_results))
             yield history, "", gr.update(interactive=False), user_id_state
         # Display memory results if available
         if memory_results:
+            memory_msg = self._format_memory_results(memory_results)
             history.append(ChatMessage(role="assistant", content=memory_msg))
             yield history, "", gr.update(interactive=False), user_id_state
             daemon=True,
         ).start()
+    def _format_crawl_results(self, results):
+        """Format crawl results for display, removing duplicates by URL."""
+        seen_urls = set()
+        results_display = []
+        count = 0
+        for result in results:
+            url = result["url"]
+            if url in seen_urls:
+                continue
+            seen_urls.add(url)
+            title = result["title"][:100] if result["title"] else "No Title"
+            count += 1
+            results_display.append(f"""
+**{count}. {result["source"]}**
+- Title: {title}...
+- URL: {url}
+""")
+        if results_display:
+            collapsible_results = f"""
+<details>
+<summary><strong>📋 Raw Regulatory Data</strong> - Click to expand</summary>
+{"".join(results_display)}
+</details>
+"""
+        else:
+            collapsible_results = "<details><summary><strong>📋 Raw Regulatory Data</strong> - Click to expand</summary>\nNo unique regulatory updates found.\n</details>"
+        return collapsible_results
+    def _format_memory_results(self, memory_results):
+        """Format memory results for display."""
+        top_memories = memory_results[:3]
+        memory_details = ""
+        for i, mem in enumerate(top_memories, 1):
+            memory_text = mem.get("memory", "N/A")
+            memory_details += f"\n**{i}. Memory:** {memory_text[:300]}...\n"
+        memory_msg = f"""
+<details>
+<summary><strong>💾 Related Past Queries</strong> - Click to expand</summary>
+Found {len(memory_results)} similar past queries in memory. Top 3 shown below:
+{memory_details}
+</details>
+"""
+        return memory_msg
+    def delayed_clear(self, user_id_state):
+        time.sleep(0.1)  # 100ms delay to allow generator cancellation
+        return [], "", gr.update(interactive=True), user_id_state

app.py CHANGED Viewed

@@ -7,14 +7,131 @@ compliance guidance for various industries and regions.
 import warnings
 from agents.ui_handler import UIHandler
 warnings.filterwarnings("ignore", category=DeprecationWarning)
 def create_demo():
     ui_handler = UIHandler()  # New user for each session
-    return ui_handler.create_ui()
 def main():

 import warnings
+import gradio as gr
 from agents.ui_handler import UIHandler
+from config.settings import AVATAR_IMAGES
 warnings.filterwarnings("ignore", category=DeprecationWarning)
 def create_demo():
+    """Build the RegRadar Gradio Blocks UI and wire it to a ``UIHandler``.
+
+    Returns:
+        The constructed ``gr.Blocks`` instance; it is not launched here.
+    """
+    # NOTE(review): one UIHandler is created per create_demo() call; whether that
+    # amounts to "one per session" depends on how callers use this function.
     ui_handler = UIHandler()  # New user for each session
+    with gr.Blocks(
+        title="RegRadar - AI Regulatory Compliance Assistant",
+        theme=gr.themes.Soft(),
+        css="""
+        .tool-status {
+            background-color: #f0f4f8;
+            padding: 10px;
+            border-radius: 5px;
+            margin: 10px 0;
+        }
+        """,
+    ) as demo:
+        # Header
+        gr.HTML("""
+        <center>
+            <h1>🛡️ RegRadar</h1>
+            AI-powered regulatory compliance assistant that monitors global regulations
+        </center>
+        """)
+        # Main chat interface
+        chatbot = gr.Chatbot(
+            height=400,
+            type="messages",
+            avatar_images=AVATAR_IMAGES,
+            show_copy_button=True,
+        )
+        with gr.Row(equal_height=True):
+            msg = gr.Textbox(
+                placeholder="Ask about regulatory updates, compliance requirements, or any industry regulations...",
+                show_label=False,
+                scale=18,
+                autofocus=True,
+            )
+            submit = gr.Button("Send", variant="primary", scale=1, min_width=60)
+            stop = gr.Button("Stop", variant="stop", scale=1, min_width=60)
+            clear = gr.Button("Clear", scale=1, min_width=60)
+        # Add user_id_state for session
+        user_id_state = gr.State()
+        # Example queries
+        example_queries = [
+            "Show me the latest SEC regulations for fintech",
+            "What are the new data privacy rules in the EU?",
+            "Any updates on ESG compliance for energy companies?",
+            "Scan for healthcare regulations in the US",
+            "What are the global trends in AI regulation?",
+        ]
+        gr.Examples(examples=example_queries, inputs=msg, label="Example Queries")
+        # Tool information panel
+        with gr.Accordion("🛠️ Available Tools", open=False):
+            gr.Markdown("""
+            ### RegRadar uses these intelligent tools:
+            **🧠 Query Type Detection**
+            - Automatically detects if your message is a regulatory compliance query or a general question
+            - Selects the appropriate tools and response style based on your intent
+            **📩 Information Extraction**
+            - Extracts key details (industry, region, keywords) from your command
+            - Ensures accurate and relevant regulatory analysis
+            **🔍 Regulatory Web Crawler**
+            - Crawls official regulatory websites (SEC, FDA, FTC, etc.)
+            - Searches for recent updates and compliance changes
+            - Focuses on last 30 days of content
+            **🌐 Regulatory Search Engine**
+            - Searches across multiple sources for regulatory updates
+            - Finds industry-specific compliance information
+            - Aggregates results from various regulatory bodies
+            **💾 Memory System**
+            - Remembers past queries and responses
+            - Learns from your compliance interests
+            - Provides context from previous interactions
+            - Each session creates a new user for personalization
+            **🤖 AI Analysis Engine**
+            - Analyzes and summarizes regulatory findings
+            - Generates actionable compliance recommendations
+            - Creates executive summaries and action items
+            """)
+        # Event handlers
+        # msg is listed twice in the outputs: the handlers produce 4-tuples of
+        # (history, textbox value, textbox update, user id), so the second and
+        # third items both target the textbox (its text and its interactivity).
+        submit_event = msg.submit(
+            ui_handler.streaming_chatbot,
+            [msg, chatbot, user_id_state],
+            [chatbot, msg, msg, user_id_state],
+        )
+        click_event = submit.click(
+            ui_handler.streaming_chatbot,
+            [msg, chatbot, user_id_state],
+            [chatbot, msg, msg, user_id_state],
+        )
+        # Stop has no handler of its own; it only cancels the two events above.
+        stop.click(None, cancels=[submit_event, click_event])
+        clear.click(
+            ui_handler.delayed_clear,
+            inputs=[user_id_state],
+            outputs=[chatbot, msg, msg, user_id_state],
+        )
+        # Footer
+        gr.HTML("""
+        <div style="text-align: center; padding: 20px; color: #666; font-size: 0.9rem;">
+            <p>RegRadar monitors regulatory updates from the SEC, EU Commission, and other leading global authorities.</p>
+            <p>All analyses are AI-generated. Please verify findings with official regulatory sources.</p>
+        </div>
+        """)
+    return demo
 def main():

tools/memory_tools.py CHANGED Viewed

@@ -1,10 +1,13 @@
-from typing import List, Dict
 from mem0 import MemoryClient
 from config.settings import MEM0_API_KEY
 # Initialize memory client
 mem0_client = MemoryClient(api_key=MEM0_API_KEY)
 class MemoryTools:
     def save_to_memory(self, user_id: str, query: str, response: str):
         """Save interaction to memory"""
@@ -26,6 +29,5 @@ class MemoryTools:
         try:
             memories = mem0_client.search(query=query, user_id=user_id, limit=3)
             return memories
-        except:
             return []

+from typing import Dict, List
 from mem0 import MemoryClient
 from config.settings import MEM0_API_KEY
 # Initialize memory client
 mem0_client = MemoryClient(api_key=MEM0_API_KEY)
 class MemoryTools:
     def save_to_memory(self, user_id: str, query: str, response: str):
         """Save interaction to memory"""
         try:
             memories = mem0_client.search(query=query, user_id=user_id, limit=3)
             return memories
+        except Exception:
             return []

tools/web_tools.py CHANGED Viewed

@@ -15,46 +15,71 @@ class WebTools:
         self.cached_searches = {}
     def generate_cache_key(self, industry: str, region: str, keywords: str) -> str:
-        """Generate a unique cache key"""
         key = f"{industry}:{region}:{keywords}".lower()
         return hashlib.md5(key.encode()).hexdigest()
     def crawl_regulatory_sites(self, industry: str, region: str, keywords: str) -> Dict:
-        """Crawl regulatory websites for updates"""
-        # Check cache first
         cache_key = self.generate_cache_key(industry, region, keywords)
         if cache_key in self.cached_searches:
             return self.cached_searches[cache_key]
         urls_to_crawl = REGULATORY_SOURCES.get(region, REGULATORY_SOURCES["US"])
         all_results = []
         crawl_instructions = (
             f"Recent {industry} {region} regulatory updates: {keywords}, 30 days"
         )
-        # Crawl regulatory sites
         for source_name, url in list(urls_to_crawl.items())[:3]:
-            try:
-                crawl_response = tavily_client.crawl(
-                    url=url, max_depth=2, limit=5, instructions=crawl_instructions
-                )
-                for result in crawl_response.get("results", []):
-                    title = result.get("title")
-                    if not title or title == "No Title...":
-                        title = SOURCE_FULL_NAMES.get(source_name, source_name)
-                    all_results.append(
-                        {
-                            "source": source_name,
-                            "url": result.get("url", url),
-                            "title": title,
-                            "content": result.get("raw_content", "")[:1500],
-                        }
-                    )
-            except Exception as e:
-                print(f"Crawl error for {source_name}: {e}")
         # General search
         try:
             search_results = tavily_client.search(
                 query=f"{industry} {region} regulatory updates compliance {keywords} 2024 2025",
@@ -62,7 +87,7 @@ class WebTools:
                 include_raw_content=True,
             )
             for result in search_results.get("results", []):
-                all_results.append(
                     {
                         "source": "Web Search",
                         "url": result.get("url", ""),
@@ -72,24 +97,26 @@ class WebTools:
                 )
         except Exception as e:
             print(f"Search error: {e}")
-        results = {"results": all_results, "total_found": len(all_results)}
-        self.cached_searches[cache_key] = results
         return results
     def extract_parameters(self, message: str) -> Dict:
-        """Extract industry, region, and keywords from the query using LLM (no function calling)."""
-        prompt = f"""
-        Extract the following information from the user query below and return ONLY a valid JSON object with keys: industry, region, keywords.
-        - industry: The industry mentioned or implied (e.g., fintech, healthcare, energy, general).
-        - region: The region or country explicitly mentioned (e.g., US, EU, UK, Asia, Global).
-        - keywords: The most important regulatory topics or terms, separated by commas. Do NOT include generic words or verbs.
-        User query: {message}
-        Example output:
-        {{"industry": "fintech", "region": "US", "keywords": "SEC regulations"}}
         """
         import json
         response = call_llm(prompt)

         self.cached_searches = {}
     def generate_cache_key(self, industry: str, region: str, keywords: str) -> str:
+        """
+        Build the cache key for an industry/region/keywords combination.
+
+        The three values are joined with ":" and lower-cased before hashing, so
+        inputs that differ only in letter case produce the same key.
+
+        Returns:
+            The MD5 hex digest of the joined, lower-cased string.
+        """
         key = f"{industry}:{region}:{keywords}".lower()
         return hashlib.md5(key.encode()).hexdigest()
     def crawl_regulatory_sites(self, industry: str, region: str, keywords: str) -> Dict:
+        """
+        Collect regulatory updates for an industry/region/keywords combination.
+
+        Returns the cached result when this instance has already handled the
+        same combination. Otherwise it crawls up to three of the sources
+        configured for ``region`` (falling back to the "US" sources when the
+        region has no entry), adds the general web-search results, caches the
+        combined result and returns it.
+
+        Returns:
+            Dict with ``results`` (the combined list of result entries) and
+            ``total_found`` (the length of that list).
+        """
         cache_key = self.generate_cache_key(industry, region, keywords)
         if cache_key in self.cached_searches:
             return self.cached_searches[cache_key]
         urls_to_crawl = REGULATORY_SOURCES.get(region, REGULATORY_SOURCES["US"])
         all_results = []
         crawl_instructions = (
             f"Recent {industry} {region} regulatory updates: {keywords}, 30 days"
         )
+        # Crawl regulatory sites (limit to 3 sources)
         for source_name, url in list(urls_to_crawl.items())[:3]:
+            crawl_results = self._get_crawl_results(
+                source_name, url, crawl_instructions
+            )
+            all_results.extend(crawl_results)
         # General search
+        search_results = self._get_search_results(industry, region, keywords)
+        all_results.extend(search_results)
+        results = {"results": all_results, "total_found": len(all_results)}
+        # Stored unconditionally, so an empty result list is cached as well.
+        self.cached_searches[cache_key] = results
+        return results
+    def _get_crawl_results(self, source_name: str, url: str, instructions: str) -> list:
+        """
+        Crawl a single regulatory source and return formatted results.
+        """
+        results = []
+        try:
+            crawl_response = tavily_client.crawl(
+                url=url, max_depth=2, limit=5, instructions=instructions
+            )
+            for result in crawl_response.get("results", []):
+                title = result.get("title")
+                if not title or title == "No Title...":
+                    title = SOURCE_FULL_NAMES.get(source_name, source_name)
+                results.append(
+                    {
+                        "source": source_name,
+                        "url": result.get("url", url),
+                        "title": title,
+                        "content": result.get("raw_content", "")[:1500],
+                    }
+                )
+        except Exception as e:
+            print(f"Crawl error for {source_name}: {e}")
+        return results
+    def _get_search_results(self, industry: str, region: str, keywords: str) -> list:
+        """
+        Perform a general web search and return formatted results.
+        """
+        results = []
         try:
             search_results = tavily_client.search(
                 query=f"{industry} {region} regulatory updates compliance {keywords} 2024 2025",
                 include_raw_content=True,
             )
             for result in search_results.get("results", []):
+                results.append(
                     {
                         "source": "Web Search",
                         "url": result.get("url", ""),
                 )
         except Exception as e:
             print(f"Search error: {e}")
         return results
     def extract_parameters(self, message: str) -> Dict:
         """
+        Extract industry, region, and keywords from the query using LLM (no function calling).
+        """
+        prompt = (
+            """
+            Extract the following information from the user query below and return ONLY a valid JSON object with keys: industry, region, keywords.
+            - industry: The industry mentioned or implied (e.g., fintech, healthcare, energy, general).
+            - region: The region or country explicitly mentioned (e.g., US, EU, UK, Asia, Global).
+            - keywords: The most important regulatory topics or terms, separated by commas. Do NOT include generic words or verbs.
+            User query: {message}
+            Example output:
+            {{"industry": "fintech", "region": "US", "keywords": "SEC regulations"}}
+            """
+        ).replace("{message}", message)
         import json
         response = call_llm(prompt)