Spaces:

ajalisatgi
/

Gradio

Sleeping

App Files Files Community

ajalisatgi committed on Feb 18

Commit

2e77d5f

verified ·

1 Parent(s): a130567

Update app.py

Browse files

Files changed (1) hide show

app.py +63 -38

app.py CHANGED Viewed

@@ -7,52 +7,83 @@ from langchain_community.embeddings import HuggingFaceEmbeddings
 import torch
 import psutil
 import GPUtil
-# Set up logging with performance metrics
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 def get_system_metrics():
-    cpu_percent = psutil.cpu_percent()
-    memory_percent = psutil.virtual_memory().percent
-    if torch.cuda.is_available():
-        gpu = GPUtil.getGPUs()[0]
-        gpu_util = gpu.load * 100
-        gpu_memory = gpu.memoryUtil * 100
-    else:
-        gpu_util = 0
-        gpu_memory = 0
-    return cpu_percent, memory_percent, gpu_util, gpu_memory
 def process_query(query, dataset_choice="all"):
     start_time = time.time()
     try:
-        # Original query processing code here...
-        response = "Sample response"
-        # Calculate performance metrics
-        end_time = time.time()
-        processing_time = end_time - start_time
-        cpu_percent, memory_percent, gpu_util, gpu_memory = get_system_metrics()
-        metrics = f"""
-        Performance Metrics:
-        Processing Time: {processing_time:.2f}s
-        CPU Usage: {cpu_percent}%
-        Memory Usage: {memory_percent}%
-        GPU Utilization: {gpu_util:.1f}%
-        GPU Memory: {gpu_memory:.1f}%
         """
-        return response, metrics
     except Exception as e:
-        return str(e), "Metrics unavailable"
-# Enhanced Gradio interface with performance metrics
 demo = gr.Interface(
     fn=process_query,
     inputs=[
-        gr.Textbox(label="Question", placeholder="Ask any question..."),
         gr.Dropdown(
             choices=["all"] + dataset_names,
             label="Select Dataset",
@@ -63,16 +94,10 @@ demo = gr.Interface(
         gr.Textbox(label="Response"),
         gr.Textbox(label="Performance Metrics")
     ],
-    title="E5-Powered Multi-Dataset Knowledge Base",
-    description="Search across RagBench datasets with real-time performance monitoring",
-    analytics_enabled=True,
-    examples=[
-        ["What role does T-cell count play in severe human adenovirus type 55 (HAdV-55) infection?", "covidqa"],
-        ["In what school district is Governor John R. Rogers High School located?", "hotpotqa"],
-        ["What are the key financial metrics for Q3?", "finqa"]
-    ]
 )
 if __name__ == "__main__":
-    demo.queue()  # Enable queuing for performance monitoring
-    demo.launch(debug=True, show_api=True)

 import torch
 import psutil
 import GPUtil
+# Set up logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
+# Read the OpenAI API key from the environment instead of committing it to
+# source control. SECURITY: a literal secret key was previously hard-coded on
+# this line and published with the commit; that key must be revoked and rotated.
+import os
+openai.api_key = os.environ.get("OPENAI_API_KEY")
+if not openai.api_key:
+    logger.warning("OPENAI_API_KEY is not set; OpenAI requests will fail")
+# Initialize with E5 embedding model
+model_name = 'intfloat/e5-base-v2'
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+embedding_model = HuggingFaceEmbeddings(model_name=model_name)
+embedding_model.client.to(device)
+# Load datasets: one 'train' split per configured RagBench subset, keyed by name
+datasets = {}
+dataset_names = ['covidqa', 'hotpotqa', 'pubmedqa']  # Starting with key datasets
+for name in dataset_names:
+    datasets[name] = load_dataset("rungalileo/ragbench", name, split='train')
+    logger.info(f"Loaded {name}")
 def get_system_metrics():
+    """Return a snapshot of host resource usage as a dict.
+
+    Keys:
+        'cpu_percent' / 'memory_percent': values reported by psutil.
+        'gpu_util' / 'gpu_memory': `load` and `memoryUtil` of the first GPU
+            listed by GPUtil, multiplied by 100. Both are 0 when CUDA is
+            unavailable or GPUtil lists no GPU.
+    """
+    # Query GPUtil once, and only when CUDA is available. An empty list must
+    # not raise IndexError and take the whole request down with it.
+    gpus = GPUtil.getGPUs() if torch.cuda.is_available() else []
+    gpu = gpus[0] if gpus else None
+    metrics = {
+        'cpu_percent': psutil.cpu_percent(),
+        'memory_percent': psutil.virtual_memory().percent,
+        'gpu_util': gpu.load * 100 if gpu is not None else 0,
+        'gpu_memory': gpu.memoryUtil * 100 if gpu is not None else 0
+    }
+    return metrics
 def process_query(query, dataset_choice="all"):
+    """Answer `query` with gpt-3.5-turbo, using one keyword-matched document as context.
+
+    Args:
+        query: The user's question text.
+        dataset_choice: A key of the module-level `datasets` dict, or "all"
+            to search every loaded dataset.
+
+    Returns:
+        A `(response_text, metrics_text)` tuple of strings. If anything
+        raises, the first element is the exception message and the second is
+        a fixed placeholder string.
+    """
     start_time = time.time()
     try:
+        search_datasets = [dataset_choice] if dataset_choice != "all" else list(datasets)
+        # NOTE(review): retrieval here is plain keyword matching; the module's
+        # embedding_model is not used by this function.
+        match = _find_first_context(query, search_datasets)
+        context_info = f"From {match[1]}: {match[0]}" if match else "Searching across datasets..."
+        response = openai.chat.completions.create(
+            model="gpt-3.5-turbo",
+            messages=[
+                {"role": "system", "content": "You are a knowledgeable expert using E5 embeddings for precise information retrieval."},
+                {"role": "user", "content": f"Context: {context_info}\nQuestion: {query}"}
+            ],
+            max_tokens=300,
+            temperature=0.7,
+        )
+        # Get performance metrics
+        metrics = get_system_metrics()
+        metrics['processing_time'] = time.time() - start_time
+        metrics_display = f"""
+        Processing Time: {metrics['processing_time']:.2f}s
+        CPU Usage: {metrics['cpu_percent']}%
+        Memory Usage: {metrics['memory_percent']}%
+        GPU Utilization: {metrics['gpu_util']:.1f}%
+        GPU Memory: {metrics['gpu_memory']:.1f}%
         """
+        return response.choices[0].message.content.strip(), metrics_display
     except Exception as e:
+        # UI boundary: keep the traceback in the logs, show only the message.
+        logger.exception("process_query failed")
+        return str(e), "Metrics collection in progress"
+
+
+def _find_first_context(query, dataset_keys):
+    """Return `(passage, dataset_name)` for the first passage containing any query word, else None."""
+    # Lower-case the query words once instead of once per document.
+    keywords = [word.lower() for word in query.split()]
+    for dataset_name in dataset_keys:
+        if dataset_name not in datasets:
+            continue
+        for doc in datasets[dataset_name]['documents']:
+            # A row may be a single string or a list of passage strings
+            # (assumption - TODO confirm against the dataset schema).
+            passages = [doc] if isinstance(doc, str) else doc
+            for passage in passages:
+                text = passage.lower()
+                if any(keyword in text for keyword in keywords):
+                    # Only the first match is ever used, so stop scanning here.
+                    return passage, dataset_name
+    return None
+# Create Gradio interface
 demo = gr.Interface(
     fn=process_query,
     inputs=[
+        gr.Textbox(label="Question", placeholder="Ask your question here"),
         gr.Dropdown(
             choices=["all"] + dataset_names,
             label="Select Dataset",
         gr.Textbox(label="Response"),
         gr.Textbox(label="Performance Metrics")
     ],
+    title="E5-Powered Knowledge Base",
+    description="Search across RagBench datasets with performance monitoring"
 )
 if __name__ == "__main__":
+    # Runs only when this file is executed as a script: queue() is called on
+    # the interface first, then launch() is started with debug=True.
+    demo.queue()
+    demo.launch(debug=True)