Spaces:

mihirinamdar
/

arxiv-rag-optimized

Running

App Files Community

mihirinamdar committed on Jun 12

Commit

15f008d

verified ·

1 Parent(s): 0c71790

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -7

app.py CHANGED Viewed

@@ -256,11 +256,24 @@ class OptimizedRagSystem:
                 papers = []
                 search_query = query.strip()
-                # Simple query validation
                 if not search_query or len(search_query) < 2:
                     logger.warning("Query too short, using default search")
                     search_query = "machine learning"
                 if categories and len(categories) > 0:
                     category_filter = " OR ".join([f"cat:{cat.strip()}" for cat in categories if cat.strip()])
                     if category_filter:
@@ -269,6 +282,7 @@ class OptimizedRagSystem:
                 logger.info(f"🔍 ArXiv search attempt {attempt + 1}: '{search_query}'")
                 # Create search with timeout and retry settings
                 search = arxiv.Search(
                     query=search_query,
                     max_results=min(max_results, 50),  # Limit to prevent API issues
@@ -489,15 +503,23 @@ class OptimizedRagSystem:
             bm25_scores = bm25_scores[:min_length]
             chunks = self.chunks[:min_length]
-            # Normalize scores
-            if len(semantic_scores) > 0:
-                semantic_scores = (semantic_scores - semantic_scores.min()) / (semantic_scores.max() - semantic_scores.min() + 1e-8)
-            if len(bm25_scores) > 0:
-                bm25_scores = (bm25_scores - bm25_scores.min()) / (bm25_scores.max() - bm25_scores.min() + 1e-8)
-            # Combine scores
             combined_scores = semantic_weight * semantic_scores + (1 - semantic_weight) * bm25_scores
             # Get top results
             top_indices = np.argsort(combined_scores)[::-1][:top_k]
             results = [(chunks[i], float(combined_scores[i])) for i in top_indices]

                 papers = []
                 search_query = query.strip()
+                # Simple query validation and enhancement
                 if not search_query or len(search_query) < 2:
                     logger.warning("Query too short, using default search")
                     search_query = "machine learning"
+                # Enhance transformer-related queries for better results
+                transformer_keywords = ["transformer", "attention", "bert", "gpt", "llm", "language model"]
+                if any(keyword in search_query.lower() for keyword in transformer_keywords):
+                    # Add related terms to improve relevance
+                    enhanced_terms = []
+                    if "attention" in search_query.lower():
+                        enhanced_terms.extend(["self-attention", "multi-head attention", "scaled dot-product"])
+                    if "transformer" in search_query.lower():
+                        enhanced_terms.extend(["encoder", "decoder", "positional encoding"])
+                    if enhanced_terms:
+                        search_query = f"({search_query}) OR ({' OR '.join(enhanced_terms)})"
                 if categories and len(categories) > 0:
                     category_filter = " OR ".join([f"cat:{cat.strip()}" for cat in categories if cat.strip()])
                     if category_filter:
                 logger.info(f"🔍 ArXiv search attempt {attempt + 1}: '{search_query}'")
                 # Create search with timeout and retry settings
+                # Use relevance sorting for better results, but mix with recent papers
                 search = arxiv.Search(
                     query=search_query,
                     max_results=min(max_results, 50),  # Limit to prevent API issues
             bm25_scores = bm25_scores[:min_length]
             chunks = self.chunks[:min_length]
+            # Normalize scores properly to [0, 1] range
+            if len(semantic_scores) > 0 and semantic_scores.max() > semantic_scores.min():
+                semantic_scores = (semantic_scores - semantic_scores.min()) / (semantic_scores.max() - semantic_scores.min())
+            else:
+                semantic_scores = np.ones_like(semantic_scores) * 0.5
+            if len(bm25_scores) > 0 and bm25_scores.max() > bm25_scores.min():
+                bm25_scores = (bm25_scores - bm25_scores.min()) / (bm25_scores.max() - bm25_scores.min())
+            else:
+                bm25_scores = np.ones_like(bm25_scores) * 0.5
+            # Combine scores (both should be in [0, 1] range now)
             combined_scores = semantic_weight * semantic_scores + (1 - semantic_weight) * bm25_scores
+            # Ensure final scores are positive
+            combined_scores = np.maximum(combined_scores, 0.0)
             # Get top results
             top_indices = np.argsort(combined_scores)[::-1][:top_k]
             results = [(chunks[i], float(combined_scores[i])) for i in top_indices]