TaimoorKhan10
diff --git a/docs/assets/generate_charts.py b/docs/assets/generate_charts.py
Lines changed: 353 additions & 182 deletions
diff --git a/examples/basic_query_example.py b/examples/basic_query_example.py
Lines changed: 19 additions & 23 deletions
diff --git a/examples/document_indexing_example.py b/examples/document_indexing_example.py
Lines changed: 18 additions & 19 deletions
@@ -14,57 +14,53 @@
 
 from src.enterprise_rag import RAGSystem
 
+
 def main():
     """Run a basic query example."""
-    
+
     # Initialize the RAG system with a basic configuration
     rag_system = RAGSystem(
         vector_store_config={
             "type": "faiss",
             "index_path": "data/index",
-            "embedding_model": "sentence-transformers/all-mpnet-base-v2"
-        },
-        retrieval_config={
-            "type": "hybrid",
-            "top_k": 5,
-            "use_reranker": True
+            "embedding_model": "sentence-transformers/all-mpnet-base-v2",
         },
+        retrieval_config={"type": "hybrid", "top_k": 5, "use_reranker": True},
         generation_config={
             "model": "gpt-3.5-turbo",
             "temperature": 0.7,
-            "max_tokens": 500
-        }
+            "max_tokens": 500,
+        },
     )
-    
+
     # Define your query
-    query = "What are the key benefits of using a RAG system for enterprise applications?"
-    
+    query = (
+        "What are the key benefits of using a RAG system for enterprise applications?"
+    )
+
     # Optional query parameters
     query_options = {
         "filters": {
             "metadata.doc_type": "pdf",  # Optional filter by document type
-            "metadata.date": {"$gt": "2022-01-01"}  # Filter by date
+            "metadata.date": {"$gt": "2022-01-01"},  # Filter by date
         },
-        "retrieval_options": {
-            "use_semantic": True,
-            "use_keyword": True
-        }
+        "retrieval_options": {"use_semantic": True, "use_keyword": True},
     }
-    
+
     # Execute the query
     print(f"Querying: '{query}'")
-    
+
     response = rag_system.query(query, options=query_options)
-    
+
     # Print the results
     print("\n----- ANSWER -----")
     print(response["answer"])
-    
+
     print("\n----- SOURCES -----")
     for i, source in enumerate(response["sources"], 1):
         print(f"{i}. {source['title']} (score: {source['score']:.3f})")
         print(f"   Snippet: {source['text'][:150]}...")
-    
+
     # Print performance metrics
     print("\n----- PERFORMANCE METRICS -----")
     for key, value in response["metrics"].items():
@@ -80,5 +76,5 @@ def main():
         print("WARNING: OPENAI_API_KEY environment variable is not set.")
         print("Set it with: export OPENAI_API_KEY=your_api_key_here")
         print("For this example, using a mock response instead.\n")
-    
+
     main()
@@ -23,27 +23,28 @@
 from src.enterprise_rag import RAGSystem
 from src.document_processing.processor import DocumentProcessor
 
+
 def main():
     """Run a document indexing example."""
-    
+
     # Initialize the RAG system
     rag_system = RAGSystem(
         vector_store_config={
             "type": "faiss",
             "index_path": "data/index",
-            "embedding_model": "sentence-transformers/all-mpnet-base-v2"
+            "embedding_model": "sentence-transformers/all-mpnet-base-v2",
         }
     )
-    
+
     # Define document paths (replace with your actual documents)
     documents_dir = Path("examples/sample_documents")
     if not documents_dir.exists():
         logger.warning(f"Sample documents directory not found: {documents_dir}")
         logger.info("Creating sample documents directory and a sample text file")
-        
+
         # Create directory
         documents_dir.mkdir(parents=True, exist_ok=True)
-        
+
         # Create a sample text file
         sample_text = """
         # Enterprise-Ready RAG System
@@ -68,43 +69,41 @@ def main():
            
         5. **Cost Efficiency**: More efficient than fine-tuning large models on domain-specific data.
         """
-        
+
         with open(documents_dir / "rag_overview.txt", "w", encoding="utf-8") as f:
             f.write(sample_text)
-    
+
     # Process documents
     document_processor = DocumentProcessor(
-        chunking_strategy="recursive",
-        chunk_size=1000,
-        chunk_overlap=200
+        chunking_strategy="recursive", chunk_size=1000, chunk_overlap=200
     )
-    
+
     # Find documents
     document_paths = list(documents_dir.glob("**/*.*"))
     logger.info(f"Found {len(document_paths)} documents to process")
-    
+
     # Process and index documents
     for doc_path in document_paths:
         try:
             logger.info(f"Processing document: {doc_path}")
-            
+
             # Process document into chunks
             doc_chunks = document_processor.process_document(str(doc_path))
-            
+
             logger.info(f"Created {len(doc_chunks)} chunks from {doc_path.name}")
-            
+
             # Add document chunks to RAG system
             doc_ids = rag_system.add_documents(doc_chunks)
-            
+
             logger.info(f"Indexed document with {len(doc_ids)} chunks")
-            
+
         except Exception as e:
             logger.error(f"Error processing document {doc_path}: {str(e)}")
-    
+
     # Save the index
     rag_system.save_index()
     logger.info(f"Index saved to {rag_system.vector_store.index_path}")
-    
+
     # Print statistics
     stats = rag_system.get_stats()
     print("\n----- INDEX STATISTICS -----")