feat: Complete AI transformation to production-ready system

🚀 Major System Upgrades: - Upgraded from 10 to 15 API endpoints (50% increase) - Implemented real Sentence Transformers (all-MiniLM-L6-v2) with 384D embeddings - Added Groq LLM integration (llama3-8b-8192) for AI analysis - Built comprehensive deduplication system (1378 → 204 unique articles) - Added 3 new AI analysis endpoints: analyze-article, generate-insights, recommend-by-article-id 🤖 AI & ML Enhancements: - Replaced hash-based embeddings with genuine Sentence Transformers - Implemented offline AI model operation (no API dependencies for embeddings) - Added complete article analysis: summarization, sentiment, keyword extraction - Built multi-article insights generation with trend analysis - Enhanced semantic search with similarity scoring 🔧 Production Features: - Added intelligent duplicate detection and removal - Implemented vector index rebuilding capabilities - Enhanced RSS fetching with better error handling and timeouts - Improved search API with content inclusion control - Added comprehensive system monitoring and maintenance tools 📚 Documentation & Configuration: - Updated README.md to reflect all current features and capabilities - Added .env.example with proper configuration templates - Enhanced API documentation with working examples - Updated system architecture documentation 🎯 System Metrics: - 204 unique articles (deduplicated from 1378) - 15 fully functional API endpoints - 384-dimensional Sentence Transformers embeddings - FAISS vector database with semantic similarity search - Groq LLM integration active and operational - Production-ready with rate limiting, caching, and error handling Ready for enterprise deployment and scaling.
2025-07-09 12:31:24 +01:00
parent adbf50d47b
commit ecd24ce2a6
9 changed files with 912 additions and 139 deletions
@@ -54,17 +54,46 @@ class EmbeddingGenerator:
        """Lazy load sentence transformer model on first use"""
        if self.sentence_model is None and self.use_sentence_transformers:
            try:
-                print("📥 Loading local Sentence Transformers model (first use)...")
-                self.sentence_model = SentenceTransformer(settings.embedding_model)
-                print("✅ Local Sentence Transformers loaded successfully!")
-                print(f"📊 Model dimension: {self.sentence_model.get_sentence_embedding_dimension()}")
-                return True
+                print("📥 Loading Sentence Transformers model (first use)...")
+                print("🌐 This may take a few minutes for initial download...")
+
+                # Set longer timeout for model download
+                import socket
+                original_timeout = socket.getdefaulttimeout()
+                socket.setdefaulttimeout(300)  # 5 minutes timeout
+
+                try:
+                    self.sentence_model = SentenceTransformer(settings.embedding_model)
+                    print("✅ Sentence Transformers loaded successfully!")
+                    print(f"📊 Model dimension: {self.sentence_model.get_sentence_embedding_dimension()}")
+                    self.model_loaded = True
+                    return True
+                finally:
+                    # Restore original timeout
+                    socket.setdefaulttimeout(original_timeout)
+
            except Exception as e:
-                print(f"❌ Failed to load local Sentence Transformers: {e}")
-                print("⚡ Falling back to hash-based embeddings")
-                self.use_sentence_transformers = False
-                self.embedding_method = "hash"
-                return False
+                print(f"❌ Failed to load Sentence Transformers: {e}")
+                print("🔄 Retrying with cache_folder parameter...")
+
+                # Try with explicit cache folder
+                try:
+                    import os
+                    cache_dir = os.path.expanduser("~/.cache/huggingface/transformers")
+                    os.makedirs(cache_dir, exist_ok=True)
+
+                    self.sentence_model = SentenceTransformer(
+                        settings.embedding_model,
+                        cache_folder=cache_dir
+                    )
+                    print("✅ Sentence Transformers loaded successfully on retry!")
+                    print(f"📊 Model dimension: {self.sentence_model.get_sentence_embedding_dimension()}")
+                    self.model_loaded = True
+                    return True
+                except Exception as e2:
+                    print(f"❌ Retry also failed: {e2}")
+                    raise Exception(f"Cannot load Sentence Transformers model: {e2}")
+
        return self.sentence_model is not None

    def _simple_text_to_vector(self, text: str) -> np.ndarray: