Spaces:
Sleeping
Sleeping
Upload 8 files
Browse files- requirements.txt +0 -5
- ultra_lightweight_llm.py +92 -0
- venue_ai_complete.py +31 -47
requirements.txt
CHANGED
|
@@ -4,8 +4,3 @@ numpy>=1.24.0
|
|
| 4 |
geopy>=2.3.0
|
| 5 |
scikit-learn>=1.3.0
|
| 6 |
regex>=2023.6.3
|
| 7 |
-
huggingface_hub>=0.20.0
|
| 8 |
-
transformers>=4.35.0
|
| 9 |
-
torch>=2.0.0
|
| 10 |
-
accelerate>=0.20.0
|
| 11 |
-
bitsandbytes>=0.41.0
|
|
|
|
| 4 |
geopy>=2.3.0
|
| 5 |
scikit-learn>=1.3.0
|
| 6 |
regex>=2023.6.3
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
ultra_lightweight_llm.py
ADDED
|
@@ -0,0 +1,92 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import logging
from typing import Optional

# Catalog of ultra-lightweight model profiles, all smaller than TinyLlama
# (1.1B). Keys are short selector names; each value records the Hugging Face
# repo id plus an approximate parameter count and memory footprint.
# NOTE(review): sizes/memory figures are informational labels only — nothing
# in this module loads the weights.
ULTRA_LIGHTWEIGHT_MODELS = {
    # MobiLlama 0.5B - 60% smaller than TinyLlama, shared-FFN architecture
    "mobillama": {
        "model_name": "mbzuai-oryx/MobiLlama-05B-Chat",
        "size": "0.5B",
        "memory": "~1.5GB",
        "description": "Shared FFN design, very efficient",
    },
    # GPT-2 base - a classic, far smaller option
    "gpt2": {
        "model_name": "gpt2",  # 124M parameters
        "size": "124M",
        "memory": "~500MB",
        "description": "Classic, very small, fast",
    },
    # Sum-small - extremely tiny summarization model
    "sum_small": {
        "model_name": "omi-health/sum-small",
        "size": "~100M",
        "memory": "~400MB",
        "description": "Ultra-compact summarization model",
    },
}
|
| 30 |
+
|
| 31 |
+
class UltraLightweightLLM:
    """Template-based conversational helper tuned for HF Spaces.

    Despite the name, no model weights are ever loaded: ``setup_model``
    always selects the template mode so responses stay sub-second. The
    ``model_choice`` argument only picks which profile from
    ``ULTRA_LIGHTWEIGHT_MODELS`` is reported in the logs.
    """

    def __init__(self, model_choice="gpt2"):
        self.model_choice = model_choice
        self.model = None
        self.tokenizer = None
        # Unknown choices silently fall back to the gpt2 profile.
        self.model_info = ULTRA_LIGHTWEIGHT_MODELS.get(
            model_choice, ULTRA_LIGHTWEIGHT_MODELS["gpt2"]
        )
        self.setup_model()

    def setup_model(self):
        """Activate template mode; no download or model loading happens."""
        try:
            # For HF Spaces we use template-based responses to avoid any
            # model loading. This ensures sub-second response times.
            logging.info("Ultra-lightweight mode: Using template responses for optimal HF Spaces performance")
            logging.info(f"Selected model profile: {self.model_info['description']} ({self.model_info['size']})")
            self.model = "template_based"  # Flag for template mode
        except Exception as e:
            logging.warning(f"Model setup failed, using template mode: {e}")
            self.model = "template_based"

    def generate_response(self, venue_context, user_query, max_length=200):
        """Return an ultra-fast canned response chosen from *user_query*.

        Args:
            venue_context: Unused here; accepted for interface compatibility
                with model-backed generators.
            user_query: Free-text user message; matched case-insensitively.
            max_length: Unused; reserved for model-backed implementations.

        Returns:
            A fixed English response string for the first matching intent
            (greeting, thanks, pub/bar, restaurant, cafe, known district),
            or a generic help message.
        """
        if not self.model:
            return "I can help you find venues in Yerevan! Please specify what type of place you're looking for."

        query_lower = user_query.lower()
        # BUGFIX: match whole words instead of raw substrings. Previously
        # 'hi' matched "chinese", 'pub' matched "republic", and 'bar'
        # matched "barbecue", routing such queries to the wrong template.
        words = {w.strip(".,!?;:'\"") for w in query_lower.split()}

        # Greeting responses. 'good' alone is too broad ("good pubs"), so it
        # only counts as a greeting in "good morning/afternoon/evening/day".
        if words & {'hello', 'hi', 'hey'} or query_lower.startswith(
            ('good morning', 'good afternoon', 'good evening', 'good day')
        ):
            return "Hello! I'm your Yerevan venue assistant. I can help you find great pubs, bars, restaurants, and cafes in Yerevan. What are you looking for today?"

        # Thank-you responses ('thank', 'thanks', 'thankyou', ...).
        if any(w.startswith('thank') for w in words):
            return "You're welcome! I'm here to help you discover the best venues in Yerevan. Feel free to ask for more recommendations!"

        # Venue-specific quick responses (singular and plural forms).
        if words & {'pub', 'pubs', 'bar', 'bars'}:
            return "Great choice! Yerevan has amazing pubs and bars. I can help you find places with craft beer, live music, outdoor seating, or cozy atmospheres. Any specific preferences?"

        if words & {'restaurant', 'restaurants', 'food'}:
            return "Yerevan's restaurant scene is fantastic! From traditional Armenian cuisine to international options, I can help you find the perfect dining spot. What type of cuisine interests you?"

        if words & {'cafe', 'cafes', 'coffee'}:
            return "Yerevan has wonderful cafes! Whether you want a quiet study spot, artisanal coffee, or a place to meet friends, I can suggest great options. Any location preferences?"

        # Location-based responses for well-known Yerevan districts.
        if words & {'opera', 'republic', 'cascade', 'northern'}:
            return "Excellent area choice! That's one of Yerevan's most vibrant districts with lots of great venues nearby. Let me help you find specific recommendations in that area."

        # Default helpful response.
        return "I'm here to help you discover Yerevan's best venues! Tell me what you're looking for - pubs, restaurants, cafes, or something specific, and I'll provide personalized recommendations."
|
| 84 |
+
|
| 85 |
+
def get_model_info():
    """Report the active response mode plus the available model profiles."""
    info = {
        "current_mode": "Ultra-lightweight template system",
        "response_time": "~100ms",
        "memory_usage": "~50MB",
        "models_available": ULTRA_LIGHTWEIGHT_MODELS,
    }
    return info
|
venue_ai_complete.py
CHANGED
|
@@ -30,13 +30,14 @@ except Exception as e:
|
|
| 30 |
from lightweight_rag import LightweightRAGEnhancer
|
| 31 |
|
| 32 |
|
|
|
|
| 33 |
try:
|
| 34 |
-
from
|
| 35 |
-
|
| 36 |
-
logger.info("
|
| 37 |
except ImportError as e:
|
| 38 |
-
logger.warning(f"
|
| 39 |
-
|
| 40 |
|
| 41 |
class CompleteYerevanVenueAI:
|
| 42 |
"""
|
|
@@ -765,12 +766,19 @@ class CompleteYerevanVenueAI:
|
|
| 765 |
armenian_category = category_map.get(category, category)
|
| 766 |
info_parts.append(f"🏷️ {armenian_category}")
|
| 767 |
|
| 768 |
-
# Add metadata features
|
| 769 |
features = []
|
| 770 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 771 |
if venue.get('serves_cocktails'): features.append("կոկտեյլ")
|
| 772 |
if venue.get('live_music'): features.append("կենդանի երաժշտություն")
|
| 773 |
if venue.get('outdoor_seating'): features.append("բացօթյա նստարան")
|
|
|
|
|
|
|
|
|
|
| 774 |
if features:
|
| 775 |
info_parts.append(f"✨ {', '.join(features)}")
|
| 776 |
|
|
@@ -803,14 +811,19 @@ class CompleteYerevanVenueAI:
|
|
| 803 |
if venue.get('category'):
|
| 804 |
info_parts.append(f"🏷️ {venue['category']}")
|
| 805 |
|
| 806 |
-
# Add metadata features
|
| 807 |
features = []
|
| 808 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 809 |
if venue.get('serves_cocktails'): features.append("cocktails")
|
| 810 |
if venue.get('live_music'): features.append("live music")
|
| 811 |
if venue.get('outdoor_seating'): features.append("outdoor seating")
|
| 812 |
if venue.get('good_for_date_night'): features.append("romantic")
|
| 813 |
if venue.get('good_for_groups'): features.append("good for groups")
|
|
|
|
| 814 |
if features:
|
| 815 |
info_parts.append(f"✨ {', '.join(features)}")
|
| 816 |
|
|
@@ -866,8 +879,8 @@ class CompleteYerevanVenueAI:
|
|
| 866 |
# Handle venue queries with the existing logic
|
| 867 |
location_context = self._extract_enhanced_location_context(user_query)
|
| 868 |
|
| 869 |
-
# Perform venue search
|
| 870 |
-
venues = self._smart_venue_search(user_query, top_k=
|
| 871 |
|
| 872 |
# Filter venues
|
| 873 |
filtered_venues = self._filter_venues(venues, min_rating, price_range, max_distance, location_context)
|
|
@@ -890,46 +903,17 @@ class CompleteYerevanVenueAI:
|
|
| 890 |
}
|
| 891 |
|
| 892 |
def _initialize_conversational_llm(self):
|
| 893 |
-
"""Initialize
|
| 894 |
-
|
| 895 |
-
if LIGHTWEIGHT_LLM_AVAILABLE:
|
| 896 |
try:
|
| 897 |
-
logger.info("Initializing lightweight conversational
|
| 898 |
-
self.conversational_llm =
|
| 899 |
-
logger.info("Successfully initialized lightweight conversational
|
| 900 |
return
|
| 901 |
except Exception as e:
|
| 902 |
-
logger.warning(f"Failed to initialize lightweight LLM: {e}")
|
| 903 |
-
|
| 904 |
-
# Legacy llama-cpp fallback (if available)
|
| 905 |
-
if LLAMA_CPP_AVAILABLE:
|
| 906 |
-
try:
|
| 907 |
-
from huggingface_hub import hf_hub_download
|
| 908 |
-
logger.info("Downloading TinyLlama model from Hugging Face Hub...")
|
| 909 |
-
|
| 910 |
-
model_path = hf_hub_download(
|
| 911 |
-
repo_id="TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF",
|
| 912 |
-
filename="tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf",
|
| 913 |
-
cache_dir="./model_cache"
|
| 914 |
-
)
|
| 915 |
-
|
| 916 |
-
from llama_cpp import Llama
|
| 917 |
-
self.conversational_llm = Llama(
|
| 918 |
-
model_path=model_path,
|
| 919 |
-
n_ctx=1024,
|
| 920 |
-
n_threads=2,
|
| 921 |
-
n_gpu_layers=0,
|
| 922 |
-
verbose=False,
|
| 923 |
-
use_mmap=True,
|
| 924 |
-
use_mlock=False
|
| 925 |
-
)
|
| 926 |
-
logger.info("Successfully loaded legacy TinyLlama model")
|
| 927 |
-
return
|
| 928 |
-
|
| 929 |
-
except Exception as e:
|
| 930 |
-
logger.warning(f"Failed to initialize legacy conversational LLM: {e}")
|
| 931 |
|
| 932 |
-
logger.info("
|
| 933 |
self.conversational_llm = None
|
| 934 |
|
| 935 |
def _add_to_conversation_history(self, user_message: str, ai_response: str):
|
|
|
|
| 30 |
from lightweight_rag import LightweightRAGEnhancer
|
| 31 |
|
| 32 |
|
| 33 |
+
# Ultra-lightweight LLM for optimal HF Spaces performance
|
| 34 |
try:
|
| 35 |
+
from ultra_lightweight_llm import UltraLightweightLLM
|
| 36 |
+
ULTRA_LIGHTWEIGHT_LLM_AVAILABLE = True
|
| 37 |
+
logger.info("Ultra-lightweight LLM available for optimal performance")
|
| 38 |
except ImportError as e:
|
| 39 |
+
logger.warning(f"Ultra-lightweight LLM not available: {e}")
|
| 40 |
+
ULTRA_LIGHTWEIGHT_LLM_AVAILABLE = False
|
| 41 |
|
| 42 |
class CompleteYerevanVenueAI:
|
| 43 |
"""
|
|
|
|
| 766 |
armenian_category = category_map.get(category, category)
|
| 767 |
info_parts.append(f"🏷️ {armenian_category}")
|
| 768 |
|
| 769 |
+
# Add metadata features (skip common ones for pubs/bars)
|
| 770 |
features = []
|
| 771 |
+
venue_category = venue.get('category', '').lower()
|
| 772 |
+
|
| 773 |
+
# Only show beer for non-pub/bar venues
|
| 774 |
+
if venue.get('serves_beer') and venue_category not in ['pub', 'bar']:
|
| 775 |
+
features.append("գարեջուր")
|
| 776 |
if venue.get('serves_cocktails'): features.append("կոկտեյլ")
|
| 777 |
if venue.get('live_music'): features.append("կենդանի երաժշտություն")
|
| 778 |
if venue.get('outdoor_seating'): features.append("բացօթյա նստարան")
|
| 779 |
+
if venue.get('good_for_date_night'): features.append("ռոմանտիկ")
|
| 780 |
+
if venue.get('good_for_groups'): features.append("խմբերի համար")
|
| 781 |
+
|
| 782 |
if features:
|
| 783 |
info_parts.append(f"✨ {', '.join(features)}")
|
| 784 |
|
|
|
|
| 811 |
if venue.get('category'):
|
| 812 |
info_parts.append(f"🏷️ {venue['category']}")
|
| 813 |
|
| 814 |
+
# Add metadata features (skip common ones for pubs/bars)
|
| 815 |
features = []
|
| 816 |
+
venue_category = venue.get('category', '').lower()
|
| 817 |
+
|
| 818 |
+
# Only show beer for non-pub/bar venues
|
| 819 |
+
if venue.get('serves_beer') and venue_category not in ['pub', 'bar']:
|
| 820 |
+
features.append("serves beer")
|
| 821 |
if venue.get('serves_cocktails'): features.append("cocktails")
|
| 822 |
if venue.get('live_music'): features.append("live music")
|
| 823 |
if venue.get('outdoor_seating'): features.append("outdoor seating")
|
| 824 |
if venue.get('good_for_date_night'): features.append("romantic")
|
| 825 |
if venue.get('good_for_groups'): features.append("good for groups")
|
| 826 |
+
|
| 827 |
if features:
|
| 828 |
info_parts.append(f"✨ {', '.join(features)}")
|
| 829 |
|
|
|
|
| 879 |
# Handle venue queries with the existing logic
|
| 880 |
location_context = self._extract_enhanced_location_context(user_query)
|
| 881 |
|
| 882 |
+
# Perform venue search (full search for comprehensive results)
|
| 883 |
+
venues = self._smart_venue_search(user_query, top_k=100)
|
| 884 |
|
| 885 |
# Filter venues
|
| 886 |
filtered_venues = self._filter_venues(venues, min_rating, price_range, max_distance, location_context)
|
|
|
|
| 903 |
}
|
| 904 |
|
| 905 |
def _initialize_conversational_llm(self):
    """Initialize ultra-lightweight conversational system"""
    # Prefer the ultra-lightweight helper when its module imported cleanly.
    if ULTRA_LIGHTWEIGHT_LLM_AVAILABLE:
        try:
            logger.info("Initializing ultra-lightweight conversational system...")
            self.conversational_llm = UltraLightweightLLM()
            logger.info("Successfully initialized ultra-lightweight conversational system")
            return
        except Exception as exc:
            logger.warning(f"Failed to initialize ultra-lightweight LLM: {exc}")

    # Fallback: no LLM object at all; callers use template-based responses.
    logger.info("Using template-based responses for optimal performance")
    self.conversational_llm = None
|