Spaces:

Nexari-Research
/

Nexari-Server

Sleeping

App Files Files Community

Nexari-Research committed 23 days ago

Commit

aebecbc

verified ·

1 Parent(s): 853b07e

Update tools_engine.py

Browse files

Files changed (1) hide show

tools_engine.py +62 -35

tools_engine.py CHANGED Viewed

@@ -1,74 +1,101 @@
 """
-Nexari Tools Engine (Smart Override Edition)
 Author: Piyush
-Description: Prevents silly mistakes on short messages by using a 'Hardcoded Logic Layer' before the Neural Network.
 """
 from duckduckgo_search import DDGS
 from transformers import pipeline
 # Log to stdout that the classifier load is starting.
 print(">>> Tools: Loading Intent Classification Model...")
 # Module-level zero-shot-classification pipeline, created when this module is
 # imported; analyze_intent() passes it the user text and the candidate labels.
 intent_classifier = pipeline("zero-shot-classification", model="typeform/distilbert-base-uncased-mnli")
 def analyze_intent(user_text):
     """
     Classify a user message into one of the routing intents.

     A hardcoded greeting/identity check runs first so that short messages
     such as "hi" never reach the zero-shot model. Everything else is scored
     by the module-level ``intent_classifier`` against the candidate labels.

     Args:
         user_text: Raw message from the user. ``None``, non-string and
             blank input are treated as general conversation.

     Returns:
         One of "internet search", "general conversation", "coding request"
         or "checking time". "general conversation" is the fallback when the
         top score is not above 0.5 or the classifier raises.
     """
     fallback = "general conversation"

     # Nothing to classify: avoid calling .lower() on None / non-strings.
     if not isinstance(user_text, str):
         return fallback
     text_lower = user_text.lower().strip()
     if not text_lower:
         return fallback

     # === LAYER 1: HARDCODED SAFETY (the fix for 'Hi' -> searching) ===
     # If the user is only greeting us or asking who we are, skip the model
     # and go straight to chat.
     direct_chat_triggers = ("hi", "hello", "hey", "hlo", "hola", "namaste", "what is your name", "who are you")
     for trigger in direct_chat_triggers:
         if not text_lower.startswith(trigger):
             continue
         # Require a word boundary after the trigger: "hi", "hi there",
         # "hi!" and "who are you?" match, "history of rome" does not.
         tail = text_lower[len(trigger):]
         if not tail or not tail[0].isalnum():
             print(">>> Brain Override: Detected Greeting/Identity -> Force 'general conversation'")
             return fallback

     # === LAYER 2: NEURAL NETWORK DECISION ===
     candidate_labels = [
         "internet search",
         "general conversation",
         "coding request",
         "checking time"
     ]
     try:
         result = intent_classifier(user_text, candidate_labels)
         top_intent = result['labels'][0]
         confidence = result['scores'][0]
         print(f">>> Brain: Detected '{top_intent}' ({confidence:.2f})")
         # Threshold was raised from 0.4 to 0.5 so that weak guesses do not
         # trigger a wrong search.
         if confidence > 0.5:
             return top_intent
     except Exception as e:
         # Deliberate best-effort: a classifier failure must not break the
         # chat flow, so log it and fall back.
         print(f"Intent Error: {e}")
     return fallback
def perform_web_search(user_text, max_results=3):
    """
    Run a web search for the user's message and return it as prompt context.

    Command phrases such as "search for" are stripped from the message before
    it is sent to DuckDuckGo through ``DDGS().text``.

    Args:
        user_text: Raw message from the user. ``None``, non-string and blank
            input return "" without searching.
        max_results: Maximum number of results to request (default 3).

    Returns:
        A "### WEB DATA ###" block with one "- title: body" line per result,
        or "" when there is nothing to search for, no results came back, or
        the search raised.
    """
    # Local import keeps this block self-contained.
    import re

    if not isinstance(user_text, str) or not user_text.strip():
        return ""
    try:
        remove_phrases = ["search for", "google", "find", "tell me about", "latest info on", "news about"]
        # Remove command phrases only as whole words; a plain substring
        # replace would turn "findings" into "ings".
        command_pattern = r"\b(?:" + "|".join(re.escape(p) for p in remove_phrases) + r")\b"
        stripped = re.sub(command_pattern, " ", user_text.lower())
        # Collapse the gaps left behind by the removed phrases.
        clean_query = " ".join(stripped.split())
        if len(clean_query) < 2:
            # The message was nothing but command words; search it verbatim.
            clean_query = user_text
        print(f">>> Action: Searching Web for '{clean_query}'...")
        # Materialise the results: a lazy iterator is always truthy, which
        # would produce an empty "WEB DATA" block when nothing was found.
        results = list(DDGS().text(clean_query, max_results=max_results) or [])
        if results:
            lines = []
            for r in results:
                # Tolerate a missing or None field instead of letting one bad
                # entry discard every result via the except below.
                title = r.get('title') or ''
                body = r.get('body') or ''
                lines.append(f"- {title}: {body}")
            summary = "\n".join(lines)
            return f"### WEB DATA ###\n{summary}\nINSTRUCTION: Answer based on this data."
        return ""
    except Exception as e:
        # Deliberate best-effort: a failed search degrades to "no web data".
        print(f"Search Error: {e}")
        return ""

 """
+Nexari Tools Engine (UPDATED)
 Author: Piyush
+Improvements:
+ - Canonical intent labels returned
+ - More robust greeting detection
+ - Safer web search formatting
+ - Defensive error handling
 """
 from duckduckgo_search import DDGS
 from transformers import pipeline
+import re
 # Log to stdout that the classifier load is starting.
 print(">>> Tools: Loading Intent Classification Model...")
+# zero-shot pipeline; if heavy, Docker predownload already handles it
 # Created when this module is imported; analyze_intent() passes it the user
 # text and the candidate labels.
 intent_classifier = pipeline("zero-shot-classification", model="typeform/distilbert-base-uncased-mnli")
 def analyze_intent(user_text):
     """
     Classify a user message and return a canonical intent label.

     A hardcoded greeting/identity check runs first so that short messages
     such as "hi" never reach the zero-shot model. Everything else is scored
     by the module-level ``intent_classifier`` and the winning label is
     mapped to its canonical form.

     Args:
         user_text: Raw message from the user. ``None``, non-string and
             blank input are treated as "general".

     Returns:
         One of:
           - "internet_search"
           - "coding_request"
           - "checking_time"
           - "general"
         "general" is the fallback when the top score is not above 0.5, the
         label is unknown, or the classifier raises.
     """
     # Nothing to classify: avoid calling .lower() on None / non-strings and
     # do not send whitespace-only text to the model.
     if not isinstance(user_text, str):
         return "general"
     text_lower = user_text.lower().strip()
     if not text_lower:
         return "general"

     # === HARDCODED SAFETY (Greeting/Identity) ===
     direct_chat_triggers = (
         "hi", "hello", "hey", "hlo", "hola", "namaste",
         "what is your name", "who are you", "who r you", "your name",
     )
     for trigger in direct_chat_triggers:
         if not text_lower.startswith(trigger):
             continue
         # Require a word boundary after the trigger: "hi", "hi there",
         # "hi!" and "who are you?" match, "history of rome" does not.
         tail = text_lower[len(trigger):]
         if not tail or not tail[0].isalnum():
             print(">>> Brain Override: Detected Greeting/Identity -> Force 'general'")
             return "general"

     # === ZERO-SHOT PASS ===
     # Single source of truth: the keys are the labels shown to the model,
     # the values are the canonical labels returned to callers.
     label_to_intent = {
         "internet search": "internet_search",
         "general conversation": "general",
         "coding request": "coding_request",
         "checking time": "checking_time",
     }
     try:
         result = intent_classifier(user_text, list(label_to_intent))
         top_label = result['labels'][0]
         confidence = result['scores'][0]
         print(f">>> Brain: Detected '{top_label}' ({confidence:.2f})")
         if confidence > 0.5:
             return label_to_intent.get(top_label, "general")
     except Exception as e:
         # Deliberate best-effort: a classifier failure must not break the
         # chat flow, so log it and fall back.
         print(f"Intent Error: {e}")
     return "general"
def perform_web_search(user_text, max_results=3):
    """
    Execute a brief web search and return a compact summary.

    Command phrases such as "search for" are stripped from the message before
    it is sent to DuckDuckGo through ``DDGS().text``. Each result body is
    whitespace-normalised and cut to roughly 250 characters.

    Args:
        user_text: Raw message from the user. ``None``, non-string and blank
            input return "" without searching.
        max_results: Maximum number of results to request (default 3).

    Returns:
        A "### WEB DATA (short) ###" block with one "- title: body" line per
        usable result, or "" when there is nothing to search for, no usable
        results came back, or the search raised.
    """
    if not isinstance(user_text, str) or not user_text.strip():
        return ""
    try:
        remove_phrases = ["search for", "google", "find", "tell me about", "latest info on", "news about", "lookup"]
        # Remove command phrases only as whole words; a plain substring
        # replace would turn "pathfinder" into "pather".
        command_pattern = r"\b(?:" + "|".join(map(re.escape, remove_phrases)) + r")\b"
        stripped = re.sub(command_pattern, " ", user_text.lower())
        # Collapse the gaps left behind by the removed phrases.
        clean_query = " ".join(stripped.split())
        if len(clean_query) < 2:
            # The message was nothing but command words; search it verbatim.
            clean_query = user_text
        print(f">>> Action: Searching Web for '{clean_query}'...")
        results = list(DDGS().text(clean_query, max_results=max_results) or [])
        parts = []
        for r in results:
            # A key can be present with a None value; `or ''` stops one bad
            # entry from discarding every result via the except below.
            title = (r.get('title') or '').strip()
            body = re.sub(r'\s+', ' ', (r.get('body') or '').strip())
            if not title and not body:
                continue
            # Keep it short: cut at the last word boundary before 250 chars.
            if len(body) > 250:
                body = body[:250].rsplit(' ', 1)[0] + "..."
            parts.append(f"- {title}: {body}")
        if parts:
            summary = "\n".join(parts)
            return f"### WEB DATA (short) ###\n{summary}\nINSTRUCTION: Use this to inform the answer; prefer concise synthesis."
        return ""
    except Exception as e:
        # Deliberate best-effort: a failed search degrades to "no web data".
        print(f"Search Error: {e}")
        return ""