amitbhatt6075 commited on
Commit
5ac001d
Β·
1 Parent(s): 4f2c694

Added Community AI Module: Toxicity Check and Smart Tagging

Browse files
Files changed (2) hide show
  1. api/main.py +86 -36
  2. core/community_brain.py +114 -0
api/main.py CHANGED
@@ -30,6 +30,7 @@ from core.utils import get_supabase_client, extract_colors_from_url
30
  from core.document_parser import parse_pdf_from_url
31
  from core.creative_chat import CreativeDirector
32
  from core.matcher import load_embedding_model
 
33
 
34
  try:
35
  from core.rag.store import VectorStore
@@ -67,6 +68,7 @@ _likes_predictor = None
67
  _comments_predictor = None
68
  _revenue_forecaster = None
69
  _performance_scorer = None
 
70
 
71
  def to_snake(name: str) -> str:
72
  return re.sub(r'(?<!^)(?=[A-Z])', '_', name).lower()
@@ -150,6 +152,28 @@ class ForecastRequest(BaseModel):
150
  budget: float; category: str; follower_count: int; engagement_rate: float
151
  config: Optional[Dict[str, str]] = None
152
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
153
  # ==========================================================
154
  # 🎯 FIX 2: NOW DEFINE ForecastResponse
155
  # PerformanceForecast and PayoutForecast are already defined above.
@@ -203,10 +227,10 @@ app = FastAPI(title="Reachify AI Service (Deploy-Ready)", version="11.0.0")
203
  @app.on_event("startup")
204
  def startup_event():
205
  # Make sure we can modify the global variables
206
- global _llm_instance, _creative_director, _support_agent, _ai_strategist, _vector_store, \
207
- _budget_predictor, _influencer_matcher, _performance_predictor, _payout_forecaster, \
208
- _earnings_optimizer, _earnings_encoder, _likes_predictor, _comments_predictor, \
209
- _revenue_forecaster, _performance_scorer
210
 
211
  # --- STEP 1: DOWNLOAD AND LOAD THE LLM MODEL ---
212
  print("--- πŸš€ AI Service Starting Up... ---")
@@ -243,10 +267,17 @@ def startup_event():
243
  if VectorStore:
244
  _vector_store = VectorStore()
245
  print(" - RAG Engine Ready.")
 
246
  _ai_strategist = AIStrategist(llm_instance=_llm_instance, store=_vector_store)
 
 
 
 
 
 
247
  _support_agent = SupportAgent(llm_instance=_llm_instance, embedding_path=EMBEDDING_MODEL_PATH, db_path=DB_PATH)
248
 
249
- print(" - βœ… Core AI components (Director, Strategist, Agent) are online.")
250
 
251
  except Exception as e:
252
  print(f" - ❌ FAILED to initialize core AI components: {e}")
@@ -282,6 +313,7 @@ def startup_event():
282
 
283
  print("\n--- βœ… AI Service startup sequence finished! ---")
284
 
 
285
  @app.get("/")
286
  def health_check():
287
  if _llm_instance:
@@ -723,65 +755,44 @@ def analyze_content_quality(request: ContentQualityRequest):
723
 
724
  caption = request.caption
725
 
726
- # This is a very structured prompt that asks the LLM to act as a specialist
727
- # and return a JSON object, which is easier and more reliable to parse.
728
  prompt = f"""
729
  [SYSTEM]
730
- You are a social media expert. Analyze the following caption based on four criteria: Readability, Engagement, Call to Action (CTA), and Hashtag Strategy.
731
- For each criterion, provide a score from 1 (poor) to 10 (excellent).
732
- Also, provide a final overall score (average of the four scores) and short, actionable feedback.
733
- Respond ONLY with a valid JSON object in the following format:
734
- {{
735
- "overall_score": <float>,
736
- "scores": {{
737
- "readability": <int>,
738
- "engagement": <int>,
739
- "call_to_action": <int>,
740
- "hashtag_strategy": <int>
741
- }},
742
- "feedback": "<string>"
743
- }}
744
 
745
  [CAPTION TO ANALYZE]
746
  "{caption}"
747
 
748
  [YOUR JSON RESPONSE]
749
  """
750
-
751
  try:
752
  print("--- Sending caption to LLM for quality analysis...")
753
  response = _llm_instance(prompt, max_tokens=512, temperature=0.2, stop=["[SYSTEM]", "\n\n"], echo=False)
754
 
755
- # Extract the JSON part of the response
756
  json_text = response['choices'][0]['text'].strip()
757
-
758
- # Find the start and end of the JSON object
759
  start_index = json_text.find('{')
760
  end_index = json_text.rfind('}') + 1
 
761
  if start_index == -1 or end_index == 0:
762
  raise ValueError("LLM did not return a valid JSON object.")
763
 
764
  clean_json_text = json_text[start_index:end_index]
765
-
766
  import json
 
 
767
  analysis_result = json.loads(clean_json_text)
768
 
769
  final_result = {
770
- "overall_score": analysis_result_raw.get("overall_score"),
771
- "feedback": analysis_result_raw.get("feedback"),
772
- "scores": analysis_result_raw.get("scores") or analysis_result_raw.get("score")
773
  }
774
 
775
  print("--- Successfully received and parsed JSON response from LLM.")
776
  return ContentQualityResponse(**final_result)
777
 
778
- except (json.JSONDecodeError, KeyError, ValueError) as e:
779
- print(f"🚨 ERROR parsing LLM response: {e}. Raw response was: {json_text}")
780
- raise HTTPException(status_code=500, detail="Failed to parse the analysis from the AI model. The model may have returned an unexpected format.")
781
  except Exception as e:
782
- print(f"🚨 An unexpected error occurred during content analysis: {e}")
783
- traceback.print_exc()
784
- raise HTTPException(status_code=500, detail=str(e))
785
 
786
  @app.post("/rank/campaigns-for-influencer", response_model=RankCampaignsResponse, summary="Ranks a list of campaigns for one influencer")
787
  async def rank_campaigns_for_influencer_route(request: RankCampaignsRequest):
@@ -1663,4 +1674,43 @@ def create_campaign_from_prompt_endpoint(payload: DirectPromptPayload):
1663
  )
1664
  return {"response": response_text}
1665
  except Exception as e:
1666
- raise HTTPException(status_code=500, detail=str(e))
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
30
  from core.document_parser import parse_pdf_from_url
31
  from core.creative_chat import CreativeDirector
32
  from core.matcher import load_embedding_model
33
+ from core.community_brain import CommunityBrain
34
 
35
  try:
36
  from core.rag.store import VectorStore
 
68
  _comments_predictor = None
69
  _revenue_forecaster = None
70
  _performance_scorer = None
71
+ _community_brain: Optional[CommunityBrain] = None
72
 
73
  def to_snake(name: str) -> str:
74
  return re.sub(r'(?<!^)(?=[A-Z])', '_', name).lower()
 
152
  budget: float; category: str; follower_count: int; engagement_rate: float
153
  config: Optional[Dict[str, str]] = None
154
 
155
+
156
# --- COMMUNITY LAYER MODELS ---

class ContentCheckRequest(BaseModel):
    """Payload for the moderate-and-tag endpoint: the raw post text."""
    text: str
    # Optional author identifier; not read by the visible endpoints — presumably
    # for audit/rate-limit use by the caller. TODO confirm intended use.
    user_id: Optional[str] = None

class TagGenerationRequest(BaseModel):
    """Payload for tag generation (post content plus an optional niche hint).

    NOTE(review): not referenced by the endpoints visible in this change —
    confirm whether a dedicated tagging route is planned.
    """
    content: str
    niche: Optional[str] = "General"

class ContentCheckResponse(BaseModel):
    """Combined moderation + tagging result returned to the client."""
    toxicity_score: float
    is_safe: bool
    tags: List[str]

class ThreadSummaryRequest(BaseModel):
    """A list of raw comment strings to be summarized."""
    comments: List[str]
class ThreadSummaryResponse(BaseModel):
    """One-sentence summary of a discussion thread."""
    summary: str
174
+
175
+
176
+
177
  # ==========================================================
178
  # 🎯 FIX 2: NOW DEFINE ForecastResponse
179
  # PerformanceForecast and PayoutForecast are already defined above.
 
227
  @app.on_event("startup")
228
  def startup_event():
229
  # Make sure we can modify the global variables
230
+ global _llm_instance, _creative_director, _support_agent, _ai_strategist, _community_brain, \
231
+ _vector_store, _budget_predictor, _influencer_matcher, _performance_predictor, \
232
+ _payout_forecaster, _earnings_optimizer, _earnings_encoder, _likes_predictor, \
233
+ _comments_predictor, _revenue_forecaster, _performance_scorer
234
 
235
  # --- STEP 1: DOWNLOAD AND LOAD THE LLM MODEL ---
236
  print("--- πŸš€ AI Service Starting Up... ---")
 
267
  if VectorStore:
268
  _vector_store = VectorStore()
269
  print(" - RAG Engine Ready.")
270
+
271
  _ai_strategist = AIStrategist(llm_instance=_llm_instance, store=_vector_store)
272
+
273
+ # πŸ‘‡ NEW: COMMUNITY MODULE INJECTION
274
+ from core.community_brain import CommunityBrain # Late import prevents circular issues
275
+ _community_brain = CommunityBrain(llm_instance=_llm_instance)
276
+ print(" - βœ… Community Brain (Mod/Tags) initialized.")
277
+
278
  _support_agent = SupportAgent(llm_instance=_llm_instance, embedding_path=EMBEDDING_MODEL_PATH, db_path=DB_PATH)
279
 
280
+ print(" - βœ… Core AI components (Director, Strategist, CommunityBrain, Agent) are online.")
281
 
282
  except Exception as e:
283
  print(f" - ❌ FAILED to initialize core AI components: {e}")
 
313
 
314
  print("\n--- βœ… AI Service startup sequence finished! ---")
315
 
316
+
317
  @app.get("/")
318
  def health_check():
319
  if _llm_instance:
 
755
 
756
  caption = request.caption
757
 
 
 
758
  prompt = f"""
759
  [SYSTEM]
760
+ You are a social media expert. Analyze the following caption... Respond ONLY with a valid JSON object.
 
 
 
 
 
 
 
 
 
 
 
 
 
761
 
762
  [CAPTION TO ANALYZE]
763
  "{caption}"
764
 
765
  [YOUR JSON RESPONSE]
766
  """
 
767
  try:
768
  print("--- Sending caption to LLM for quality analysis...")
769
  response = _llm_instance(prompt, max_tokens=512, temperature=0.2, stop=["[SYSTEM]", "\n\n"], echo=False)
770
 
 
771
  json_text = response['choices'][0]['text'].strip()
 
 
772
  start_index = json_text.find('{')
773
  end_index = json_text.rfind('}') + 1
774
+
775
  if start_index == -1 or end_index == 0:
776
  raise ValueError("LLM did not return a valid JSON object.")
777
 
778
  clean_json_text = json_text[start_index:end_index]
 
779
  import json
780
+
781
+ # βœ… Corrected Variable Name
782
  analysis_result = json.loads(clean_json_text)
783
 
784
  final_result = {
785
+ "overall_score": analysis_result.get("overall_score"), # FIXED: Removed _raw
786
+ "feedback": analysis_result.get("feedback"), # FIXED: Removed _raw
787
+ "scores": analysis_result.get("scores") or analysis_result.get("score") # FIXED: Removed _raw
788
  }
789
 
790
  print("--- Successfully received and parsed JSON response from LLM.")
791
  return ContentQualityResponse(**final_result)
792
 
 
 
 
793
  except Exception as e:
794
+ print(f"🚨 Error in Content Quality Analysis: {e}")
795
+ raise HTTPException(status_code=500, detail="Failed to parse analysis.")
 
796
 
797
  @app.post("/rank/campaigns-for-influencer", response_model=RankCampaignsResponse, summary="Ranks a list of campaigns for one influencer")
798
  async def rank_campaigns_for_influencer_route(request: RankCampaignsRequest):
 
1674
  )
1675
  return {"response": response_text}
1676
  except Exception as e:
1677
+ raise HTTPException(status_code=500, detail=str(e))
1678
+
1679
+
1680
+ # ==============================================================
1681
+ # 🧠 COMMUNITY INTELLIGENCE ENDPOINTS
1682
+ # ==============================================================
1683
+
1684
@app.post("/community/moderate-and-tag", response_model=ContentCheckResponse)
def moderate_and_tag(request: ContentCheckRequest):
    """
    Entry point for the 'Post' action: runs the toxicity check on the text
    and, when the content is safe, generates hashtag suggestions in one call.
    """
    print(f"\n🧠 Checking community post content...")

    # Fail open if the community module never came up at startup:
    # report the post as safe with a generic tag rather than erroring.
    if not _community_brain:
        return ContentCheckResponse(toxicity_score=0.0, is_safe=True, tags=["#NewPost"])

    # Step 1: fast moderation pass.
    moderation = _community_brain.moderate_content(request.text)

    # Step 2: hashtag extraction — skipped entirely for flagged content.
    tag_list = _community_brain.generate_smart_tags(request.text) if moderation['is_safe'] else []

    return ContentCheckResponse(
        toxicity_score=moderation['toxicity_score'],
        is_safe=moderation['is_safe'],
        tags=tag_list,
    )
1709
+
1710
@app.post("/community/summarize-discussion", response_model=ThreadSummaryResponse)
def summarize_community_thread(request: ThreadSummaryRequest):
    """Condense a comment thread into a one-line summary via the CommunityBrain."""
    # Module unavailable — return a static placeholder instead of erroring.
    if not _community_brain:
        return ThreadSummaryResponse(summary="Summary unavailable.")
    return ThreadSummaryResponse(summary=_community_brain.summarize_thread(request.comments))
core/community_brain.py ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import re
2
+ import json
3
+ import traceback
4
+ from typing import List, Dict, Any
5
+ from llama_cpp import Llama
6
+
7
class CommunityBrain:
    """LLM-backed helpers for the community feed: toxicity moderation,
    hashtag suggestion, and discussion-thread summarization."""

    # First line of defense: static blacklist, checked instantly with no LLM
    # cost. Extend with Hindi/English terms as needed. Hoisted to a class
    # constant so it is not rebuilt on every moderate_content() call.
    TOXIC_KEYWORDS = (
        "abuse", "kill", "suicide", "hate", "idiot", "scam",
        "hack", "betting", "casino", "stupid", "fuck",
    )

    def __init__(self, llm_instance: "Llama"):
        # llm_instance: an already-loaded llama_cpp.Llama callable (annotation
        # quoted so this module can be imported without llama_cpp installed).
        self.llm = llm_instance
        print("--- Community Brain initialized. ---")

    # 🛑 HYBRID MODERATION (Fast + Cheap)
    def moderate_content(self, text: str) -> Dict[str, Any]:
        """
        Check content for toxicity using a local keyword list first,
        then AI for deeper semantic checks if needed.

        Returns:
            dict with keys ``toxicity_score`` (float, 0.0-1.0 — each keyword
            hit adds 0.4), ``is_safe`` (bool, True while score < 0.5) and
            ``flags`` (list[str], one entry per matched keyword).
        """
        score = 0.0
        flags = []
        text_lower = text.lower()

        # Whole-word matching. A plain substring test would flag innocent
        # words: "skills" contains "kill", "hatred" contains "hate", etc.
        for word in self.TOXIC_KEYWORDS:
            if re.search(rf"\b{re.escape(word)}\b", text_lower):
                score += 0.4  # two hits already exceed the 0.5 block threshold
                flags.append(f"Potential inappropriate word: {word}")

        # If highly toxic by keywords alone, fail immediately (don't waste LLM).
        if score > 0.5:
            return {"toxicity_score": min(score, 1.0), "is_safe": False, "flags": flags}

        # A second, contextual LLM pass is deliberately skipped here: running
        # the LLM for every post adds too much latency. Return the keyword
        # score as-is when the post is semi-clean.
        return {
            "toxicity_score": score,
            "is_safe": score < 0.5,
            "flags": flags,
        }

    # 🏷️ SMART TAGGING
    def generate_smart_tags(self, content: str) -> List[str]:
        """
        Extract up to 5 relevant hashtags from *content* using the LLM.

        Falls back to ``["#Community"]`` on any failure so the posting flow
        never breaks because of tagging.
        """
        try:
            # One-shot prompt: the worked example keeps the model's output
            # format stable. Content is truncated to 300 chars to bound cost.
            prompt = f"""[INST] Extract 4 relevant hashtags for this post. Return ONLY hashtags separated by spaces. No explanation.

Post: "I just bought this amazing lipstick shade, the red is so vibrant and it lasts all day! Perfect for summer looks."
Hashtags: #Beauty #Lipstick #Makeup #SummerVibes

Post: "{content[:300]}"
Hashtags: [/INST]"""

            response = self.llm(
                prompt,
                max_tokens=30,
                temperature=0.3,  # low temp for precision
                stop=["[INST]", "\n"],
                echo=False,
            )

            raw_tags = response['choices'][0]['text'].strip()
            tags = [t.strip() for t in raw_tags.split() if t.strip()]

            # Normalization: force a leading '#', strip stray symbols, and
            # drop tokens left empty after cleaning (a pure-punctuation token
            # would otherwise survive as a bare "#").
            clean_tags = []
            for t in tags:
                if not t.startswith('#'):
                    t = f"#{t}"
                t = re.sub(r'[^a-zA-Z0-9#]', '', t)
                if len(t) > 1:
                    clean_tags.append(t)

            return clean_tags[:5]  # Max 5 tags

        except Exception as e:
            print(f"Smart Tag Error: {e}")
            return ["#Community"]

    # 🧠 DISCUSSION SUMMARIZATION
    def summarize_thread(self, comments: List[str]) -> str:
        """
        Summarize a list of comments into a one-sentence key insight.

        Returns a canned string when the thread is empty or the LLM call fails.
        """
        if not comments:
            return "No activity yet."

        # Use the MOST RECENT comments and cap the prompt context at 1500
        # chars. (The previous code sliced comments[:15] — the oldest ones —
        # while its comment claimed "last"; take the tail so recent activity
        # drives the summary.)
        context_text = " | ".join(comments[-15:])[:1500]

        prompt = f"""[INST] Summarize the main sentiment and topic of this discussion in one sentence.

Discussion: {context_text}

Summary: [/INST]"""

        try:
            response = self.llm(
                prompt,
                max_tokens=60,
                temperature=0.5,
                stop=["[INST]", "\n"],
                echo=False,
            )
            return response['choices'][0]['text'].strip()
        except Exception:
            # Best-effort feature: never fail the endpoint over a summary error.
            return "Discussion is active."