SamanthaStorm committed
Commit 3bc2661 (verified) · Parent: 56a2dd5

Update app.py

Files changed (1): app.py (+58 -3)
app.py CHANGED
@@ -23,6 +23,18 @@ device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 logger.info(f"Using device: {device}")
 # Set up custom logging
 # Set up custom logging
+# Add cleanup function here
+def cleanup():
+    """Cleanup function to free memory"""
+    try:
+        if torch.cuda.is_available():
+            torch.cuda.empty_cache()
+        logger.info("Cleanup completed")
+    except Exception as e:
+        logger.error(f"Error during cleanup: {e}")
+
+atexit.register(cleanup)
+
 class CustomFormatter(logging.Formatter):
     """Custom formatter with colors and better formatting"""
     grey = "\x1b[38;21m"
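Note that the hunk above registers a process-exit hook but does not itself add an `import atexit` line, so that import presumably already exists elsewhere in app.py. A minimal self-contained sketch of the same idea (logger setup simplified for the example):

import atexit
import logging

import torch

logger = logging.getLogger(__name__)

def cleanup():
    """Free cached GPU memory at interpreter shutdown."""
    try:
        if torch.cuda.is_available():
            torch.cuda.empty_cache()
        logger.info("Cleanup completed")
    except Exception as e:
        logger.error(f"Error during cleanup: {e}")

atexit.register(cleanup)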
@@ -110,7 +122,7 @@ THRESHOLDS = {
 
 
 PATTERN_WEIGHTS = {
-    "recovery": 0.7,
+    "recovery phase": 0.7,
     "control": 1.4,
     "gaslighting": 1.3,
     "guilt tripping": 1.2,
@@ -329,6 +341,18 @@ def get_risk_stage(patterns, sentiment):
         logger.error(f"Error determining risk stage: {e}")
         return 1
 
+def detect_compound_threat(patterns):
+    """Helper function to standardize threat detection logic"""
+    pattern_set = set(p.lower() for p in patterns)
+
+    primary_threats = {"insults", "control"}
+    supporting_risks = {"gaslighting", "dismissiveness", "blame shifting"}
+
+    has_primary = bool(primary_threats & pattern_set)
+    has_supporting = bool(supporting_risks & pattern_set)
+
+    return has_primary and has_supporting
+
 @spaces.GPU
 def compute_abuse_score(matched_scores, sentiment):
     """Compute abuse score from matched patterns and sentiment"""
@@ -440,6 +464,15 @@ def analyze_single_message(text, thresholds):
             weight *= 1.5
         matched_scores.append((label, score, weight))
 
+    logger.debug("\n🧨 SINGLE-MESSAGE COMPOUND THREAT CHECK")
+    compound_threat_flag = detect_compound_threat([label for label, _, _ in matched_scores])
+    compound_threat_boost = compound_threat_flag
+
+    if compound_threat_flag:
+        logger.debug("⚠️ Compound high-risk patterns detected in single message.")
+    else:
+        logger.debug("✓ No compound threats detected in message.")
+
     # Get sentiment
     sent_inputs = sentiment_tokenizer(text, return_tensors="pt", truncation=True, padding=True)
     sent_inputs = {k: v.to(device) for k, v in sent_inputs.items()}
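The single-message check above passes the matched labels into the new detect_compound_threat helper: it flags a message only when at least one primary threat label and at least one supporting risk label co-occur. A quick standalone reading of that helper (condensed but behaviorally equivalent to the version added earlier; the input lists are invented examples, not model output):

def detect_compound_threat(patterns):
    """Condensed copy of the helper added above, for illustration only."""
    pattern_set = set(p.lower() for p in patterns)
    primary_threats = {"insults", "control"}
    supporting_risks = {"gaslighting", "dismissiveness", "blame shifting"}
    return bool(primary_threats & pattern_set) and bool(supporting_risks & pattern_set)

print(detect_compound_threat(["Control", "gaslighting"]))            # True: primary + supporting
print(detect_compound_threat(["control"]))                           # False: primary only
print(detect_compound_threat(["dismissiveness", "blame shifting"]))  # False: supporting only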
@@ -452,7 +485,8 @@ def analyze_single_message(text, thresholds):
     abuse_score = compute_abuse_score(matched_scores, sentiment)
     if explicit_abuse:
         abuse_score = max(abuse_score, 70.0)
-
+    if compound_threat_boost:
+        abuse_score = max(abuse_score, 85.0)  # force high score if compound risk detected
     # Get DARVO score
     darvo_score = predict_darvo_score(text)
 
@@ -464,8 +498,9 @@ def analyze_single_message(text, thresholds):
         logger.debug("Message classified as likely non-abusive (supportive, neutral, and obscure language). Returning low risk.")
        return 0.0, [], [], {"label": "supportive"}, 1, 0.0, "neutral"  # Return non-abusive values
 
+
     # Set stage
-    stage = 2 if explicit_abuse or abuse_score > 70 else 1
+    stage = 2 if explicit_abuse or abuse_score > 70 or compound_threat_boost else 1
 
     logger.debug("=== DEBUG END ===\n")
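Combined with the 85-point floor added in the previous hunk, a compound-threat hit both raises the abuse score and forces stage 2 even when the raw score is low. A rough sketch of just that arithmetic (apply_compound_rules is an illustrative name, not a function in app.py):

def apply_compound_rules(abuse_score, explicit_abuse, compound_threat_boost):
    """Mirror of the score-floor and stage logic added in the two hunks above."""
    if explicit_abuse:
        abuse_score = max(abuse_score, 70.0)
    if compound_threat_boost:
        abuse_score = max(abuse_score, 85.0)  # force high score if compound risk detected
    stage = 2 if explicit_abuse or abuse_score > 70 or compound_threat_boost else 1
    return abuse_score, stage

print(apply_compound_rules(42.0, False, True))   # (85.0, 2): compound threat floors the score
print(apply_compound_rules(42.0, False, False))  # (42.0, 1): unchanged without the flag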
 
@@ -664,7 +699,24 @@ def analyze_composite(msg1, msg2, msg3, *answers_and_none):
             logger.debug(f" • {severity} | {label}: {score:.3f} (weight: {weight})")
     else:
         logger.debug("\n✓ No abuse patterns detected")
+    # Compound Threat Detection (across all active messages)
+    logger.debug("\n🧨 COMPOUND THREAT DETECTION")
+    logger.debug("=" * 50)
+
+    compound_threat_flag = any(
+        detect_compound_threat(result[0][1])  # patterns are in result[0][1]
+        for result in results
+    )
+
+    if compound_threat_flag:
+        logger.debug("⚠️ ALERT: Compound threat patterns detected across messages")
+        logger.debug(" • High-risk combination of primary and supporting patterns found")
+    else:
+        logger.debug("✓ No compound threats detected across messages")
 
+    logger.debug(f" • Threat messages: {threat_count}")
+    logger.debug(f" • Supporting risk messages: {supporting_risk_count}")
+    logger.debug(f" • Compound threat triggered: {'YES' if compound_threat_flag else 'NO'}")
     # Extract scores and metadata
     abuse_scores = [r[0][0] for r in results]
     stages = [r[0][4] for r in results]
@@ -831,6 +883,9 @@ def analyze_composite(msg1, msg2, msg3, *answers_and_none):
         "Low"
     )
     logger.debug(f"\n⚠️ Final Escalation Risk: {escalation_risk}")
+    if compound_threat_flag:
+        escalation_risk = "Critical"
+        logger.debug("❗ Compound threat detected — overriding risk to CRITICAL.")
     # Generate Output Text
     logger.debug("\n📝 GENERATING OUTPUT")
     logger.debug("=" * 50)
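At the composite level, the flag is raised when any message's pattern list satisfies the helper, and it then overrides whatever escalation level was just computed. A self-contained sketch with invented data (the tuple shape only mimics what the diff indexes as result[0][1]):

def detect_compound_threat(patterns):
    """Repeated from the helper sketched above so this snippet runs on its own."""
    pattern_set = set(p.lower() for p in patterns)
    return (bool({"insults", "control"} & pattern_set)
            and bool({"gaslighting", "dismissiveness", "blame shifting"} & pattern_set))

# Hypothetical per-message results; index [0][1] holds the matched pattern labels.
results = [
    ((68.0, ["control", "blame shifting"]),),  # message 1: primary + supporting pattern
    ((12.0, []),),                             # message 2: nothing matched
]

compound_threat_flag = any(detect_compound_threat(r[0][1]) for r in results)

escalation_risk = "Low"  # stand-in for the value computed just above
if compound_threat_flag:
    escalation_risk = "Critical"

print(escalation_risk)  # -> Critical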
 