SamanthaStorm committed
Commit bd4971f · verified · 1 Parent(s): 28fc37c

Update app.py

Files changed (1)
  1. app.py +4 -2
app.py CHANGED
@@ -71,7 +71,7 @@ def calculate_abuse_level(scores, thresholds, motif_hits=None):
     # Boost score if high-risk motifs were detected
     motif_hits = motif_hits or []
     if any(label in motif_hits for label in {"physical_threat", "suicidal_threat", "extreme_control"}):
-        base_score = max(base_score, 60.0)  # Push to "Severe / Harmful Pattern Present"
+        base_score = max(base_score, 75.0)  # Push to "Severe / Harmful Pattern Present"
 
     return base_score
 
@@ -116,7 +116,9 @@ def analyze_messages(input_text, risk_flags):
     high_risk_context = any(flag in contextual_flags for flag in critical_flags)
 
     non_abusive_score = scores[LABELS.index('non_abusive')]
-    if non_abusive_score > adjusted_thresholds['non_abusive']:
+    non_abusive_confident = non_abusive_score > adjusted_thresholds['non_abusive']
+
+    if non_abusive_confident and danger_flag_count == 0 and not matched_phrases:
         return "This message is classified as non-abusive."
 
     abuse_level = calculate_abuse_level(scores, adjusted_thresholds, motif_hits=[label for label, _ in matched_phrases])
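
The two edits work together: calculate_abuse_level now floors the score at 75.0 (up from 60.0) when a high-risk motif is hit, and analyze_messages no longer returns the non-abusive verdict on model confidence alone. The sketch below illustrates the new gate in isolation; the helper name and sample values are hypothetical and not part of app.py, only the condition itself mirrors the diff.

# Minimal sketch (not the app's actual surrounding code) of the new gate.
def should_short_circuit_non_abusive(non_abusive_score, threshold,
                                     danger_flag_count, matched_phrases):
    """Return the early 'non-abusive' verdict only when the model is
    confident AND no danger flags or high-risk phrases were detected."""
    non_abusive_confident = non_abusive_score > threshold
    return non_abusive_confident and danger_flag_count == 0 and not matched_phrases

# A confident non-abusive score with nothing flagged still short-circuits:
print(should_short_circuit_non_abusive(0.9, 0.5, 0, []))  # True

# A matched high-risk phrase now keeps the message in the scoring path,
# where calculate_abuse_level(..., motif_hits=...) can push the score to 75.0:
print(should_short_circuit_non_abusive(0.9, 0.5, 0,
                                       [("physical_threat", "matched text")]))  # False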