Spaces:

aeresd
/

test_1

Sleeping

aeresd committed on May 20

Commit

d6593c8

verified ·

1 Parent(s): 5981972

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -74,7 +74,11 @@ st.markdown("## Input or Upload Text for Classification")
 col1, col2 = st.columns([2, 1])
 with col1:
-    user_input = st.text_area("Enter sentence with emojis:", value="you are 🐷", height=150)
     if st.button("Analyze Text"):
         with st.spinner("Processing..."):
             try:
@@ -135,18 +139,25 @@ if st.session_state.history:
     )
     st.plotly_chart(radar_fig)
-    # Top inputs per category
-    st.markdown("### Top Inputs by Offensive Category")
     categories = df['label'].unique()
     for cat in categories:
-        cat_df = df[df['label'] == cat].sort_values(by='score', ascending=False)
         st.markdown(f"**{cat}**")
-        top_n = cat_df.head(5)
-        for idx, row in top_n.iterrows():
-            st.markdown(f"- `{row['text']}` ({row['score']:.2%})")
-        if len(cat_df) > 5:
             with st.expander("Show more"):
-                for idx, row in cat_df.iloc[5:].iterrows():
-                    st.markdown(f"- `{row['text']}` ({row['score']:.2%})")
 else:
     st.info("No data available. Please analyze some text first.")

 col1, col2 = st.columns([2, 1])
 with col1:
+    user_input = st.text_area(
+        "Enter sentence with emojis:",
+        value="春竹你🐎是不是💩了,窩🌿泥🐎SB",
+        height=150
+    )
     if st.button("Analyze Text"):
         with st.spinner("Processing..."):
             try:
     )
     st.plotly_chart(radar_fig)
+    # Analyze words related to each offensive category
+    st.markdown("### Top Offensive Terms by Category")
     categories = df['label'].unique()
     for cat in categories:
         st.markdown(f"**{cat}**")
+        # collect max score per word in texts of this category
+        word_scores = {}
+        for _, row in df[df['label'] == cat].iterrows():
+            words = row['text'].split()
+            for w in words:
+                word_scores[w] = max(word_scores.get(w, 0), row['score'])
+        sorted_words = sorted(word_scores.items(), key=lambda x: x[1], reverse=True)
+        # display top 5 by default
+        for w, s in sorted_words[:5]:
+            st.markdown(f"- `{w}` ({s:.2%})")
+        # show more if exists
+        if len(sorted_words) > 5:
             with st.expander("Show more"):
+                for w, s in sorted_words[5:]:
+                    st.markdown(f"- `{w}` ({s:.2%})")
 else:
     st.info("No data available. Please analyze some text first.")