Spaces:

tassid
/

sentiment-phrases

Running

App Files Community

tassid committed on 8 days ago

Commit

2129645

verified ·

1 Parent(s): 724b0cd

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -7

app.py CHANGED Viewed

@@ -124,7 +124,7 @@ print(f"- Moderadores: {len(moderators)}")
 print(f"{'='*60}\n")
 # Limiar AUMENTADO para evitar falsos positivos
-TOXICITY_THRESHOLD = 0.75  # Aumentado de 0.70 para 0.75
 # Mapeamento expandido de labels
 LABEL_MAPPING = {
@@ -151,6 +151,7 @@ LABEL_MAPPING = {
 def verificar_linguagem(texto):
     """
     Verifica linguagem imprópria com MAIS modelos e threshold MAIOR
     """
     if not moderators or len(texto.strip()) < 3:
         return False, 0.0
@@ -163,14 +164,25 @@ def verificar_linguagem(texto):
             label = resultado['label'].lower()
             score = resultado['score']
-            # Interpretar com mais cuidado
-            is_toxic_label = any(word in label for word in ['toxic', 'hate', 'offensive', 'hateful'])
-            if is_toxic_label:
                 toxicity = score
-            else:
-                # Se label é "normal" ou "not toxic", inverter
                 toxicity = 1 - score
             scores_toxicos.append(toxicity)
@@ -286,6 +298,12 @@ def analisar_texto(texto):
     # VERIFICAR LINGUAGEM (com threshold mais alto)
     has_improper, improper_score = verificar_linguagem(texto)
     # Formatar resultado
     if has_improper:
         resultado_texto = f"""**{classificacao}**
@@ -395,7 +413,11 @@ with gr.Blocks(title="Análise de Sentimentos Avançada") as demo:
         **Moderadores Ativos:** {len(moderators)} / {len(MODERATION_MODELS)}
-        **Threshold:** {TOXICITY_THRESHOLD*100:.0f}% (balanceado para evitar falsos positivos)
         **Modelos:**
         - DistilBERT Toxicity

 print(f"{'='*60}\n")
 # Limiar AUMENTADO para evitar falsos positivos
+TOXICITY_THRESHOLD = 0.80  # Aumentado para reduzir falsos positivos
 # Mapeamento expandido de labels
 LABEL_MAPPING = {
 def verificar_linguagem(texto):
     """
     Verifica linguagem imprópria com MAIS modelos e threshold MAIOR
+    Com interpretação melhorada de labels
     """
     if not moderators or len(texto.strip()) < 3:
         return False, 0.0
             label = resultado['label'].lower()
             score = resultado['score']
+            # Interpretar labels com MAIS cuidado
+            # Labels que indicam TOXICIDADE
+            toxic_keywords = ['toxic', 'hate', 'offensive', 'hateful', 'obscene', 'threat', 'insult']
+            # Labels que indicam NORMALIDADE
+            normal_keywords = ['not', 'normal', 'neutral', 'clean']
+            is_toxic_label = any(word in label for word in toxic_keywords)
+            is_normal_label = any(word in label for word in normal_keywords)
+            # Calcular toxicity score com lógica melhorada
+            if is_toxic_label and not is_normal_label:
+                # Label diz que é tóxico
                 toxicity = score
+            elif is_normal_label or 'not' in label:
+                # Label diz que NÃO é tóxico
                 toxicity = 1 - score
+            else:
+                # Label ambíguo, assumir score direto se alto
+                toxicity = score if score > 0.5 else 1 - score
             scores_toxicos.append(toxicity)
     # VERIFICAR LINGUAGEM (com threshold mais alto)
     has_improper, improper_score = verificar_linguagem(texto)
+    # LÓGICA INTELIGENTE: Se Positivo com boa confiança, provavelmente não é ofensivo
+    if classificacao == 'Positivo' and confianca_final > 0.70:
+        has_improper = False  # Ignora alerta para textos claramente positivos
+    # Se Neutro ou Negativo, ainda verifica normalmente
     # Formatar resultado
     if has_improper:
         resultado_texto = f"""**{classificacao}**
         **Moderadores Ativos:** {len(moderators)} / {len(MODERATION_MODELS)}
+        **Threshold:** {TOXICITY_THRESHOLD*100:.0f}% (mais alto para evitar falsos positivos)
+        **Lógica Inteligente:**
+        - Textos claramente positivos (>70% confiança) não geram alertas
+        - Foco em detectar problemas reais
         **Modelos:**
         - DistilBERT Toxicity