Created a new Python file that will hold the bias-detection functions for plain text input. Also added content to the success page for text submissions (for now it only shows the rating tuples).

omerert · omerert · commit d83bedc9ff66 · 2024-04-11T10:56:21.000-05:00
diff --git a/db.sqlite3 b/db.sqlite3
diff --git a/nlpFiles/detectionInText.py b/nlpFiles/detectionInText.py
@@ -0,0 +1,20 @@
+from transformers import AutoTokenizer, TFAutoModelForSequenceClassification, pipeline
+from nltk.tokenize import sent_tokenize
+from selenium import webdriver
+import os
+from bs4 import BeautifulSoup
+from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer
+
+def biasInText(userText) -> list:
+    """Return one stringified classifier result per sentence of ``userText`` (empty list if no text)."""
+    # Nothing to classify: return before paying for the expensive model load.
+    if not userText or not userText.strip():
+        return []
+    # Get models (no sentiment analyzer is needed for the bias classification done here).
+    tokenizer = AutoTokenizer.from_pretrained("d4data/bias-detection-model")
+    model = TFAutoModelForSequenceClassification.from_pretrained("d4data/bias-detection-model")
+    classifier = pipeline('text-classification', model=model, tokenizer=tokenizer)
+    # Separate user text by sentences; keep the first classifier result for each
+    # sentence, formatted as a string (presumably a label/score dict - confirm).
+    return [f"{classifier(sent)[0]}" for sent in sent_tokenize(userText)]
+# print(biasInText("My name is Omer. I am testing the new bias detection in text. Hopefully it works."))
diff --git a/nlpFiles/getTextFromWeb.py b/nlpFiles/getTextFromWeb.py
@@ -1,12 +1,8 @@
-import nltk
-import transformers
 from transformers import AutoTokenizer, TFAutoModelForSequenceClassification, pipeline
-from nltk.tokenize import sent_tokenize, word_tokenize
-import urllib.request
+from nltk.tokenize import sent_tokenize
 from selenium import webdriver
 import os
 from bs4 import BeautifulSoup
-from nltk.corpus import wordnet as wn
 from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer
 
 # class BiasDetection:
@@ -51,9 +47,7 @@
 #         soupText = BeautifulSoup(pageSource, 'html.parser')
 #         wantedText = soupText.findAll("p")
 #         return wantedText
-#!!!!! IMPORTANT !!!!!
-# GOING TO REWORK BIAS DETECTION TO ACTUALLY DETECT BIAS, CONCERNING WHERE IT IS IN THE TEXT AND IT'S TYPE(BIAS TOWARDS WHO?, WHAT KIND OF BIAS?, ETC)
-#!!!!! IMPORTANT !!!!!
+
 
 def percentToInt(list):
     # Remove '%' from strings and convert to float
@@ -127,12 +121,11 @@ def highRatedSent(paraList):
     return highList
 
 def polarityRating(list, pageSource):
-    # Starting up our models and analyzers
+    # Starting up our models
     tokenizer = AutoTokenizer.from_pretrained("d4data/bias-detection-model")
     model = TFAutoModelForSequenceClassification.from_pretrained("d4data/bias-detection-model")
     classifier = pipeline('text-classification', model=model, tokenizer=tokenizer)
     analyzer = SentimentIntensityAnalyzer()
-
     wantedText = getParagraph(pageSource)
     # Declare variables for average polarity
     count = 0
@@ -170,4 +163,20 @@ def polarityRating(list, pageSource):
     overallList = [str(round(totBias / count * 100, 1)) + "%", str(round(totNon / count * 100, 1)) + "%", str(round(totPos / polarityCount * 100, 1)) + "%", str(round(totNeg / polarityCount * 100, 1)) + "%" , round(totNeg / polarityCount * 100, 1)]
     overallList.append(round(totBias / count * 100, 0))
     if count != 0:
-        list.insert(0,overallList)
+        list.insert(0,overallList)
+# def getText(pageSource):
+#     tokenizer = AutoTokenizer.from_pretrained("d4data/bias-detection-model")
+#     model = TFAutoModelForSequenceClassification.from_pretrained("d4data/bias-detection-model")
+#     classifier = pipeline('text-classification', model=model, tokenizer=tokenizer)
+#     # analyzer = SentimentIntensityAnalyzer()
+
+#     wantedText = getParagraph(pageSource)
+#     for para in wantedText:
+#         sentences = sent_tokenize(para.text.strip())
+#         for sent in sentences:
+#             if sent != "":
+#                 print(classifier(sent)[0])
+# getText(webScrape("https://www.breitbart.com/2024-election/2024/04/11/doj-unmasks-inconsistencies-in-fani-williss-federal-grant-funds-use/"))
+# list1 = []
+# polarityRating(list1, webScrape("https://www.breitbart.com/2024-election/2024/04/11/doj-unmasks-inconsistencies-in-fani-williss-federal-grant-funds-use/"))
+# print(list1)
diff --git a/nlpFiles/trainedModel.py b/nlpFiles/trainedModel.py
@@ -0,0 +1,6 @@
+def model():
+    """Return a 'text-classification' pipeline built on d4data/bias-detection-model."""
+    from transformers import AutoTokenizer, TFAutoModelForSequenceClassification, pipeline  # local: module has no top-level imports
+    tokenizer = AutoTokenizer.from_pretrained("d4data/bias-detection-model")
+    bias_model = TFAutoModelForSequenceClassification.from_pretrained("d4data/bias-detection-model")
+    return pipeline('text-classification', model=bias_model, tokenizer=tokenizer)
diff --git a/nobiasapp/templates/successPage.html b/nobiasapp/templates/successPage.html
@@ -129,7 +129,7 @@
 
             </label>
             <nav class="navbar">
-                <a href="../" style="--i:0;">Home<span></span></a>
+                <a href="home" style="--i:0;">Home<span></span></a>
                 <a href="aboutus" style="--i:1;">About Us<span></span></a>
                 <a href="#" style="--i:2;"> Contacts<span></span></a>
                 <a href="tech" style="--i:3;"> How We Detect Bias<span></span></a>
diff --git a/nobiasapp/templates/textPage.html b/nobiasapp/templates/textPage.html
@@ -1,12 +1,154 @@
 {% load static %}
+
 <!DOCTYPE html>
 <html lang="en">
-<head>
-    <meta charset="UTF-8">
-    <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>Document</title>
-</head>
-<body>
-   <h1> {{ thisVar }}</h1>
-</body>
+
+    <head>
+        <meta charset="UTF-8">
+        <meta name="viewport" content="width=device-width, initial-scale=1.0">
+        <title>Successfully Submitted Text</title>
+        <link rel="stylesheet" href="{% static 'css/style.css' %}">
+    </head>
+    <style>
+        .logo img {
+                width: 100px;
+                float: left;
+                padding-left: 10%;
+                padding-top: 2%;
+            }
+        canvas {
+        position: relative;
+        top: 50%;
+        left: 50%;
+        transform: translate(-50%, -50%);
+        }
+        .text {
+        color: white;
+        font-weight: 600;
+        font-size: 24px;
+        position: absolute;
+        bottom: 55px;
+        left: 50%;
+        transform: translate(-50%, -50%);
+        }
+        .helpstuff {
+            display: flex;
+            margin:auto;
+            width:500px;
+        }
+
+        .tooltip {
+            position: relative;
+            display: inline-block;
+        }
+          
+        .tooltip .tooltiptext {
+            visibility: hidden;
+            width: 200px;
+            background-color: white;
+            background: #415f77;
+            color: #fff;
+            text-align: center;
+            padding: 5px 0;
+            border-radius: 6px;
+            opacity:0.77;
+           
+            position: absolute;
+            position: right;
+            z-index: 1;
+        }
+
+        .tooltip:hover .tooltiptext {
+            visibility: visible;
+        }
+        
+        .hoverstuff {
+            display: flex;
+            align-items: center;
+            justify-content: center;
+        }
+
+        .box {
+            background-color: #f8f8f8;
+            padding: 20px;
+            border-radius: 10px;
+            box-shadow: 0 0 20px rgba(0, 0, 0, 0.1);
+            line-height: 30px;
+            padding-top: 25px;
+        }
+
+        .polarity-bar {
+            width: 100%;
+            height: 20px;
+            background-color: #ddd;
+            border-radius: 5px;
+            overflow: hidden;
+            --cwidth1: {{ thisVar.0.0 }};
+            --cwidth2: {{ thisVar.0.1 }};
+            --cwidth3: {{ thisVar.0.2 }};
+        }
+
+        .polarity-bar .section {
+            height: 100%;
+            float: left;
+        }
+
+        .red-section {
+            background-color: #ff4646;
+            width: var(--cwidth1);
+        }
+
+        .grey-section {
+            background-color: #a0a0a0;
+            width: var(--cwidth2);
+        }
+
+        .green-section {
+            background-color: #4caf50;
+            width: var(--cwidth3);
+        }
+        h2{
+            color: black;
+        }
+
+    </style>
+
+    <body>
+        <header class="header">
+
+            <div class="logo">
+                <img src="{% static 'img/logo.png' %}" alt="1st-logo-1" style="scale: 0.8;">
+            </div>
+
+
+            <input type="checkbox" id="check">
+            <label for="check" class="icons">
+                <i class="bx bx-menu" id="menu-icon"></i>
+                <i class="bx bx-x" id="close-icon"></i>
+
+
+            </label>
+            <nav class="navbar">
+                <a href="home" style="--i:0;">Home<span></span></a>
+                <a href="aboutus" style="--i:1;">About Us<span></span></a>
+                <a href="#" style="--i:2;"> Contacts<span></span></a>
+                <a href="tech" style="--i:3;"> How We Detect Bias<span></span></a>
+            </nav>
+        </header>
+        <br><br>
+        <div class="box">
+            
+            <ul style="list-style-type: none; padding: 0; ">
+                
+                {% for link in sentences %}
+                    <li style="font-family: 'Open Sans', sans-serif; color: #003366; word-wrap: break-word;line-height: 40px;">
+                        {{ link }}
+                    </li>
+                {% endfor %}
+            </ul>
+        </div>
+
+
+    </body>
+
 </html>
diff --git a/nobiasapp/views.py b/nobiasapp/views.py
@@ -1,5 +1,6 @@
 from django.shortcuts import render
 from nlpFiles.getTextFromWeb import polarityRating, highRatedSent, getTitle, webScrape
+from nlpFiles.detectionInText import biasInText
 from .forms import SubmitLinkForm, SubmitTextBoxForm
 
 # def submitLink(request):
@@ -37,12 +38,13 @@ def home(request):
             title = getTitle(pageSource)
             polarityRating(paragraph, pageSource)
             highValuedList = highRatedSent(paragraph)
-            return render(request, 'successPage.html', {'thisVar': paragraph, "highValuedList": highValuedList, 'title': title})
+            return render(request, 'successPage.html', {'thisVar': paragraph, "highValuedList": highValuedList, 'title': title}) #Redirects to successpage when a link is submitted
         
         elif text_form.is_valid():
             text_object = text_form.save()
+            sentences = biasInText(str(text_object))
             # Do something with the text form submission
-            return render(request, 'textPage.html', {'thisVar': text_object})  # Render a success page for text form submission
+            return render(request, 'textPage.html', {'sentences': sentences}) #Redirects to the successpage when text is submitted
         
     else:
         link_form = SubmitLinkForm()