nguyennghia0902 committed on
Commit
b64accf
1 Parent(s): e3efb90

Upload all files without model

Homepage.py ADDED
@@ -0,0 +1,43 @@
+ import streamlit as st
+ from st_pages import Page, show_pages
+
+ st.set_page_config(page_title="Sentiment Analysis", page_icon="🏠")
+
+ show_pages(
+     [
+         Page("streamlit_app.py/Homepage.py", "Home", "🏠"),
+         Page(
+             "streamlit_app.py/pages/Sentiment_Analysis.py", "Sentiment Analysis", "📝"
+         ),
+     ]
+ )
+
+ st.title("Seminar Công nghệ Tri thức - Transformer trong NLP")
+ st.markdown(
+     """
+ **Team members:**
+ | Student ID | Full Name |
+ | ---------- | ------------------------ |
+ | 19120600 | Bùi Nguyên Nghĩa |
+ | 19120607 | Phạm Thị Nguyệt |
+ """
+ )
+
+ st.header("The Need for Sentiment Analysis")
+ st.markdown(
+     """
+ Sentiment analysis algorithms are used to detect sentiment in a comment or a review.
+ It is said that around 90% of consumers read online reviews before visiting a business or buying a product.
+ These reviews can be positive, negative, or neutral, and it is important to know what customers are saying about your business.
+ """
+ )
+
+ st.header("Technology used")
+ st.markdown(
+     """
+ In this demo, we used BERT as the model for sentiment analysis. BERT is a transformer-based model that was proposed by Google in 2018.
+ It is a pre-trained model that can be used for various NLP tasks such as sentiment analysis, question answering, etc.
+ """
+ )
+
+
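For reference, a minimal local-run sketch (not part of this commit): it assumes the packages listed in requirements.txt are installed and that the repository root is the working directory, where streamlit_app.py is a directory rather than a module. It simply launches Streamlit on the entry script registered above.

# Hypothetical launcher for local testing; "python -m streamlit run <script>" is
# the standard CLI invocation, wrapped here so the path assumption is explicit.
import subprocess
import sys

ENTRY_POINT = "streamlit_app.py/Homepage.py"  # same path as app_file in README.md

subprocess.run(
    [sys.executable, "-m", "streamlit", "run", ENTRY_POINT],
    check=True,
)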
README.md CHANGED
@@ -1,13 +1,12 @@
  ---
- title: SentimentAnalysis UsingBERT
- emoji: 💻
- colorFrom: yellow
- colorTo: indigo
+ title: Sentiment Detection Using Bert
+ emoji: 🐨
+ colorFrom: gray
+ colorTo: gray
  sdk: streamlit
- sdk_version: 1.25.0
- app_file: app.py
+ sdk_version: 1.21.0
+ app_file: streamlit_app.py/Homepage.py
  pinned: false
- license: openrail
  ---

  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
Sentiment_Analysis.py ADDED
@@ -0,0 +1,117 @@
+ from os import path
+ import streamlit as st
+
+ # import pickle
+
+ # from tensorflow import keras
+ import tensorflow as tf
+ import torch
+ from torch import nn
+ from transformers import BertModel, BertTokenizer
+
+
+ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+ MODEL_NAME = "bert-base-cased"
+ MODEL_PATH = path.join(path.dirname(__file__), "bert_model.h5")
+
+
+ # Build the Sentiment Classifier class
+ class SentimentClassifier(nn.Module):
+     # Constructor
+     def __init__(self, n_classes):
+         super(SentimentClassifier, self).__init__()
+         self.bert = BertModel.from_pretrained(MODEL_NAME)
+         self.drop = nn.Dropout(p=0.3)
+         self.out = nn.Linear(self.bert.config.hidden_size, n_classes)
+
+     # Forward propagation
+     def forward(self, input_ids, attention_mask):
+         _, pooled_output = self.bert(
+             input_ids=input_ids, attention_mask=attention_mask, return_dict=False
+         )
+         # Apply dropout to the pooled output
+         output = self.drop(pooled_output)
+         return self.out(output)
+
+
+ @st.cache_resource
+ def load_model_and_tokenizer():
+     model = SentimentClassifier(3).to(device)
+     model.load_state_dict(torch.load(MODEL_PATH, map_location=device))
+     model.eval()
+     return model, BertTokenizer.from_pretrained(MODEL_NAME)
+
+
+ def predict(content):
+     model, tokenizer = load_model_and_tokenizer()
+     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+
+     encoded_review = tokenizer.encode_plus(
+         content,
+         max_length=160,
+         add_special_tokens=True,
+         return_token_type_ids=False,
+         pad_to_max_length=True,
+         return_attention_mask=True,
+         return_tensors="pt",
+     )
+
+     input_ids = encoded_review["input_ids"].to(device)
+     attention_mask = encoded_review["attention_mask"].to(device)
+
+     output = model(input_ids, attention_mask)
+     _, prediction = torch.max(output, dim=1)
+
+     class_names = ["negative", "neutral", "positive"]
+
+     return class_names[prediction]
+
+
+ def main():
+     st.set_page_config(page_title="Sentiment Analysis", page_icon="📝")
+
+     # Give the page a title
+     st.title("Sentiment analysis")
+     contents = st.text_area(
+         "Please enter reviews/sentiments/sentences/contents:",
+         placeholder="Enter your text here",
+         height=200,
+     )
+
+     prediction = ""
+
+     # Create a prediction button
+     if st.button("Analyze Sentiment"):
+         stripped = contents.strip()
+         if not stripped:
+             st.error("Please enter some text.")
+             return
+
+         prediction = predict(contents)
+         if prediction == "positive":
+             st.success("This is positive 😄")
+         elif prediction == "negative":
+             st.error("This is negative 😟")
+         else:
+             st.warning("This is neutral 🙂")
+
+     upload_file = st.file_uploader("Or upload a file", type=["txt"])
+     if upload_file is not None:
+         contents = upload_file.read().decode("utf-8")
+
+         for line in contents.splitlines():
+             line = line.strip()
+             if not line:
+                 continue
+
+             prediction = predict(line)
+             if prediction == "positive":
+                 st.success(line + "\n\nThis is positive 😄")
+             elif prediction == "negative":
+                 st.error(line + "\n\nThis is negative 😟")
+             else:
+                 st.warning(line + "\n\nThis is neutral 🙂")
+
+
+ if __name__ == "__main__":
+     main()
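Because the fine-tuned weights (bert_model.h5) are deliberately not part of this commit, here is a minimal sketch of the inference path that predict() implements, using the public bert-base-cased checkpoint and a randomly initialized 3-class head. It shows the tensor flow only; the printed label is meaningless until the real state dict is loaded.

# Standalone sketch of the tokenizer -> BERT -> linear-head path used by predict().
# Assumptions: transformers and torch installed; no fine-tuned weights loaded,
# so the resulting label is arbitrary.
import torch
from transformers import BertModel, BertTokenizer

MODEL_NAME = "bert-base-cased"
tokenizer = BertTokenizer.from_pretrained(MODEL_NAME)
bert = BertModel.from_pretrained(MODEL_NAME)
head = torch.nn.Linear(bert.config.hidden_size, 3)  # negative / neutral / positive

encoded = tokenizer(
    "The food was great but the service was slow.",
    max_length=160,
    padding="max_length",   # non-deprecated equivalent of pad_to_max_length=True
    truncation=True,
    return_tensors="pt",
)

with torch.no_grad():
    # pooled_output: [batch, hidden_size] summary derived from the [CLS] token
    _, pooled_output = bert(
        input_ids=encoded["input_ids"],
        attention_mask=encoded["attention_mask"],
        return_dict=False,
    )
    logits = head(pooled_output)  # [batch, 3] class scores

label = ["negative", "neutral", "positive"][int(logits.argmax(dim=1))]
print(label)  # arbitrary without the trained head's weights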
bert-sentiment-analysis.ipynb ADDED
The diff for this file is too large to render. See raw diff
 
dataset/reviews.csv ADDED
The diff for this file is too large to render. See raw diff
 
gitattributes.txt ADDED
@@ -0,0 +1,35 @@
+ *.7z filter=lfs diff=lfs merge=lfs -text
+ *.arrow filter=lfs diff=lfs merge=lfs -text
+ *.bin filter=lfs diff=lfs merge=lfs -text
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
+ *.ftz filter=lfs diff=lfs merge=lfs -text
+ *.gz filter=lfs diff=lfs merge=lfs -text
+ *.h5 filter=lfs diff=lfs merge=lfs -text
+ *.joblib filter=lfs diff=lfs merge=lfs -text
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
+ *.model filter=lfs diff=lfs merge=lfs -text
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
+ *.npy filter=lfs diff=lfs merge=lfs -text
+ *.npz filter=lfs diff=lfs merge=lfs -text
+ *.onnx filter=lfs diff=lfs merge=lfs -text
+ *.ot filter=lfs diff=lfs merge=lfs -text
+ *.parquet filter=lfs diff=lfs merge=lfs -text
+ *.pb filter=lfs diff=lfs merge=lfs -text
+ *.pickle filter=lfs diff=lfs merge=lfs -text
+ *.pkl filter=lfs diff=lfs merge=lfs -text
+ *.pt filter=lfs diff=lfs merge=lfs -text
+ *.pth filter=lfs diff=lfs merge=lfs -text
+ *.rar filter=lfs diff=lfs merge=lfs -text
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
+ *.tar filter=lfs diff=lfs merge=lfs -text
+ *.tflite filter=lfs diff=lfs merge=lfs -text
+ *.tgz filter=lfs diff=lfs merge=lfs -text
+ *.wasm filter=lfs diff=lfs merge=lfs -text
+ *.xz filter=lfs diff=lfs merge=lfs -text
+ *.zip filter=lfs diff=lfs merge=lfs -text
+ *.zst filter=lfs diff=lfs merge=lfs -text
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
requirements.txt ADDED
@@ -0,0 +1,10 @@
+ transformers
+ numpy
+ pandas
+ seaborn
+ matplotlib
+ scikit-learn
+ torch
+ tensorflow
+ streamlit
+ st-pages
streamlit_app.py/Homepage.py ADDED
@@ -0,0 +1,43 @@
+ import streamlit as st
+ from st_pages import Page, show_pages
+
+ st.set_page_config(page_title="Sentiment Analysis", page_icon="🏠")
+
+ show_pages(
+     [
+         Page("streamlit_app.py/Homepage.py", "Home", "🏠"),
+         Page(
+             "streamlit_app.py/pages/Sentiment_Analysis.py", "Sentiment Analysis", "📝"
+         ),
+     ]
+ )
+
+ st.title("Seminar Công nghệ Tri thức - Transformer trong NLP")
+ st.markdown(
+     """
+ **Team members:**
+ | Student ID | Full Name |
+ | ---------- | ------------------------ |
+ | 19120600 | Bùi Nguyên Nghĩa |
+ | 19120607 | Phạm Thị Nguyệt |
+ """
+ )
+
+ st.header("The Need for Sentiment Analysis")
+ st.markdown(
+     """
+ Sentiment analysis algorithms are used to detect sentiment in a comment or a review.
+ It is said that around 90% of consumers read online reviews before visiting a business or buying a product.
+ These reviews can be positive, negative, or neutral, and it is important to know what customers are saying about your business.
+ """
+ )
+
+ st.header("Technology used")
+ st.markdown(
+     """
+ In this demo, we used BERT as the model for sentiment analysis. BERT is a transformer-based model that was proposed by Google in 2018.
+ It is a pre-trained model that can be used for various NLP tasks such as sentiment analysis, question answering, etc.
+ """
+ )
+
+
streamlit_app.py/pages/Homepage.py ADDED
@@ -0,0 +1,43 @@
+ import streamlit as st
+ from st_pages import Page, show_pages
+
+ st.set_page_config(page_title="Sentiment Analysis", page_icon="🏠")
+
+ show_pages(
+     [
+         Page("streamlit_app.py/Homepage.py", "Home", "🏠"),
+         Page(
+             "streamlit_app.py/pages/Sentiment_Analysis.py", "Sentiment Analysis", "📝"
+         ),
+     ]
+ )
+
+ st.title("Seminar Công nghệ Tri thức - Transformer trong NLP")
+ st.markdown(
+     """
+ **Team members:**
+ | Student ID | Full Name |
+ | ---------- | ------------------------ |
+ | 19120600 | Bùi Nguyên Nghĩa |
+ | 19120607 | Phạm Thị Nguyệt |
+ """
+ )
+
+ st.header("The Need for Sentiment Analysis")
+ st.markdown(
+     """
+ Sentiment analysis algorithms are used to analyze sentiment in a comment or a review.
+ It is said that around 90% of consumers read online reviews before visiting a business or buying a product.
+ These reviews can be positive, negative, or neutral, and it is important to know what customers are saying about your business.
+ """
+ )
+
+ st.header("Technology used")
+ st.markdown(
+     """
+ In this demo, we used BERT as the model for sentiment analysis. BERT is a transformer-based model that was proposed by Google in 2018.
+ It is a pre-trained model that can be used for various NLP tasks such as sentiment analysis, question answering, etc.
+ """
+ )
+
+
streamlit_app.py/pages/Sentiment_Analysis.py ADDED
@@ -0,0 +1,117 @@
+ from os import path
+ import streamlit as st
+
+ # import pickle
+
+ # from tensorflow import keras
+ import tensorflow as tf
+ import torch
+ from torch import nn
+ from transformers import BertModel, BertTokenizer
+
+
+ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+ MODEL_NAME = "bert-base-cased"
+ MODEL_PATH = path.join(path.dirname(__file__), "bert_model.h5")
+
+
+ # Build the Sentiment Classifier class
+ class SentimentClassifier(nn.Module):
+     # Constructor
+     def __init__(self, n_classes):
+         super(SentimentClassifier, self).__init__()
+         self.bert = BertModel.from_pretrained(MODEL_NAME)
+         self.drop = nn.Dropout(p=0.3)
+         self.out = nn.Linear(self.bert.config.hidden_size, n_classes)
+
+     # Forward propagation
+     def forward(self, input_ids, attention_mask):
+         _, pooled_output = self.bert(
+             input_ids=input_ids, attention_mask=attention_mask, return_dict=False
+         )
+         # Apply dropout to the pooled output
+         output = self.drop(pooled_output)
+         return self.out(output)
+
+
+ @st.cache_resource
+ def load_model_and_tokenizer():
+     model = SentimentClassifier(3).to(device)
+     model.load_state_dict(torch.load(MODEL_PATH, map_location=device))
+     model.eval()
+     return model, BertTokenizer.from_pretrained(MODEL_NAME)
+
+
+ def predict(content):
+     model, tokenizer = load_model_and_tokenizer()
+     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+
+     encoded_review = tokenizer.encode_plus(
+         content,
+         max_length=160,
+         add_special_tokens=True,
+         return_token_type_ids=False,
+         pad_to_max_length=True,
+         return_attention_mask=True,
+         return_tensors="pt",
+     )
+
+     input_ids = encoded_review["input_ids"].to(device)
+     attention_mask = encoded_review["attention_mask"].to(device)
+
+     output = model(input_ids, attention_mask)
+     _, prediction = torch.max(output, dim=1)
+
+     class_names = ["negative", "neutral", "positive"]
+
+     return class_names[prediction]
+
+
+ def main():
+     st.set_page_config(page_title="Sentiment Analysis", page_icon="📝")
+
+     # Give the page a title
+     st.title("Sentiment analysis")
+     contents = st.text_area(
+         "Please enter reviews/sentiments/sentences/contents:",
+         placeholder="Enter your text here",
+         height=200,
+     )
+
+     prediction = ""
+
+     # Create a prediction button
+     if st.button("Analyze Sentiment"):
+         stripped = contents.strip()
+         if not stripped:
+             st.error("Please enter some text.")
+             return
+
+         prediction = predict(contents)
+         if prediction == "positive":
+             st.success("This is positive 😄")
+         elif prediction == "negative":
+             st.error("This is negative 😟")
+         else:
+             st.warning("This is neutral 🙂")
+
+     upload_file = st.file_uploader("Or upload a file", type=["txt"])
+     if upload_file is not None:
+         contents = upload_file.read().decode("utf-8")
+
+         for line in contents.splitlines():
+             line = line.strip()
+             if not line:
+                 continue
+
+             prediction = predict(line)
+             if prediction == "positive":
+                 st.success(line + "\n\nThis is positive 😄")
+             elif prediction == "negative":
+                 st.error(line + "\n\nThis is negative 😟")
+             else:
+                 st.warning(line + "\n\nThis is neutral 🙂")
+
+
+ if __name__ == "__main__":
+     main()