Spaces:

gridflowai
/

SentimentAnalysis-baselines-rnn

Sleeping

App Files Files Community

gridflowai committed on Dec 19, 2023

Commit

0c396ba

1 Parent(s): c24562e

Upload 12 files

Browse files

Files changed (8) hide show

.gitattributes +1 -0
README.md +5 -5
app.py +70 -44
classifier.pkl +3 -0
requirements.txt +2 -0
rnn_model.h5 +3 -0
test.py +70 -0
tok.json +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tok.json filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,10 +1,10 @@
 ---
-title: SentimentAnalysis Baselines
-emoji: 🏃
-colorFrom: gray
-colorTo: purple
 sdk: gradio
-sdk_version: 4.9.1
 app_file: app.py
 pinned: false
 ---

 ---
+title: ThreatClassification Oilspill - MNB
+emoji: 🌖
+colorFrom: yellow
+colorTo: yellow
 sdk: gradio
+sdk_version: 3.50.2
 app_file: app.py
 pinned: false
 ---

app.py CHANGED Viewed

@@ -1,27 +1,35 @@
 import gradio as gr
 import numpy as np
-from tensorflow.keras.models import load_model
-import re
-#importing skearn and joblib modules
 import joblib
-import sklearn
-# setting the joblib
-sklearn.externals.joblib = joblib# Load the models
 lr_model = joblib.load("logistic_model.pkl")
 svm_model = joblib.load("svm_model.pkl")
 nn_model = load_model("dl_model.h5")
 mnb_model = joblib.load("mnb_model.pkl")
 TAG_RE = re.compile(r'<[^>]+>')
 def remove_tags(text):
     return TAG_RE.sub('', text)
-# Load other necessary files like vectorizers or scalers
-tfidf_vectorizer = joblib.load("tfidf_vectorizer.pkl")
 def preprocess_text(sen):
     # Removing html tags
     sentence = remove_tags(sen)
@@ -37,64 +45,85 @@ def preprocess_text(sen):
     return sentence
-# Function to predict sentiment using Logistic Regression
-# Function to predict sentiment using Logistic Regression
 def predict_lr(text):
     preprocessed_text = preprocess_text(text)
     vectorized_text = tfidf_vectorizer.transform([preprocessed_text])
-    dense_vectorized_text = vectorized_text.toarray()  # Convert to dense array
-    prediction = int(lr_model.predict(dense_vectorized_text)[0])
-    return prediction
-# Function to predict sentiment using SVM
 def predict_svm(text):
     preprocessed_text = preprocess_text(text)
     vectorized_text = tfidf_vectorizer.transform([preprocessed_text])
-    dense_vectorized_text = vectorized_text.toarray()  # Convert to dense array
-    prediction = int(svm_model.predict(dense_vectorized_text)[0])
-    return prediction
-# Function to predict sentiment using Neural Network
 def predict_nn(text):
     preprocessed_text = preprocess_text(text)
     vectorized_text = tfidf_vectorizer.transform([preprocessed_text])
-    dense_vectorized_text = vectorized_text.toarray()  # Convert to dense array
     prediction_probs = nn_model.predict(dense_vectorized_text)[0]
     prediction = int(np.argmax(prediction_probs))
-    return prediction
-# Function to predict sentiment using Multinomial Naive Bayes
 def predict_mnb(text):
     preprocessed_text = preprocess_text(text)
     vectorized_text = tfidf_vectorizer.transform([preprocessed_text])
-    dense_vectorized_text = vectorized_text.toarray()  # Convert to dense array
-    prediction = int(mnb_model.predict(dense_vectorized_text)[0])
-    return prediction
-# Set the function based on the selected model
 def sentiment_prediction(text, model):
     if model == "Logistic Regression":
-        prediction = predict_lr(text)
     elif model == "SVM":
-        prediction = predict_svm(text)
     elif model == "Neural Network":
-        prediction = predict_nn(text)
     elif model == "Multinomial Naive Bayes":
-        prediction = predict_mnb(text)
-    threshold = 0.5
-    # Logic for determining positive or negative sentiment based on the model's prediction
-    if prediction >= threshold:
-        return "Positive"
-    else:
-        return "Negative"
 # Create the Gradio interface
 iface = gr.Interface(
     fn=sentiment_prediction,
-    inputs=[gr.Textbox(type="text", label="Enter Text"), gr.Dropdown(["Logistic Regression", "SVM", "Neural Network", "Multinomial Naive Bayes"], label="Select Model")],
-    outputs=gr.Label(),
     live=True,
     title="Sentiment Analysis with Model Selection",
     description="Enter a text and choose a model for sentiment prediction.",
@@ -102,6 +131,3 @@ iface = gr.Interface(
 # Launch the Gradio interface
 iface.launch()
-iface.launch()

 import gradio as gr
 import numpy as np
+from keras.models import load_model
+import re
+from keras.preprocessing.sequence import pad_sequences
+from keras.preprocessing.text import tokenizer_from_json
+import re
 import joblib
+import json
+# Load the JSON data from the file
+with open('tok.json', 'r') as json_file:
+    tokenizer_json = json.load(json_file)
+# Rebuild the tokenizer from the JSON configuration loaded above
+tokenizer = tokenizer_from_json(tokenizer_json)
+rnn_model = load_model("rnn_model.h5")
+# Load the saved models from disk
 lr_model = joblib.load("logistic_model.pkl")
 svm_model = joblib.load("svm_model.pkl")
 nn_model = load_model("dl_model.h5")
 mnb_model = joblib.load("mnb_model.pkl")
+# Load other necessary files like vectorizers or scalers
+tfidf_vectorizer = joblib.load("tfidf_vectorizer.pkl")
 TAG_RE = re.compile(r'<[^>]+>')
 def remove_tags(text):
     return TAG_RE.sub('', text)
 def preprocess_text(sen):
     # Removing html tags
     sentence = remove_tags(sen)
     return sentence
+def preprocess_text_for_rnn(text, tokenizer, maxlen):
+    text = preprocess_text(text)
+    sequence = tokenizer.texts_to_sequences([text])
+    padded_sequence = pad_sequences(sequence, padding='post', maxlen=maxlen)
+    return padded_sequence
 def predict_lr(text):
     preprocessed_text = preprocess_text(text)
     vectorized_text = tfidf_vectorizer.transform([preprocessed_text])
+    dense_vectorized_text = vectorized_text.toarray()
+    prediction_probs = lr_model.predict_proba(dense_vectorized_text)[0]
+    prediction = int(np.argmax(prediction_probs))
+    return prediction, prediction_probs
 def predict_svm(text):
     preprocessed_text = preprocess_text(text)
     vectorized_text = tfidf_vectorizer.transform([preprocessed_text])
+    dense_vectorized_text = vectorized_text.toarray()
+    prediction_probs = svm_model.predict_proba(dense_vectorized_text)[0]
+    prediction = int(np.argmax(prediction_probs))
+    return prediction, prediction_probs
 def predict_nn(text):
+    """Score `text` with the dense neural-network model.
+
+    Returns `(class_index, probabilities)`: the first row of
+    `nn_model.predict` and the index of its largest entry.
+    """
     preprocessed_text = preprocess_text(text)
     vectorized_text = tfidf_vectorizer.transform([preprocessed_text])
+    # The network is fed a dense array rather than the vectorizer's raw output.
+    dense_vectorized_text = vectorized_text.toarray()
     prediction_probs = nn_model.predict(dense_vectorized_text)[0]
     prediction = int(np.argmax(prediction_probs))
+    return prediction, prediction_probs
 def predict_mnb(text):
     preprocessed_text = preprocess_text(text)
     vectorized_text = tfidf_vectorizer.transform([preprocessed_text])
+    dense_vectorized_text = vectorized_text.toarray()
+    prediction_probs = mnb_model.predict_proba(dense_vectorized_text)[0]
+    prediction = int(np.argmax(prediction_probs))
+    return prediction, prediction_probs
+def predict_rnn(text):
+    processed_text = preprocess_text_for_rnn(text, tokenizer, maxlen=170)
+    prediction_probs = rnn_model.predict(processed_text)[0]
+    prediction = int(np.argmax(prediction_probs))
+    return prediction, prediction_probs
 def sentiment_prediction(text, model):
+    prediction, percentages = 0, []
     if model == "Logistic Regression":
+        prediction, percentages = predict_lr(text)
     elif model == "SVM":
+        prediction, percentages = predict_svm(text)
     elif model == "Neural Network":
+        prediction, percentages = predict_nn(text)
     elif model == "Multinomial Naive Bayes":
+        prediction, percentages = predict_mnb(text)
+    elif model == "Recurrent Neural Network":
+        prediction, percentages = predict_rnn(text)
+    # Displaying emojis based on sentiment
+    emoji_positive = "😃"
+    emoji_negative = "😢"
+    emoji = emoji_positive if prediction == 1 else emoji_negative
+    # Create labels for predictions
+    labels = ["Negative", "Positive"]
+    # Create label for the prediction
+    prediction_label = labels[prediction]
+    # Calculate percentages for both labels
+    percentage_negative = percentages[0]
+    percentage_positive = percentages[1]
+    return prediction_label, f"{labels[0]}: {percentage_negative:.2%}, Percentage {labels[1]}: {percentage_positive:.2%}", emoji
 # Create the Gradio interface
 iface = gr.Interface(
     fn=sentiment_prediction,
+    inputs=[gr.Textbox(type="text", label="Enter Text"), gr.Dropdown(["Logistic Regression", "SVM", "Neural Network", "Multinomial Naive Bayes", "Recurrent Neural Network"], label="Select Model")],
+    outputs=[gr.Label(), gr.Label(), gr.Label()],
     live=True,
     title="Sentiment Analysis with Model Selection",
     description="Enter a text and choose a model for sentiment prediction.",
 # Launch the Gradio interface
 iface.launch()

classifier.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9189d53b69f0d9ff501d0a51aa9ab344b2455e03bf347653fb84ed075f788f3b
+size 386759

requirements.txt CHANGED Viewed

@@ -4,3 +4,5 @@ numpy
 nltk
 tensorflow==2.15.0
 joblib==1.3.2

 nltk
 tensorflow==2.15.0
 joblib==1.3.2
+keras==2.15.0
+h5py==3.9.0

rnn_model.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:08682f8d8b196bfff00560f2c029e4dd57a51b6cfaece9f3fba85fb646b0e977
+size 47449360

test.py ADDED Viewed

	@@ -0,0 +1,70 @@

+from keras.models import load_model
+from keras.preprocessing.text import tokenizer_from_json
+from keras.preprocessing.sequence import pad_sequences
+import json
+import joblib
+import re
+rnn_model = load_model("rnn_model.h5")
+# Load the JSON data from the file
+with open('tok.json', 'r') as json_file:
+    tokenizer_json = json.load(json_file)
+# Rebuild the tokenizer from the JSON configuration loaded above
+tokenizer = tokenizer_from_json(tokenizer_json)
+TAG_RE = re.compile(r'<[^>]+>')
+def remove_tags(text):
+    return TAG_RE.sub('', text)
+# Load other necessary files like vectorizers or scalers
+tfidf_vectorizer = joblib.load("tfidf_vectorizer.pkl")
+def preprocess_text(sen):
+    # Removing html tags
+    sentence = remove_tags(sen)
+    # Remove punctuations and numbers
+    sentence = re.sub('[^a-zA-Z]', ' ', sentence)
+    # Single character removal
+    sentence = re.sub(r"\s+[a-zA-Z]\s+", ' ', sentence)
+    # Removing multiple spaces
+    sentence = re.sub(r'\s+', ' ', sentence)
+    return sentence
+def preprocess_text_for_rnn(text, tokenizer, maxlen):
+    text = preprocess_text(text)
+    sequence = tokenizer.texts_to_sequences([text])
+    padded_sequence = pad_sequences(sequence, padding='post', maxlen=maxlen)
+    return padded_sequence
+# Function to predict sentiment using the Recurrent Neural Network
+def predict_rnn(text):
+    processed_text = preprocess_text_for_rnn(text, tokenizer, maxlen=170)
+    prediction = rnn_model.predict(processed_text)
+    # Assuming class 0 is negative and class 1 is positive
+    if prediction[0][0] > prediction[0][1]:
+        return 0  # Negative sentiment
+    else:
+        return 1  # Positive sentiment
+print(predict_rnn('Apart from having the longest reign in British history years Queen Victoria also holds two other distinctions She was apart from our current Queen the oldest ever British monarch living to the age of And she was also the youngest ever British as opposed to English or Scottish monarch coming to the throne as girl of eighteen And yet whenever television or the cinema make programme or film about her they seem far more interested in the older Victoria than they do in the young girl the version of Victoria with which modern audiences will probably be most familiar is Judi Dench in Mrs Brown The Young Victoria tries to redress the balance by showing us the events surrounding her accession and the early years of her reign It has the rare distinction of being produced by former Royal Sarah Duchess of York whose daughter Princess Beatrice makes brief appearance as an extra There are three main strands to the plot The first concerns the intrigues of Victoria mother the Duchess of Kent highly unpopular figure even with her own daughter largely because of the influence of her adviser Sir John Conroy who was widely rumoured to be her lover According to one unfounded rumour he and not the late Duke of Kent was Victoria natural father The second strand concerns the growing romance between Victoria and her German cousin Prince Albert and the attempts of King Leopold of Belgium who was uncle to both of them to influence this romance Leopold hope was to increase the prestige of the House of Saxe Coburg to which both he and Albert belonged The third concerns one of the strangest episodes in British political history the Bedchamber Crisis of when supporters of the Tory Party which had traditionally supported strong monarchy rioted because the young Queen was perceived to favour the Whig Party and their leader Lord Melbourne even though the Whigs had historically supported quasi republican system of government with the monarch reduced to figurehead Scriptwriter 
Julian Fellowes is known for his Conservative views and at times wondered if this may have coloured his treatment of political themes as he seems to lean to the side of the Tories the predecessors of the modern Conservative party Their leader Robert Peel is shown as statesmanlike and dignified whereas Melbourne for all his dash and charm is shown as devious and uninterested in social reform There may be some truth is these characterisations but Fellowes glosses over the fact that only few years earlier the Tories had opposed the Reform Act which ended the corrupt electoral system of rotten boroughs and that they had benefited from William IV unconstitutional dismissal of Whig administration Lessons in dynastic and constitutional history do not always transfer well to the cinema screen and this one contains its share of inaccuracies Prince Albert for example was not injured in Edward Oxford attempt on Victoria life and Melbourne in his late fifties at the time of Victoria accession was not as youthful as he is portrayed here by Paul Bettany King William IV certainly disliked the Duchess of Kent who was his sister in law but doubt if he would have gone so far as to bawl abuse at her during state banquet as he is shown doing here also failed to understand the significance of the scene in which the Duchess and Conroy try to force Victoria to sign Regency Order the Duchess constitutional position was made clear by the Regency Act which provided that she would become Regent if her daughter was still under eighteen at the time of her accession No piece of paper signed by Victoria could have altered the provisions of the Act There are also occasional infelicities In one early scene we see Victoria and Albert playing chess while comparing themselves to pawns being moved around chessboard metaphor so hackneyed that the whole scene should have come complete with Danger Major clich ahead warning Yet in spite of scenes like this came to enjoy the film There were some good 
performances especially from Miranda Richardson as the scheming Duchess and Mark Strong as the obnoxious Conroy It is visually very attractive being shot in sumptuous style we have come to associate with British historical drama Jim Broadbent gives an amusing turn as King William although he does occasionally succumb to the temptation of going over the top Although not as disastrously over the top as he was in Moulin Rouge The main reason for the film success however is the performances of Emily Blunt and Rupert Friend as the two young lovers Victoria and Albert Blunt is probably more attractive than Victoria was in real life but in her delightful portrayal the Queen is no longer the old lady of the popular imagination the black clad Widow of Windsor who was perpetually not amused but determined strong minded and loving young woman Her love for Albert and their happy family life together was one of the main reasons why the monarchy succeeded in reestablishing itself in the affections of the British people With the exception of George III Victoria Hanoverian ancestors had been notoriously lacking in the matrimonial virtues Blunt and Friend make The Young Victoria touching romance and gripping human drama as well as an exploration of key period in British history '))

tok.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d5cc0f92c384fa972a7c734c438d63e288aa20a9c34d450389e70cc93cb4d32
+size 10838553