Commit 81a5fc1

Initial commit (0 parents)

10 files changed: +659 additions, -0 deletions

.gitattributes

Lines changed: 2 additions & 0 deletions
@@ -0,0 +1,2 @@
# Auto detect text files and perform LF normalization
* text=auto

Procfile

Lines changed: 1 addition & 0 deletions
@@ -0,0 +1 @@
web: gunicorn app:app

README.md

Lines changed: 10 additions & 0 deletions
@@ -0,0 +1,10 @@
# Sentiment Analysis
A simple sentiment analysis application built with the following packages:
- TensorFlow Keras
- Natural Language Toolkit (NLTK)
- scikit-learn (TfidfVectorizer)

The model was trained on tweets from the [Sentiment140 dataset with 1.6 million tweets](http://www.kaggle.com/kazanova/sentiment140).

The app has been deployed using Flask and Heroku and can be found [here](http://sentiment-analysis-mp.herokuapp.com/).
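The trained artifacts (vectorizer.pickle and model.h5, loaded in app.py below) are committed, but no training script is included. The following is a hypothetical sketch of how they could have been produced, assuming a TfidfVectorizer capped at 2500 features to match the reshape(1, 1, 2500) in app.py and a small Keras LSTM; the author's actual architecture, preprocessing, and hyperparameters may differ, and pandas (not in requirements.txt) is assumed here only for loading the CSV.

# Hypothetical training sketch -- not part of this commit. Shapes are chosen to
# match the artifacts loaded in app.py (vectorizer.pickle, model.h5, 2500 features).
import pickle
import pandas as pd
import tensorflow as tf
from sklearn.feature_extraction.text import TfidfVectorizer

# Sentiment140 CSV: column 0 is the label (0 = negative, 4 = positive), column 5 the tweet text.
df = pd.read_csv("training.1600000.processed.noemoticon.csv", encoding="latin-1", header=None)
df = df.sample(20_000, random_state=0)   # subsample: a dense TF-IDF matrix of all 1.6M tweets would not fit in memory
texts = df[5].astype(str)                # the preprocess() cleanup from app.py would presumably be applied here as well
labels = (df[0] == 4).astype(int).values

vect = TfidfVectorizer(max_features=2500)
X = vect.fit_transform(texts).toarray().reshape(-1, 1, 2500)

model = tf.keras.Sequential([
    tf.keras.layers.LSTM(64, input_shape=(1, 2500)),
    tf.keras.layers.Dense(1, activation="sigmoid"),  # output[0] is read in app.py as the sentiment score
])
model.compile(optimizer="adam", loss="binary_crossentropy", metrics=["accuracy"])
model.fit(X, labels, epochs=2, batch_size=512, validation_split=0.1)

pickle.dump(vect, open("vectorizer.pickle", "wb"))
model.save("model.h5")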

app.py

Lines changed: 43 additions & 0 deletions
@@ -0,0 +1,43 @@
import numpy as np
from flask import Flask, request, jsonify, render_template
import pickle
import os
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
import tensorflow as tf
import re
from nltk.corpus import stopwords
from nltk.stem import SnowballStemmer

app = Flask(__name__)
vect = pickle.load(open("vectorizer.pickle", 'rb'))
model = tf.keras.models.load_model('model.h5')

def preprocess(text, stem=False):
    text = re.sub(r"@\S+|https?:\S+|http?:\S|[^A-Za-z0-9]+", ' ', str(text).lower()).strip()
    stop_words = stopwords.words('english')
    stemmer = SnowballStemmer('english')
    tokens = []
    for token in text.split():
        if token not in stop_words:
            if stem:
                tokens.append(stemmer.stem(token))
            else:
                tokens.append(token)
    return " ".join(tokens)


@app.route('/')
def home():
    return render_template('index.html')

@app.route('/predict', methods=['POST'])
def predict():
    inp = [x for x in request.form.values()]
    inp = preprocess(inp)
    inp = vect.transform([inp]).toarray().reshape(1, 1, 2500)
    output = model.predict(inp)[0]

    return render_template('index.html', prediction_text='{}'.format(output[0]))

if __name__ == "__main__":
    app.run(debug=True)
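With the app running locally (python app.py, or gunicorn app:app as in the Procfile), the /predict route can be exercised with a form-encoded POST. Below is a minimal client sketch using the requests library (not part of the commit); the field name "text" is arbitrary, since predict() simply iterates over request.form.values():

import requests

# Hypothetical client call; assumes the app is serving on localhost:5000.
resp = requests.post("http://127.0.0.1:5000/predict",
                     data={"text": "I absolutely loved this movie!"})
print(resp.status_code)   # 200; the rendered index.html carries the model's score in prediction_text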

model.h5

18.9 MB
Binary file not shown.

nltk.txt

Lines changed: 1 addition & 0 deletions
@@ -0,0 +1 @@
stopwords
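nltk.txt is read by Heroku's Python buildpack, which downloads the listed NLTK corpora at build time; here that is the stopwords corpus that preprocess() in app.py relies on. For a local run there is no buildpack, so the corpus presumably needs a one-time manual download, for example:

import nltk
nltk.download("stopwords")   # makes stopwords.words('english') available locally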

requirements.txt

Lines changed: 6 additions & 0 deletions
@@ -0,0 +1,6 @@
Flask==1.1.2
numpy==1.18.5
nltk==3.5
tensorflow==2.3.1
scikit-learn==0.23.2
gunicorn==20.0.4
