Spaces:

NazmusAshrafi
/

stock_tweet_topic_modeling_sa_app

Runtime error

App Files Files Community

NazmusAshrafi committed on Dec 22, 2023

Commit

57f0fa1

•

1 Parent(s): c303720

updated with larger model

Browse files

Files changed (2) hide show

app.py +24 -11
instructions.txt +7 -0

app.py CHANGED Viewed

@@ -6,7 +6,7 @@ from transformers import pipeline, AutoModelForSequenceClassification, AutoToken
 def get_model():
     tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased")
     pulled_model = AutoModelForSequenceClassification.from_pretrained(
-        "NazmusAshrafi/stock_twitter_topic_Bert")
     return tokenizer, pulled_model
@@ -21,21 +21,34 @@ classifier = pipeline("sentiment-analysis",
 st.title("Find the topic of a stock related tweets")
 st.subheader(
-    'This model can predict 3 topics - :blue[Investment decision], :green[User Volume], :orange[Market crisis] - Entering a topic related tweet will yeild the best results')
 st.markdown(
-    ':blue[Investment decision example: "AAP Dow Theory = Will go down in future, Do not buy"]')
 st.markdown(
-    ':green[User Volume example: "Loosing a lot of volume, user are leaving this platform"]')
 st.markdown(
-    ':orange[Market crisis example: "Market is in danger because of corona virus"]')
 st.subheader("", divider='rainbow')
-# 0 = Investment decision
-# 1 = User volume
-# 2 = Market crisis
 user_input = st.text_area("Enter a tweet about a stock")
@@ -50,5 +63,5 @@ if user_input and button:
     st.write("Confidence Score: ", classifier(user_input)[0]['score'])
-st.markdown(
-    'Note: Model may be predicting "Investment decision" way too often, this is because of the data imbalance. The model was trained on 3 topics, but the data was not balanced. The model was trained on a dataset where a large portion of the data was on "Investment decision" topic. This is why the model is biased towards "Investment decision" topic. This is a flaw of this model, and it can be fixed by training the model on a balanced dataset.')

 def get_model():
     tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased")
     pulled_model = AutoModelForSequenceClassification.from_pretrained(
+        "NazmusAshrafi/large_dataset_stock_twitter_topic_Bert")
     return tokenizer, pulled_model
 st.title("Find the topic of a stock related tweets")
 st.subheader(
+    'This model can predict 5 topics - :blue[Tesla Investment News], :green[Technology stock watchlist], :orange[Esports News], :blue[Apple Market Updates], :green[Amazon Updates] - Entering a topic related tweet will yeild the best results')
+# elif topic == 0:
+#     return 'Tesla Investment News'
+# elif topic == 1:
+#     return 'Technology stock watchlist'
+# elif topic == 2:
+#     return 'Esports News'
+# elif topic == 3:
+#     return 'Apple Market Updates'
+# elif topic == 4:
+#     return 'Amazon Updates'
+st.subheader(
+    'Examples:')
+st.markdown(
+    ':blue[Tesla Investment News: Electric cars stock going to go up in future, buy now"]')
 st.markdown(
+    ':green[Technology stock watchlist: "Keep a look out for that stock, its really good!"]')
 st.markdown(
+    ':orange[Esports News: "Ninja is going to play in the next tournament, the best is back playing Fortnite."]')
 st.markdown(
+    ':blue[Apple Market Updates: "$AAPL released a new phone but the looks never change much. Buy anyway!"]')
+st.markdown(
+    ':green[Amazon Updates: "Black Fridays at Amazon, hail Jeff Bezos"]')
 st.subheader("", divider='rainbow')
 user_input = st.text_area("Enter a tweet about a stock")
     st.write("Confidence Score: ", classifier(user_input)[0]['score'])
+# st.markdown(
+#     'Note: Model may be predicting "Investment decision" way too often, this is because of the data imbalance. The model was trained on 3 topics, but the data was not balanced. The model was trained on a dataset where a large portion of the data was on "Investment decision" topic. This is why the model is biased towards "Investment decision" topic. This is a flaw of this model, and it can be fixed by training the model on a balanced dataset.')

instructions.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+Run using:
+streamlit run app.py
+Push using:
+git add .
+git commit -m "New feature added"
+git push