Spaces:

gArthur98
/

distill_sentiment_classifier

Sleeping

App Files Files Community

distill_sentiment_classifier / pages /2_DistilledBert.py

gArthur98

Upload 19 files

0db5ea1 over 1 year ago

raw

history blame

3.15 kB


	import streamlit as st
	import torch
	from transformers import AutoTokenizer
	from transformers import AutoModelForSequenceClassification
	from transformers import AutoConfig
	import numpy as np
	import pandas as pd
	import re
	from scipy.special import softmax
	from transformers import pipeline
	import xformers
	import requests
	import json

	from streamlit_lottie import st_lottie


	import streamlit as st
	from transformers import AutoTokenizer, AutoModelForSequenceClassification
	import re
	from transformers import pipeline

	## Creating a cache to store my model for efficiency
	# A model is a large, unserializable-by-design resource, so it is cached with
	# st.cache_resource (shared object, no pickling/copying on every call)
	# instead of st.cache_data, which is meant for plain data values.
	@st.cache_resource(ttl=86400)
	def load_model(model_name):
	    """Load a sequence-classification model and cache it for 24 hours.

	    Args:
	        model_name: Identifier passed straight to
	            ``AutoModelForSequenceClassification.from_pretrained``.

	    Returns:
	        The model object returned by ``from_pretrained``.
	    """
	    return AutoModelForSequenceClassification.from_pretrained(model_name)

	## Creating my tokenizer
	# Cached as a shared resource (st.cache_resource) rather than as data, so the
	# tokenizer object is reused as-is instead of being pickled and copied.
	@st.cache_resource(ttl=86400)
	def load_tokenizer(tokenizer_name):
	    """Load a tokenizer and cache it for 24 hours.

	    Args:
	        tokenizer_name: Identifier passed straight to
	            ``AutoTokenizer.from_pretrained``.

	    Returns:
	        The tokenizer object returned by ``from_pretrained``.
	    """
	    return AutoTokenizer.from_pretrained(tokenizer_name)

	## Front end
	# Page heading shown at the top of this Streamlit page.
	st.title("Welcome to the Fine-Tuned DisTilled-Bert Sentiment Classifier Page")

	## Including an animation on my page

	def load_lottiefile(filepath: str):
	    """Read a Lottie animation (a JSON document) from disk.

	    Args:
	        filepath: Path of the JSON file to read.

	    Returns:
	        The parsed JSON content (whatever ``json.load`` produces).

	    Raises:
	        OSError: If the file cannot be opened.
	        json.JSONDecodeError: If the file is not valid JSON.
	    """
	    # JSON is UTF-8 by specification; do not depend on the platform locale.
	    with open(filepath, "r", encoding="utf-8") as f:
	        return json.load(f)

	# Initializing session state: load the default animation only when the key
	# is missing, so reruns of the script reuse the already-parsed animation.
	if "lottie_hello_2" not in st.session_state:
	    st.session_state["lottie_hello_2"] = load_lottiefile("./lottie_animations/dsbert.json")

	# Creating a function to handle an uploaded file while updating session state
	def handle_uploaded_file(uploaded_file):
	    """Replace the stored animation with the content of an uploaded file.

	    Args:
	        uploaded_file: A readable file-like object containing Lottie JSON,
	            or ``None`` when nothing was uploaded (in which case this is a
	            no-op). Presumably the value returned by ``st.file_uploader``
	            -- confirm against the caller.

	    Raises:
	        json.JSONDecodeError: If the upload is not valid JSON.
	    """
	    if uploaded_file is not None:
	        # An upload lives in memory; its ``.name`` is only the client-side
	        # filename, not a path that can be opened on the server. Parse the
	        # file object itself instead of trying to reopen it by name.
	        st.session_state.lottie_hello_2 = json.load(uploaded_file)


	# displaying the Lottie animation
	# Renders whatever animation is currently stored under the lottie_hello_2 session key.
	st_lottie(st.session_state.lottie_hello_2, height=200)

	# Free-text input box; its current value is bound to `text`.
	text = st.text_input("Please Enter a Covid-19 Themed Sentence Below: ")



	## Cleaning
	def data_cleaner(text):
	    """Normalize a sentence before it is passed to the classifier.

	    Steps, in order: lowercase, drop ``#hashtags``, drop every character
	    that is neither a word character nor whitespace, drop digit runs, then
	    collapse whitespace (discarding any remaining all-digit tokens).

	    Args:
	        text: The raw input string.

	    Returns:
	        The cleaned string; empty if nothing survives the cleaning.
	    """
	    text = text.lower()
	    ## Removing hashtags
	    text = re.sub(r'#\w+', '', text)
	    ## Removing punctuations (raw string: "\w" / "\s" are regex escapes,
	    ## not valid Python string escapes)
	    text = re.sub(r"[^\w\s]", repl="", string=text)
	    ## Removing digit runs
	    text = re.sub(r'\d+', '', text)
	    ## split()/join collapses repeated whitespace and trims both ends
	    text = " ".join([word for word in text.split() if not word.isdigit()])
	    return text

	## Running my input through my function
	text_input = data_cleaner(text)

	# Keep the model and tokenizer in session state so script reruns reuse them.
	if 'ro_model' not in st.session_state:
	    st.session_state.ro_model = load_model("gArthur98/Greg-DistilBert-classifier")

	if 'ro_token' not in st.session_state:
	    st.session_state.ro_token = load_tokenizer("gArthur98/Greg-DistilBert-classifier")

	pipe = pipeline("sentiment-analysis", model=st.session_state.ro_model, tokenizer=st.session_state.ro_token)

	final = st.button("Predict Sentiment")

	## Showing the prediction once the button is pressed
	if final:
	    if not text_input:
	        # Nothing left after cleaning (or nothing typed): do not classify
	        # an empty string and report a meaningless score.
	        st.warning("Please enter a sentence before requesting a prediction.")
	    else:
	        # Inference runs only on demand, not on every script rerun.
	        result = pipe(text_input)
	        # Model labels -> display names; any other label is shown as Positive.
	        sentiment_names = {'LABEL_0': "Negative", 'LABEL_1': "Neutral"}
	        for results in result:
	            sentiment = sentiment_names.get(results['label'], "Positive")
	            st.write(f"Your sentiment is {sentiment} with a confidence score of {results['score']}")



	# Static help text listing sample sentences the user can try.
	st.write("""Example of sentences to input:

	- The New Vaccine is Bad \n
	- I love the vaccine \n
	- Covid-19 is Moving Fast

	""")