Spaces:

AnastasiaMozhayskaya
/

nlp_lstm_project

Running

App Files Files Community

Анастасия committed on Dec 10, 2023

Commit

019c64d

•

1 Parent(s): 536d618

project_streamlit_app

Browse files

Files changed (35) hide show

.gitattributes +1 -0
__init__.py +0 -0
images/.DS_Store +0 -0
images/classes.png +0 -0
images/classification_report.png +0 -0
images/kino.png +0 -0
images/toxy.png +0 -0
main.py +38 -0
model/.DS_Store +0 -0
model/__pycache__/bert.cpython-310.pyc +0 -0
model/__pycache__/ltsm_att.cpython-310.pyc +0 -0
model/__pycache__/ml.cpython-310.pyc +0 -0
model/__pycache__/rnn.cpython-310.pyc +0 -0
model/bert.py +29 -0
model/embedding_matrix.pt +3 -0
model/logistic_regression_weights.pkl +3 -0
model/lr_weights.pkl +3 -0
model/lstm_att_weight.pt +3 -0
model/ltsm_att.py +99 -0
model/ml.py +36 -0
model/rubert_tiny_toxicity_tokenizer_weights.pt/special_tokens_map.json +3 -0
model/rubert_tiny_toxicity_tokenizer_weights.pt/tokenizer.json +3 -0
model/rubert_tiny_toxicity_tokenizer_weights.pt/tokenizer_config.json +3 -0
model/rubert_tiny_toxicity_tokenizer_weights.pt/vocab.txt +0 -0
model/rubert_tiny_toxicity_weights.pt +3 -0
model/tf-idf.pkl +3 -0
model/word2vec_for_ltsm.model +3 -0
model/word_dict.json +3 -0
pages/.DS_Store +0 -0
pages/01_🎞️_Kinootzovik.py +38 -0
pages/02_🤖_Toxicity.py +56 -0
pages/03_🔥_Results.py +69 -0
pages/__init__.py +0 -0
pages/__pycache__/__init__.cpython-310.pyc +0 -0
requirements.txt +221 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.json filter=lfs diff=lfs merge=lfs -text

__init__.py ADDED Viewed

File without changes

images/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

images/classes.png ADDED Viewed

images/classification_report.png ADDED Viewed

images/kino.png ADDED Viewed

images/toxy.png ADDED Viewed

main.py ADDED Viewed

	@@ -0,0 +1,38 @@

+import streamlit as st
+# Landing page of the Streamlit app: static markdown only, no user input is read here.
+# Page title: the two tasks covered by the app (film-review classification, message toxicity).
+st.write("""
+ \n ## Классификация отзывов на фильм 📽️
+ \n ## Оценка степени токсичности пользовательского сообщения 🌶️
+""")
+# Disabled heading for a third task ("text generation with a GPT model from a user prompt"):
+# \n ## Генерация текста GPT-моделью по пользовательскому prompt 🕹️
+# Team name; unsafe_allow_html=True is required for the inline <span> colour styling to render.
+st.write("### *<span style='color:red'>LSTM Team</span>*", unsafe_allow_html=True)
+# Team roster.
+st.write("""
+  ### Состав команды:
+  \n1. ##### Анастасия 👩🏻‍💻
+  \n2. ##### Алексей 👨🏻‍💻
+  \n3. ##### Тигран 👨🏻‍💻
+""")
+# "Projects" section heading.
+st.write("""
+  ### Проекты:
+""")
+# Task statements: (1) classify a review with three models, (2) score message toxicity.
+st.write("""
+  #### 1. Необходимо построить модель классификации введенного пользователем отзыва. Результаты предсказаний класса вывести тремя моделями.
+  \n ##### Задача по моделям:
+        \n- Классический ML-алгоритм, обученный на BagOfWords/TF-IDF представлении
+        \n- RNN или LSTM модель (предпочтительно использовать вариант с attention)
+        \n- BERT-based
+  \n #### 2. Оценка степени токсичности пользовательского сообщения
+  \n #####  Задачи:
+        \n- Решить с помощью модели rubert-tiny-toxicity
+""")
+  # Disabled description of the third task (GPT text generation with user-tunable
+  # sequence length, number of generations, temperature or top-k/p):
+  # \n ### 3. Генерация текста GPT-моделью по пользовательскому prompt
+  # \n #####  Задачи:
+  #       \n- Пользователь может регулировать длину выдаваемой последовательности, Число генераций, Температуру или top-k/p

model/.DS_Store ADDED Viewed

Binary file (8.2 kB). View file

model/__pycache__/bert.cpython-310.pyc ADDED Viewed

Binary file (1.54 kB). View file

model/__pycache__/ltsm_att.cpython-310.pyc ADDED Viewed

Binary file (3.92 kB). View file

model/__pycache__/ml.cpython-310.pyc ADDED Viewed

Binary file (1.25 kB). View file

model/__pycache__/rnn.cpython-310.pyc ADDED Viewed

Binary file (5.89 kB). View file

model/bert.py ADDED Viewed

	@@ -0,0 +1,29 @@

+import torch
+import streamlit as st
+from transformers import AutoTokenizer, AutoModel
+from sklearn.linear_model import LogisticRegression
+import joblib
+from time import time
+dict = {0: 'Нейтральный', 1: 'Положительный', 2: 'Отрицательный'}
+def preprocess_bert(text):
+    start_time = time()
+    tokenizer = AutoTokenizer.from_pretrained("cointegrated/rubert-tiny2")
+    model = AutoModel.from_pretrained("cointegrated/rubert-tiny2")
+    t = tokenizer(text, padding=True, truncation=True, return_tensors='pt')
+    with torch.no_grad():
+        model_output = model(**{k: v.to(model.device) for k, v in t.items()})
+    embeddings = model_output.last_hidden_state[:, 0, :]
+    embeddings = torch.nn.functional.normalize(embeddings)
+    embeddings = embeddings.detach().cpu().numpy()
+    lr = LogisticRegression()
+    lr = joblib.load('model/lr_weights.pkl')
+    # with open('model/lr_weights.pkl', 'rb') as f:
+    #     lr = pickle.load(f)
+    predicted_label = lr.predict(embeddings)
+    predicted_label_text = dict[predicted_label[0]]
+    end_time = time()
+    inference_time = end_time - start_time
+    return f"***{predicted_label_text}***, время предсказания: ***{inference_time:.4f} сек***."

model/embedding_matrix.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0b8025aae0f6b8a31730a4cdb9095a51e33a4a1f8657a326e898e7c8f3e67007
+size 278827972

model/logistic_regression_weights.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:12241487451736eb9e5305e4ce317ee3c76d12be8498cecbb5c33ebeab995036
+size 120750

model/lr_weights.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:46e799a83602c0ee314840d648ce76b41c9ee18e6f03058f50df62a35a868650
+size 8367

model/lstm_att_weight.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6983922dd858d31e89d5e55e8e02f6a812e013b13202f5042bdc7026ba5134db
+size 139823799

model/ltsm_att.py ADDED Viewed

	@@ -0,0 +1,99 @@

+import json
+import numpy as np
+from gensim.models import Word2Vec
+import torch
+from torch.utils.data import DataLoader, TensorDataset
+import torch.nn.functional as F
+import torch.nn as nn
+import torchutils as tu
+from torchmetrics import Accuracy
+from torchmetrics.functional import f1_score
+from string import punctuation
+import time
+with open('model/word_dict.json', 'r') as fp:
+    vocab_to_int = json.load(fp)
+wv = Word2Vec.load("model/word2vec_for_ltsm.model")
+VOCAB_SIZE = len(vocab_to_int)+1
+HIDDEN_SIZE = 128
+SEQ_LEN = 128
+DEVICE='cpu'
+EMBEDDING_DIM = 128
+embedding_matrix = torch.load('model/embedding_matrix.pt')
+embedding_layer = torch.nn.Embedding.from_pretrained(torch.FloatTensor(embedding_matrix))
+class ConcatAttention(nn.Module):
+    def __init__(
+            self,
+            hidden_size: torch.Tensor = HIDDEN_SIZE
+            ) -> None:
+        super().__init__()
+        self.hidden_size = hidden_size
+        self.linear = nn.Linear(hidden_size, hidden_size)
+        self.align  = nn.Linear(hidden_size * 2, hidden_size)
+        self.tanh   = nn.Tanh()
+    def forward(
+            self,
+            lstm_outputs: torch.Tensor, # BATCH_SIZE x SEQ_LEN x HIDDEN_SIZE
+            final_hidden: torch.Tensor  # BATCH_SIZE x HIDDEN_SIZE
+            ) -> tuple[torch.Tensor]:
+        att_weights = self.linear(lstm_outputs)
+        att_weights = torch.bmm(att_weights, final_hidden.unsqueeze(2))
+        att_weights = F.softmax(att_weights.squeeze(2), dim=1)
+        cntxt       = torch.bmm(lstm_outputs.transpose(1, 2), att_weights.unsqueeze(2))
+        concatted   = torch.cat((cntxt, final_hidden.unsqueeze(2)), dim=1)
+        att_hidden  = self.tanh(self.align(concatted.squeeze(-1)))
+        return att_hidden, att_weights
+# Review classifier: pretrained embeddings -> LSTM -> ConcatAttention -> small MLP head
+# with 3 output logits. Attribute names must stay as they are: the saved state_dict
+# loaded later in this module is keyed by them.
+class LSTMConcatAttention(nn.Module):
+    def __init__(self) -> None:
+        super().__init__()
+        # Shared module-level layer built with Embedding.from_pretrained from the saved matrix.
+        self.embedding = embedding_layer
+        # batch_first=True: inputs and outputs are laid out as (batch, seq, feature).
+        self.lstm = nn.LSTM(EMBEDDING_DIM, HIDDEN_SIZE, batch_first=True)
+        self.attn = ConcatAttention(HIDDEN_SIZE)
+        # Classification head mapping the attended hidden state to 3 class logits.
+        self.clf = nn.Sequential(
+            nn.Linear(HIDDEN_SIZE, 128),
+            nn.Dropout(),
+            nn.Tanh(),
+            nn.Linear(128, 3)
+        )
+    # x: integer token ids — assumes shape (batch, seq_len), as produced by `pred`; TODO confirm
+    # for other callers. Returns (logits, attention weights).
+    def forward(self, x):
+        embeddings = self.embedding(x)
+        # The cell state is not needed; only the final hidden state feeds the attention.
+        outputs, (h_n, _) = self.lstm(embeddings)
+        # squeeze(0) drops the leading axis of h_n (presumably size 1 for this LSTM configuration).
+        att_hidden, att_weights = self.attn(outputs, h_n.squeeze(0))
+        out = self.clf(att_hidden)
+        return out, att_weights
+model_concat = LSTMConcatAttention()
+model_concat.load_state_dict(torch.load('model/lstm_att_weight.pt', map_location='cpu'))
+model_concat.eval()
+def pred(text):
+    start_time = time.time()
+    text = text.lower()
+    text = ''.join([c for c in text if c not in punctuation])
+    text = [vocab_to_int[word] for word in text.split() if vocab_to_int.get(word)]
+    if len(text) <= 128:
+        zeros = list(np.zeros(128 - len(text)))
+        text = zeros + text
+    else:
+        text = text[: 128]
+    text = torch.Tensor(text)
+    text = text.unsqueeze(0)
+    text = text.type(torch.LongTensor)
+    # print(text.shape)
+    pred = model_concat(text)[0].argmax(1)
+    labels = {0: 'Негативный', 1:'Позитивный', 2:'Нейтральный'}
+    end_time = time.time()
+    inference_time = end_time - start_time
+    # return labels[pred.item()], inference_time
+    return f"***{labels[pred.item()]}***, время предсказания: ***{inference_time:.4f} сек***."

model/ml.py ADDED Viewed

	@@ -0,0 +1,36 @@

+import streamlit as st
+import numpy as np
+import joblib
+import time
+from sklearn.feature_extraction.text import TfidfVectorizer
+from sklearn.linear_model import LogisticRegression
+import time
+import pandas as pd
+import joblib
+model_ml = LogisticRegression()
+vectorizer = joblib.load("model/tf-idf.pkl")
+def preprocess(text):
+    # Убедитесь, что text - это список
+    if isinstance(text, str):
+        text = [text]
+    # Преобразуйте текст
+    text = vectorizer.transform(text)
+    return text
+model = model_ml
+model = joblib.load("model/logistic_regression_weights.pkl")
+def predict(text):
+    start_time = time.time()
+    text = preprocess(text)
+    predicted_label = model.predict(text)
+    dict = {'Bad': 'Отрицательный', 'Neutral': 'Нейтральный', 'Good': 'Положительный'}
+    predicted_label_text = dict[predicted_label[0]]
+    end_time = time.time()
+    inference_time = end_time - start_time
+    return f"***{predicted_label_text}***, время предсказания: ***{inference_time:.4f} сек***."

model/rubert_tiny_toxicity_tokenizer_weights.pt/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b6d346be366a7d1d48332dbc9fdf3bf8960b5d879522b7799ddba59e76237ee3
+size 125

model/rubert_tiny_toxicity_tokenizer_weights.pt/tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:064a132db204e46351abb4c3acb9da22fc4a837390be3b87877e79212e10dffa
+size 705727

model/rubert_tiny_toxicity_tokenizer_weights.pt/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7160a114cff6faf66cd441ceaaf0dd32964ecd8c4933679247b596cd1a7125b3
+size 1343

model/rubert_tiny_toxicity_tokenizer_weights.pt/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

model/rubert_tiny_toxicity_weights.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7e02ce2bbd1611e3eb07ba3735710fb81b8dcf120223e987897f0d87c0525f5
+size 47165548

model/tf-idf.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a13623e7dcb541282d1c3807bcc21ec7fa2e3c551d91bc557a6977e069c9eef9
+size 1539730

model/word2vec_for_ltsm.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c8f7fdcfe5bb9b680626007980139e21fe3dec2408c1ee0e34c96ba5af1b7259
+size 2182195

model/word_dict.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9cc11db4510ff54d488abaae9613aa1dd3e976dc2db3c334a1a915cfdfc52f1f
+size 17951147

pages/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

pages/01_🎞️_Kinootzovik.py ADDED Viewed

	@@ -0,0 +1,38 @@

+import streamlit as st
+import pandas as pd
+from model.bert import preprocess_bert
+from model.ml import predict
+# from model.rnn import pred
+from model.ltsm_att import pred
+"""
+## Классификация киноотзывов
+"""
+st.image('images/kino.png')
+st.sidebar.header('Панель инструментов :gear:')
+text = st.text_area('Поле для ввода отзыва', height=300)
+with st.sidebar:
+    choice_model = st.radio('Выберите модель:', options=['ML-TFIDF', 'RuBert', 'LSTM(attention)'])
+if choice_model == 'RuBert':
+    if text:
+        st.write(preprocess_bert(text))
+if choice_model == 'ML-TFIDF':
+    if text:
+        st.write(predict(text))
+if choice_model == 'LSTM(attention)':
+    if text:
+        st.write(pred(text))
+data = pd.DataFrame({'Модель': ['ML-TFIDF-LogReg', 'RNN', 'RuBert-tiny2-LogReg'], 'F1-macro': [0.65, 0.57, 0.62]})
+# Вывод таблицы
+checkbox = st.sidebar.checkbox("Таблица f1-macro")
+if checkbox:
+    st.write("<h1 style='text-align: center; font-size: 20pt;'>Оценка качества моделей по метрике f1-macro</h1>", unsafe_allow_html=True)
+    st.table(data)

pages/02_🤖_Toxicity.py ADDED Viewed

	@@ -0,0 +1,56 @@

+import torch
+from transformers import AutoTokenizer, AutoModelForSequenceClassification
+import streamlit as st
+import pandas as pd
+import os
+model_checkpoint = 'cointegrated/rubert-tiny-toxicity'
+tokenizer = AutoTokenizer.from_pretrained(model_checkpoint)
+model = AutoModelForSequenceClassification.from_pretrained(model_checkpoint)
+if torch.cuda.is_available():
+    model.cuda()
+# Сохранение весов модели
+model_weights_filename = "model/rubert_tiny_toxicity_weights.pt"
+torch.save(model.state_dict(), model_weights_filename)
+# Сохранение весов токенизатора
+tokenizer_weights_filename = "model/rubert_tiny_toxicity_tokenizer_weights.pt"
+tokenizer.save_pretrained(tokenizer_weights_filename)
+def text2toxicity(text, aggregate=False):
+    """ Calculate toxicity of a text (if aggregate=True) or a vector of toxicity aspects (if aggregate=False)"""
+    with torch.no_grad():
+        inputs = tokenizer(text, return_tensors='pt', truncation=True, padding=True).to(model.device)
+        proba = torch.sigmoid(model(**inputs).logits).cpu().numpy()
+    if isinstance(text, str):
+        proba = proba[0]
+    if aggregate:
+        return 1 - proba.T[0] * (1 - proba.T[-1])
+    return proba
+"""
+## Оценка степени токсичности сообщения
+"""
+st.image('images/toxy.png')
+# Ввод предложения от пользователя
+input_text = st.text_area("Введите предложение:", height=100)
+# Обработка входных данных через модель
+if input_text:
+    # Вывод результатов
+    my_dict = {
+    'Не токсичный': (text2toxicity(input_text, False))[0],
+    'Оскорбление': (text2toxicity(input_text, False))[1],
+    'Непристойность': (text2toxicity(input_text, False))[2],
+    'Угроза': (text2toxicity(input_text, False))[3],
+    'Опасный': (text2toxicity(input_text, False))[4]
+}
+    # my_dict['index'] = 'your_index_value'
+    # st.write({text2toxicity(input_text, False)[0]: 'non-toxic'})
+    df = pd.DataFrame(my_dict, index=['вероятности'])
+    st.dataframe(df)
+    st.write(f'Вероятность токсичного комментария {text2toxicity(input_text, True)}')

pages/03_🔥_Results.py ADDED Viewed

	@@ -0,0 +1,69 @@

+import streamlit as st
+from PIL import Image
+import matplotlib.pyplot as plt
+st.write("""
+ ## 📝 Итоги.
+""")
+"""
+### 1. Классификация киноотзывов
+Датасет для обучения оказался крайне несбалансированным, отзывы разделены на три класса: Нейтральный, \
+  Положительный, Отрицательный
+"""
+st.image('images/classes.png')
+'''
+\n Датасет был поделен на три выборки:
+'''
+st.text('Тренировочный сет - 21954 отзывов')
+st.text('Валидационный сет - 8782 отзывов')
+st.text('Тестовый сет - 5855 отзывов')
+"""
+##### 1. Rubert-tiny2, модель-классификатор: LogisticRegression
+"""
+"""
+Была проведена балансировка классов в тренировочном наборе методом Oversampling(RandomOverSampler). На скорость обучения повлияла \
+  максимальная длина твита после токенизации в train, MAX_LEN = 4548, она была ограничена 1024 в виду возможностей производительности \
+  системы. Классификатором была выбрана LogisticRegression, также исходя из скорости обучения.
+  \n ##### Classification Report:
+"""
+st.image('images/classification_report.png')
+"""
+Метрика качества f1-macro показала наилучший результат 0.62
+"""
+"""
+##### 2.  ML-алгоритм, обученный на TF-IDF представлении, модель-классификатор: LogisticRegression
+"""
+"""
+Прежде всего для этого алгоритма был проведена предобработки текста, а именно очистка текста от лишних символов, \
+  лемматизация текста, затем, была проведена балансировка классов в тренировочном наборе методом Oversampling(SMOTE). \
+  Для TfidfVectorizer был указан параметр max_features=5000, т.е. было выбрано максимальное количество признаков \
+    (слов или термов), которые были учтены при создании матрицы TF-IDF. Классификатором была выбрана LogisticRegression, \
+        исходя из скорости обучения.
+  \n Метрика качества f1-macro показала наилучший результат 0.65
+"""
+"""
+##### 3.  Модель на основе LTSM
+"""
+"""
+Предобработка текста осуществлялась аналогичным с предыдущими моделями способом, для обеспечения сравнимых результатов \
+  Векторизация текста проводилась с помощью Word2Vec, встроенного в модель. Модель обрабатывала текст через \
+  LTSM слои, были выбраны значения hidden_size 128, embedding_dim 128. В модели также применялся механизм \
+    Attention. Классификация производилась внутри модели полносвязными слоями.
+  \n Метрика качества f1-macro в конце обучения составила 0.57
+"""
+"""
+### 2. Оценка степени токсичности пользовательского сообщения
+Задача была решена с помощью модели [rubert-tiny-toxicity](https://huggingface.co/cointegrated/rubert-tiny-toxicity), \
+  доработанной для классификации токсичности и неуместности коротких неофициальных текстов на русском языке, \
+    таких как комментарии в социальных сетях.
+  \n  Датасет: 14412 сообщений из соцсетей, разделенных на два класса: токсичные и не токсичные. Токсичные \
+    преимущественно наполнены оскорбительной и нецензурной лексикой.
+"""

pages/__init__.py ADDED Viewed

File without changes

pages/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (203 Bytes). View file

requirements.txt ADDED Viewed

	@@ -0,0 +1,221 @@

+absl-py==2.0.0
+aiofiles==23.1.0
+aiogram==3.1.1
+aiohttp==3.8.6
+aiosignal==1.3.1
+altair==5.1.2
+annotated-types==0.6.0
+anyio==4.0.0
+appdirs==1.4.4
+appnope==0.1.3
+argon2-cffi==23.1.0
+argon2-cffi-bindings==21.2.0
+arrow==1.3.0
+asttokens==2.4.1
+astunparse==1.6.3
+async-lru==2.0.4
+async-timeout==4.0.3
+attrs==23.1.0
+Babel==2.13.1
+beautifulsoup4==4.12.2
+black==23.11.0
+bleach==6.1.0
+blinker==1.7.0
+cachetools==5.3.2
+certifi==2023.7.22
+cffi==1.16.0
+charset-normalizer==3.3.2
+click==8.1.7
+comm==0.2.0
+contourpy==1.2.0
+cycler==0.12.1
+debugpy==1.8.0
+decorator==5.1.1
+defusedxml==0.7.1
+exceptiongroup==1.1.3
+executing==2.0.1
+fastjsonschema==2.19.0
+filelock==3.13.1
+flatbuffers==23.5.26
+fonttools==4.44.0
+fqdn==1.5.1
+frozendict==2.3.8
+frozenlist==1.4.0
+fsspec==2023.10.0
+gast==0.5.4
+gensim==4.3.2
+gitdb==4.0.11
+GitPython==3.1.40
+google-auth==2.25.1
+google-auth-oauthlib==1.1.0
+google-pasta==0.2.0
+grpcio==1.59.3
+h5py==3.10.0
+html5lib==1.1
+huggingface-hub==0.19.4
+idna==3.4
+imageio==2.31.6
+importlib-metadata==6.8.0
+ipykernel==6.26.0
+ipython==8.17.2
+ipywidgets==8.1.1
+isoduration==20.11.0
+jedi==0.19.1
+Jinja2==3.1.2
+joblib==1.3.2
+json5==0.9.14
+jsonpointer==2.4
+jsonschema==4.19.2
+jsonschema-specifications==2023.7.1
+jupyter==1.0.0
+jupyter-console==6.6.3
+jupyter-events==0.9.0
+jupyter-lsp==2.2.0
+jupyter_client==8.6.0
+jupyter_core==5.5.0
+jupyter_server==2.10.1
+jupyter_server_terminals==0.4.4
+jupyterlab==4.0.9
+jupyterlab-pygments==0.2.2
+jupyterlab-widgets==3.0.9
+jupyterlab_code_formatter==2.2.1
+jupyterlab_commands==0.4.0
+jupyterlab_server==2.25.2
+keras==2.15.0
+kiwisolver==1.4.5
+lazy_loader==0.3
+libclang==16.0.6
+lightning-utilities==0.10.0
+lxml==4.9.3
+magic-filter==1.0.12
+Markdown==3.5.1
+markdown-it-py==3.0.0
+MarkupSafe==2.1.3
+matplotlib==3.8.1
+matplotlib-inline==0.1.6
+mdurl==0.1.2
+mistune==3.0.2
+ml-dtypes==0.2.0
+mplcyberpunk==0.7.0
+mpmath==1.3.0
+multidict==6.0.4
+multitasking==0.0.11
+mypy-extensions==1.0.0
+nbclient==0.9.0
+nbconvert==7.11.0
+nbformat==5.9.2
+nest-asyncio==1.5.8
+networkx==3.2.1
+nltk==3.8.1
+notebook==7.0.6
+notebook_shim==0.2.3
+numpy==1.26.1
+oauthlib==3.2.2
+opencv-contrib-python==4.8.1.78
+opencv-python==4.8.1.78
+opt-einsum==3.3.0
+overrides==7.4.0
+packaging==23.2
+pandas==2.1.2
+pandocfilters==1.5.0
+parso==0.8.3
+pathspec==0.11.2
+patsy==0.5.3
+peewee==3.17.0
+pexpect==4.8.0
+Pillow==10.0.1
+platformdirs==4.0.0
+plotly==5.18.0
+plotly-express==0.4.1
+prometheus-client==0.18.0
+prompt-toolkit==3.0.41
+protobuf==4.23.4
+psutil==5.9.6
+ptyprocess==0.7.0
+pure-eval==0.2.2
+py-cpuinfo==9.0.0
+pyarrow==14.0.0
+pyasn1==0.5.1
+pyasn1-modules==0.3.0
+pycparser==2.21
+pydantic==2.3.0
+pydantic_core==2.6.3
+pydeck==0.8.1b0
+Pygments==2.16.1
+pyparsing==3.1.1
+python-dateutil==2.8.2
+python-json-logger==2.0.7
+pytz==2023.3.post1
+PyYAML==6.0.1
+pyzmq==25.1.1
+qtconsole==5.5.1
+QtPy==2.4.1
+referencing==0.30.2
+regex==2023.10.3
+requests==2.31.0
+requests-oauthlib==1.3.1
+rfc3339-validator==0.1.4
+rfc3986-validator==0.1.1
+rich==13.6.0
+rpds-py==0.10.6
+rsa==4.9
+safetensors==0.4.1
+scikit-image==0.22.0
+scikit-learn==1.3.2
+scipy==1.11.3
+seaborn==0.13.0
+Send2Trash==1.8.2
+shortcuts==0.11.0
+six==1.16.0
+smart-open==6.4.0
+smmap==5.0.1
+sniffio==1.3.0
+soupsieve==2.5
+stack-data==0.6.3
+statsmodels==0.14.0
+streamlit==1.28.1
+sympy==1.12
+tenacity==8.2.3
+tensorboard==2.15.1
+tensorboard-data-server==0.7.2
+tensorflow==2.15.0
+tensorflow-estimator==2.15.0
+tensorflow-io-gcs-filesystem==0.34.0
+tensorflow-macos==2.15.0
+termcolor==2.4.0
+terminado==0.18.0
+thop==0.1.1.post2209072238
+threadpoolctl==3.2.0
+tifffile==2023.9.26
+tinycss2==1.2.1
+tokenizers==0.15.0
+toml==0.10.2
+tomli==2.0.1
+toolz==0.12.0
+torch==2.1.1
+torchmetrics==1.2.1
+torchutils==0.0.4
+torchview==0.2.6
+torchvision==0.16.1
+tornado==6.3.3
+tqdm==4.66.1
+traitlets==5.13.0
+transformers==4.35.2
+types-python-dateutil==2.8.19.14
+typing_extensions==4.7.1
+tzdata==2023.3
+tzlocal==5.2
+ultralytics==8.0.216
+uri-template==1.3.0
+urllib3==2.0.7
+validators==0.22.0
+wcwidth==0.2.10
+webcolors==1.13
+webencodings==0.5.1
+websocket-client==1.6.4
+Werkzeug==3.0.1
+widgetsnbextension==4.0.9
+wrapt==1.14.1
+yarl==1.9.2
+yfinance==0.2.31
+zipp==3.17.0