Spaces:
Sleeping
Sleeping
danicafisher
committed on
Commit
•
2edf59a
1
Parent(s):
88077c1
Updates for openai
Browse files
- app.py +6 -13
- requirements.txt +2 -1
app.py
CHANGED
@@ -7,21 +7,16 @@ from aimakerspace.openai_utils.prompts import (
|
|
7 |
)
|
8 |
# from aimakerspace.openai_utils.embedding import EmbeddingModel
|
9 |
from aimakerspace.vectordatabase import VectorDatabase
|
10 |
-
from aimakerspace.openai_utils.chatmodel import ChatOpenAI
|
11 |
import chainlit as cl
|
12 |
# import asyncio
|
13 |
import nest_asyncio
|
14 |
nest_asyncio.apply()
|
15 |
from langchain_community.document_loaders import PyMuPDFLoader
|
16 |
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
17 |
-
from
|
18 |
|
19 |
|
20 |
-
# pdf_loader_NIST = PDFFileLoader("data/NIST.AI.600-1.pdf")
|
21 |
-
# pdf_loader_Blueprint = PDFFileLoader("data/Blueprint-for-an-AI-Bill-of-Rights.pdf")
|
22 |
-
# documents_NIST = pdf_loader_NIST.load_documents()
|
23 |
-
# documents_Blueprint = pdf_loader_Blueprint.load_documents()
|
24 |
-
|
25 |
filepath_NIST = "data/NIST.AI.600-1.pdf"
|
26 |
filepath_Blueprint = "data/Blueprint-for-an-AI-Bill-of-Rights.pdf"
|
27 |
|
@@ -30,10 +25,6 @@ documents_Blueprint = PyMuPDFLoader(filepath_Blueprint).load()
|
|
30 |
documents = documents_NIST + documents_Blueprint
|
31 |
|
32 |
|
33 |
-
# text_splitter = CharacterTextSplitter()
|
34 |
-
# split_documents_NIST = text_splitter.split_texts(documents_NIST)
|
35 |
-
# split_documents_Blueprint = text_splitter.split_texts(documents_Blueprint)
|
36 |
-
|
37 |
text_splitter = RecursiveCharacterTextSplitter(
|
38 |
chunk_size = 500,
|
39 |
chunk_overlap = 50
|
@@ -101,12 +92,14 @@ async def start_chat():
|
|
101 |
# vector_db = await vector_db.abuild_from_list(split_documents_NIST)
|
102 |
# vector_db = await vector_db.abuild_from_list(split_documents_Blueprint)
|
103 |
|
104 |
-
chat_openai = ChatOpenAI()
|
|
|
|
|
105 |
|
106 |
# Create a chain
|
107 |
retrieval_augmented_qa_pipeline = RetrievalAugmentedQAPipeline(
|
108 |
vector_db_retriever=vector_db,
|
109 |
-
llm=chat_openai
|
110 |
)
|
111 |
|
112 |
# cl.user_session.set("settings", settings)
|
|
|
7 |
)
|
8 |
# from aimakerspace.openai_utils.embedding import EmbeddingModel
|
9 |
from aimakerspace.vectordatabase import VectorDatabase
|
10 |
+
# from aimakerspace.openai_utils.chatmodel import ChatOpenAI
|
11 |
import chainlit as cl
|
12 |
# import asyncio
|
13 |
import nest_asyncio
|
14 |
nest_asyncio.apply()
|
15 |
from langchain_community.document_loaders import PyMuPDFLoader
|
16 |
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
17 |
+
from langchain_openai import ChatOpenAI, OpenAIEmbeddings
|
18 |
|
19 |
|
|
|
|
|
|
|
|
|
|
|
20 |
filepath_NIST = "data/NIST.AI.600-1.pdf"
|
21 |
filepath_Blueprint = "data/Blueprint-for-an-AI-Bill-of-Rights.pdf"
|
22 |
|
|
|
25 |
documents = documents_NIST + documents_Blueprint
|
26 |
|
27 |
|
|
|
|
|
|
|
|
|
28 |
text_splitter = RecursiveCharacterTextSplitter(
|
29 |
chunk_size = 500,
|
30 |
chunk_overlap = 50
|
|
|
92 |
# vector_db = await vector_db.abuild_from_list(split_documents_NIST)
|
93 |
# vector_db = await vector_db.abuild_from_list(split_documents_Blueprint)
|
94 |
|
95 |
+
# chat_openai = ChatOpenAI()
|
96 |
+
llm = ChatOpenAI(model="gpt-4o-mini", tags=["base_llm"])
|
97 |
+
|
98 |
|
99 |
# Create a chain
|
100 |
retrieval_augmented_qa_pipeline = RetrievalAugmentedQAPipeline(
|
101 |
vector_db_retriever=vector_db,
|
102 |
+
llm=llm
|
103 |
)
|
104 |
|
105 |
# cl.user_session.set("settings", settings)
|
requirements.txt
CHANGED
@@ -5,4 +5,5 @@ PyPDF2
|
|
5 |
pymupdf
|
6 |
langchain
|
7 |
langchain-community
|
8 |
-
langchain-text-splitters
|
|
|
|
5 |
pymupdf
|
6 |
langchain
|
7 |
langchain-community
|
8 |
+
langchain-text-splitters
|
9 |
+
langchain-openai
|