danicafisher committed on
Commit
2edf59a
1 Parent(s): 88077c1

Updates for openai

Browse files
Files changed (2) hide show
  1. app.py +6 -13
  2. requirements.txt +2 -1
app.py CHANGED
@@ -7,21 +7,16 @@ from aimakerspace.openai_utils.prompts import (
7
  )
8
  # from aimakerspace.openai_utils.embedding import EmbeddingModel
9
  from aimakerspace.vectordatabase import VectorDatabase
10
- from aimakerspace.openai_utils.chatmodel import ChatOpenAI
11
  import chainlit as cl
12
  # import asyncio
13
  import nest_asyncio
14
  nest_asyncio.apply()
15
  from langchain_community.document_loaders import PyMuPDFLoader
16
  from langchain_text_splitters import RecursiveCharacterTextSplitter
17
- from langchain_community.embeddings import OpenAIEmbeddings
18
 
19
 
20
- # pdf_loader_NIST = PDFFileLoader("data/NIST.AI.600-1.pdf")
21
- # pdf_loader_Blueprint = PDFFileLoader("data/Blueprint-for-an-AI-Bill-of-Rights.pdf")
22
- # documents_NIST = pdf_loader_NIST.load_documents()
23
- # documents_Blueprint = pdf_loader_Blueprint.load_documents()
24
-
25
  filepath_NIST = "data/NIST.AI.600-1.pdf"
26
  filepath_Blueprint = "data/Blueprint-for-an-AI-Bill-of-Rights.pdf"
27
 
@@ -30,10 +25,6 @@ documents_Blueprint = PyMuPDFLoader(filepath_Blueprint).load()
30
  documents = documents_NIST + documents_Blueprint
31
 
32
 
33
- # text_splitter = CharacterTextSplitter()
34
- # split_documents_NIST = text_splitter.split_texts(documents_NIST)
35
- # split_documents_Blueprint = text_splitter.split_texts(documents_Blueprint)
36
-
37
  text_splitter = RecursiveCharacterTextSplitter(
38
  chunk_size = 500,
39
  chunk_overlap = 50
@@ -101,12 +92,14 @@ async def start_chat():
101
  # vector_db = await vector_db.abuild_from_list(split_documents_NIST)
102
  # vector_db = await vector_db.abuild_from_list(split_documents_Blueprint)
103
 
104
- chat_openai = ChatOpenAI()
 
 
105
 
106
  # Create a chain
107
  retrieval_augmented_qa_pipeline = RetrievalAugmentedQAPipeline(
108
  vector_db_retriever=vector_db,
109
- llm=chat_openai
110
  )
111
 
112
  # cl.user_session.set("settings", settings)
 
7
  )
8
  # from aimakerspace.openai_utils.embedding import EmbeddingModel
9
  from aimakerspace.vectordatabase import VectorDatabase
10
+ # from aimakerspace.openai_utils.chatmodel import ChatOpenAI
11
  import chainlit as cl
12
  # import asyncio
13
  import nest_asyncio
14
  nest_asyncio.apply()
15
  from langchain_community.document_loaders import PyMuPDFLoader
16
  from langchain_text_splitters import RecursiveCharacterTextSplitter
17
+ from langchain_openai import ChatOpenAI, OpenAIEmbeddings
18
 
19
 
 
 
 
 
 
20
  filepath_NIST = "data/NIST.AI.600-1.pdf"
21
  filepath_Blueprint = "data/Blueprint-for-an-AI-Bill-of-Rights.pdf"
22
 
 
25
  documents = documents_NIST + documents_Blueprint
26
 
27
 
 
 
 
 
28
  text_splitter = RecursiveCharacterTextSplitter(
29
  chunk_size = 500,
30
  chunk_overlap = 50
 
92
  # vector_db = await vector_db.abuild_from_list(split_documents_NIST)
93
  # vector_db = await vector_db.abuild_from_list(split_documents_Blueprint)
94
 
95
+ # chat_openai = ChatOpenAI()
96
+ llm = ChatOpenAI(model="gpt-4o-mini", tags=["base_llm"])
97
+
98
 
99
  # Create a chain
100
  retrieval_augmented_qa_pipeline = RetrievalAugmentedQAPipeline(
101
  vector_db_retriever=vector_db,
102
+ llm=llm
103
  )
104
 
105
  # cl.user_session.set("settings", settings)
requirements.txt CHANGED
@@ -5,4 +5,5 @@ PyPDF2
5
  pymupdf
6
  langchain
7
  langchain-community
8
- langchain-text-splitters
 
 
5
  pymupdf
6
  langchain
7
  langchain-community
8
+ langchain-text-splitters
9
+ langchain-openai