devve1 committed
Commit 8487529
1 Parent(s): ada35d6

Update app.py

Files changed (1):
  1. app.py +11 -9
app.py CHANGED
@@ -16,6 +16,7 @@ import numpy as np
 import pandas as pd
 import streamlit as st
 from vllm import LLM
+from json import pyjson
 from numpy import ndarray
 from datetime import datetime
 from typing import List, Dict
@@ -72,7 +73,8 @@ from qdrant_client.models import (
 global_state_documents_only = False
 
 class Question(BaseModel):
-    answer: str = Field(..., description='Answer to the Query')
+    answer: str
+schema = pyjson.dumps(Question.model_json_schema())
 
 icon_to_types = {
  'ppt':('data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAADAAAAAwCAYAAABXAvmHAAAACXBIWXMAAAsTAAALEwEAmpwYAAAC4ElEQVR4nO2YS2gTQRzGF/VgPVuPpsXSQ3eshdbXqVDMEtlN1UN8HqTZYouCVJTsiIfgTcWbD0o0mp3GKq1oC55E2AbbKn3dakISCVjwUNtLlZ1a24xs0oqG2uxmJ2si+8F32NnL95v/fx67DGPLli1b/5UUkauJtDsvDHm5XkXkphSvc17xcksqgksYSXMYwSksS71Yhudx6MouphSk+Ju3RLzcGUV0jg6JHFnPGMH1LcMRVZZOkz7P5n8TXuRcisjF/xY8LwDKWpVhDIcgZ1nwiXPCNkXkHuYLrhcAr4EgKUD6LlUUNfxIp3OHIjon9YY3AoCzHl8IXq0sWvgh0RkzEr4AAKK1FHWIbNsYm/lCAfBqJchj/1ZqAEZ6nhIAURHsNhQy0OToCjQ5vj1ochAzDu6vJgOte00DYATJYsh32AiA6fC/Q9AAUJEU1X1O0Aq/ZhoAOAPhO1nWABhJw2UNoMowjdG16oIBcrWy/IPMx6Pk9eV2iyoACQ75OkwDxF4+JdEXT8jMaCTznF5ZJoNtR60BkKWwaYDgwZpfY/FXzzNj0/3IGgAEJ6gCjN29ma3KwDOLAKRZ0wBhrpGglnoy2HaMLHyeyYy98XVaAqAiuGgaIFcf+ns2XMRJAdD0ommA8Xu3yNidG+Td7etk4Gxr3m2ULgA7S3UN6DFlgIlyB+gpcwBQ+EFWqGmFTwggnTqyp6p8AXjwNm/4kgZwg+N6Ab7SCv9oXxUdAB5ME4/eD5rGnRdpQGjhIy21dADcdS0MDSUFEKC8qxAdi/c+Q0ufPAcqEjw7biHA+1Szg95vFU1xV0NlgmdjRZ95no3GhNrtVMP/CQHGijnzcVdDcX4t5rRTdzF6PkW7bTbSR373Ia3cpsPzYJrabmNU2h6ddNedSvBgWDvyDcx2WjthEwJ7gviZTUwpKOaur9YuXQmBDSd5djLJg7kkD76v+ot2Jc68E0CHrruNLVu2bDGlrJ8c/urSuEn7XgAAAABJRU5ErkJggg==',
@@ -224,8 +226,9 @@ def main(query: str, client: QdrantClient, collection_name: str, llm, dense_mode
 
     context = "\n".join(contents)
     print(f'Context : \n + {context}')
-
-    gen_text = outlines.generate.json(llm, Question, whitespace_pattern=r"[\n ]?")
+
+    regex = build_regex_from_schema(schema, r"[\n ]?")
+    gen_text = outlines.generate.regex(llm, regex)
 
     gen_choice = outlines.generate.choice(llm, choices=['Yes', 'No'])
     prompt = route_llm(context, query)
@@ -242,9 +245,8 @@ def main(query: str, client: QdrantClient, collection_name: str, llm, dense_mode
     result_metadatas = "\n\n".join(f'{value}' for value in filtered_metadatas)
 
     prompt = answer_with_context(context, query)
-    answer = gen_text(prompt, max_tokens=300, sampling_params=SamplingParams(temperature=0))
-    print(f'Asnwer : {answer}')
-    answer = f"{answer.answer}\n\n\nSource(s) :\n\n{result_metadatas}"
+    answer = json.loads(gen_text(prompt, max_tokens=300, sampling_params=SamplingParams(temperature=0)))['answer']
+    answer = f"{answer}\n\n\nSource(s) :\n\n{result_metadatas}"
 
     if not st.session_state.documents_only:
         answer = f'Documents Based :\n\n{answer}'
@@ -255,15 +257,15 @@ def main(query: str, client: QdrantClient, collection_name: str, llm, dense_mode
     print(f'Choice 2: {action}')
     if action == 'General Question':
         prompt = open_query_prompt(past_messages, query)
-        answer = gen_text(prompt, max_tokens=300, sampling_params=SamplingParams(temperature=0.6, top_p=0.9, top_k=10)).answer
+        answer = json.loads(gen_text(prompt, max_tokens=300, sampling_params=SamplingParams(temperature=0.6, top_p=0.9, top_k=10)))['answer']
     else:
         print(f'GLOBAL STATE : {global_state_documents_only}')
         if global_state_documents_only:
             prompt = idk(query)
-            answer = gen_text(prompt, max_tokens=128, sampling_params=SamplingParams(temperature=0.6, top_p=0.9, top_k=10)).answer
+            answer = json.loads(gen_text(prompt, max_tokens=128, sampling_params=SamplingParams(temperature=0.6, top_p=0.9, top_k=10)))['answer']
         else:
             prompt = self_knowledge(query)
-            answer = gen_text(prompt, max_tokens=300, sampling_params=SamplingParams(temperature=0.6, top_p=0.9, top_k=10)).answer
+            answer = json.loads(gen_text(prompt, max_tokens=300, sampling_params=SamplingParams(temperature=0.6, top_p=0.9, top_k=10)))['answer']
         answer = f'Internal Knowledge :\n\n{answer}'
 
     torch.cuda.empty_cache()
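For readers following the change: the old code asked outlines to build a JSON-constrained generator directly from the Pydantic model (`outlines.generate.json(llm, Question, ...)`) and got back a parsed `Question` object, while the new code serializes the schema once, compiles it to a regex with `build_regex_from_schema`, constrains generation with `outlines.generate.regex`, and parses the returned JSON string itself. Below is a minimal sketch of that path, not the app's code: the import path `outlines.fsm.json_schema` and the tiny placeholder model are assumptions, and the standard `json` module is used instead of the `pyjson` alias imported in the commit.

```python
# Hedged sketch of the regex-constrained JSON path, under the assumptions above.
import json

from outlines import generate, models
from outlines.fsm.json_schema import build_regex_from_schema  # assumed import path
from pydantic import BaseModel


class Question(BaseModel):
    answer: str


# Serialize the schema once at import time, as the commit does.
schema = json.dumps(Question.model_json_schema())

# Compile a regex matching any JSON object valid against the schema;
# the whitespace pattern allows at most one newline or space between tokens.
regex = build_regex_from_schema(schema, whitespace_pattern=r"[\n ]?")

# Placeholder model purely so the sketch runs; the app passes its vLLM `LLM` instance.
llm = models.transformers("gpt2")
gen_text = generate.regex(llm, regex)

raw = gen_text("Reply as JSON: what does RAG stand for?", max_tokens=300)
print(json.loads(raw)["answer"])  # the regex generator returns a string, not a Question
```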
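The call sites change accordingly: where the old generator returned an object with an `.answer` attribute, the new one returns raw JSON, so every call is now wrapped in `json.loads(...)['answer']`. A small hypothetical helper (the name `generate_answer` is made up) that mirrors the two `SamplingParams` configurations visible in the diff, assuming the generator accepts vLLM's `sampling_params` pass-through as the app's calls do:

```python
# Hypothetical wrapper around the constrained generator built above; `gen_text`
# and the sampling_params pass-through mirror the calls shown in the diff.
import json

from vllm import SamplingParams


def generate_answer(gen_text, prompt: str, deterministic: bool = True,
                    max_tokens: int = 300) -> str:
    # Greedy decoding for document-grounded answers, light sampling otherwise,
    # matching the two configurations used in the commit.
    params = (SamplingParams(temperature=0) if deterministic
              else SamplingParams(temperature=0.6, top_p=0.9, top_k=10))
    raw = gen_text(prompt, max_tokens=max_tokens, sampling_params=params)
    return json.loads(raw)["answer"]
```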