devve1 commited on
Commit
2400c5a
1 Parent(s): d26efd6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -9
app.py CHANGED
@@ -13,8 +13,7 @@ from llama_cpp import Llama
13
  from scipy.sparse import csr_matrix, save_npz, load_npz, vstack
14
  from qdrant_client import QdrantClient, models
15
  from langchain_community.document_loaders import WikipediaLoader, WebBaseLoader
16
- from statistical_chunker import StatisticalChunker
17
- from semantic_router.encoders.huggingface import HuggingFaceEncoder
18
  from fastembed.sparse.splade_pp import supported_splade_models
19
  from fastembed import SparseTextEmbedding, SparseEmbedding
20
  from unstructured.partition.auto import partition
@@ -103,7 +102,7 @@ def transform_query(query: str) -> str:
103
  return f'Represent this sentence for searching relevant passages: {query}'
104
 
105
  def main(query: str, client: QdrantClient, collection_name: str, llm, dense_model, sparse_model):
106
- dense_query = list(dense_model(transform_query(query)).cpu().numpy())
107
  sparse_query = list(sparse_model.embed(query, 32))
108
 
109
  search_results = search(
@@ -337,11 +336,6 @@ def chunk_documents(texts, metadatas, dense_model, sparse_model):
337
  breakpoint_threshold_type='standard_deviation'
338
  )
339
 
340
-
341
-
342
-
343
-
344
-
345
  _metadatas = metadatas or [{}] * len(texts)
346
  documents = []
347
  metadatas_docs = []
@@ -359,7 +353,7 @@ def chunk_documents(texts, metadatas, dense_model, sparse_model):
359
  joblib.Parallel(n_jobs=joblib.cpu_count(), verbose=1, require='sharedmem')(
360
  joblib.delayed(create_document)(text, i, _metadatas) for i, text in enumerate(texts))
361
 
362
- dense_embeddings = dense_model.embed(documents).cpu().numpy()
363
  sparse_embeddings = list(sparse_model.embed(documents, 32))
364
 
365
  return documents, metadatas_docs, dense_embeddings, sparse_embeddings
 
13
  from scipy.sparse import csr_matrix, save_npz, load_npz, vstack
14
  from qdrant_client import QdrantClient, models
15
  from langchain_community.document_loaders import WikipediaLoader, WebBaseLoader
16
+ from fastembed_ext import FastEmbedEmbeddingsLc
 
17
  from fastembed.sparse.splade_pp import supported_splade_models
18
  from fastembed import SparseTextEmbedding, SparseEmbedding
19
  from unstructured.partition.auto import partition
 
102
  return f'Represent this sentence for searching relevant passages: {query}'
103
 
104
  def main(query: str, client: QdrantClient, collection_name: str, llm, dense_model, sparse_model):
105
+ dense_query = list(dense_model.embed_query(query,32)
106
  sparse_query = list(sparse_model.embed(query, 32))
107
 
108
  search_results = search(
 
336
  breakpoint_threshold_type='standard_deviation'
337
  )
338
 
 
 
 
 
 
339
  _metadatas = metadatas or [{}] * len(texts)
340
  documents = []
341
  metadatas_docs = []
 
353
  joblib.Parallel(n_jobs=joblib.cpu_count(), verbose=1, require='sharedmem')(
354
  joblib.delayed(create_document)(text, i, _metadatas) for i, text in enumerate(texts))
355
 
356
+ dense_embeddings = dense_model.embed_documents(documents, 32)
357
  sparse_embeddings = list(sparse_model.embed(documents, 32))
358
 
359
  return documents, metadatas_docs, dense_embeddings, sparse_embeddings