Update app.py
Browse files
app.py
CHANGED
@@ -13,8 +13,7 @@ from llama_cpp import Llama
|
|
13 |
from scipy.sparse import csr_matrix, save_npz, load_npz, vstack
|
14 |
from qdrant_client import QdrantClient, models
|
15 |
from langchain_community.document_loaders import WikipediaLoader, WebBaseLoader
|
16 |
-
from
|
17 |
-
from semantic_router.encoders.huggingface import HuggingFaceEncoder
|
18 |
from fastembed.sparse.splade_pp import supported_splade_models
|
19 |
from fastembed import SparseTextEmbedding, SparseEmbedding
|
20 |
from unstructured.partition.auto import partition
|
@@ -103,7 +102,7 @@ def transform_query(query: str) -> str:
|
|
103 |
return f'Represent this sentence for searching relevant passages: {query}'
|
104 |
|
105 |
def main(query: str, client: QdrantClient, collection_name: str, llm, dense_model, sparse_model):
|
106 |
-
dense_query = list(dense_model(
|
107 |
sparse_query = list(sparse_model.embed(query, 32))
|
108 |
|
109 |
search_results = search(
|
@@ -337,11 +336,6 @@ def chunk_documents(texts, metadatas, dense_model, sparse_model):
|
|
337 |
breakpoint_threshold_type='standard_deviation'
|
338 |
)
|
339 |
|
340 |
-
|
341 |
-
|
342 |
-
|
343 |
-
|
344 |
-
|
345 |
_metadatas = metadatas or [{}] * len(texts)
|
346 |
documents = []
|
347 |
metadatas_docs = []
|
@@ -359,7 +353,7 @@ def chunk_documents(texts, metadatas, dense_model, sparse_model):
|
|
359 |
joblib.Parallel(n_jobs=joblib.cpu_count(), verbose=1, require='sharedmem')(
|
360 |
joblib.delayed(create_document)(text, i, _metadatas) for i, text in enumerate(texts))
|
361 |
|
362 |
-
dense_embeddings = dense_model.
|
363 |
sparse_embeddings = list(sparse_model.embed(documents, 32))
|
364 |
|
365 |
return documents, metadatas_docs, dense_embeddings, sparse_embeddings
|
|
|
13 |
from scipy.sparse import csr_matrix, save_npz, load_npz, vstack
|
14 |
from qdrant_client import QdrantClient, models
|
15 |
from langchain_community.document_loaders import WikipediaLoader, WebBaseLoader
|
16 |
+
from fastembed_ext import FastEmbedEmbeddingsLc
|
|
|
17 |
from fastembed.sparse.splade_pp import supported_splade_models
|
18 |
from fastembed import SparseTextEmbedding, SparseEmbedding
|
19 |
from unstructured.partition.auto import partition
|
|
|
102 |
return f'Represent this sentence for searching relevant passages: {query}'
|
103 |
|
104 |
def main(query: str, client: QdrantClient, collection_name: str, llm, dense_model, sparse_model):
|
105 |
+
dense_query = list(dense_model.embed_query(query,32))
|
106 |
sparse_query = list(sparse_model.embed(query, 32))
|
107 |
|
108 |
search_results = search(
|
|
|
336 |
breakpoint_threshold_type='standard_deviation'
|
337 |
)
|
338 |
|
|
|
|
|
|
|
|
|
|
|
339 |
_metadatas = metadatas or [{}] * len(texts)
|
340 |
documents = []
|
341 |
metadatas_docs = []
|
|
|
353 |
joblib.Parallel(n_jobs=joblib.cpu_count(), verbose=1, require='sharedmem')(
|
354 |
joblib.delayed(create_document)(text, i, _metadatas) for i, text in enumerate(texts))
|
355 |
|
356 |
+
dense_embeddings = dense_model.embed_documents(documents, 32)
|
357 |
sparse_embeddings = list(sparse_model.embed(documents, 32))
|
358 |
|
359 |
return documents, metadatas_docs, dense_embeddings, sparse_embeddings
|