Spaces:
Running
on
T4
Running
on
T4
Update app.py
Browse files
app.py
CHANGED
@@ -53,7 +53,7 @@ def transform_query(query: str) -> str:
|
|
53 |
return f'Represent this sentence for searching relevant passages: {query}'
|
54 |
|
55 |
def query_hybrid_search(query: str, client: QdrantClient, collection_name: str, dense_model: OptimumEncoder, sparse_model: SparseTextEmbedding):
|
56 |
-
dense_embeddings = dense_model([transform_query(query)], 1)[0]
|
57 |
sparse_embeddings = list(sparse_model.query_embed(query))[0]
|
58 |
|
59 |
return client.query_points(
|
@@ -281,7 +281,7 @@ def chunk_documents(texts: List[str], metadatas: List[dict], dense_model: Optimu
|
|
281 |
documents_and_metadatas = [(chunk.content, chunk.metadata) for sub_chunk in chunks for chunk in sub_chunk]
|
282 |
documents, metadatas_docs = [list(t) for t in zip(*documents_and_metadatas)]
|
283 |
|
284 |
-
dense_embeddings = dense_model(documents, 32)
|
285 |
sparse_embeddings = list(sparse_model.embed(documents, 32, 0))
|
286 |
|
287 |
return documents, metadatas_docs, dense_embeddings, sparse_embeddings
|
|
|
53 |
return f'Represent this sentence for searching relevant passages: {query}'
|
54 |
|
55 |
def query_hybrid_search(query: str, client: QdrantClient, collection_name: str, dense_model: OptimumEncoder, sparse_model: SparseTextEmbedding):
|
56 |
+
dense_embeddings = dense_model([transform_query(query)], 1, convert_to_numpy=True)[0]
|
57 |
sparse_embeddings = list(sparse_model.query_embed(query))[0]
|
58 |
|
59 |
return client.query_points(
|
|
|
281 |
documents_and_metadatas = [(chunk.content, chunk.metadata) for sub_chunk in chunks for chunk in sub_chunk]
|
282 |
documents, metadatas_docs = [list(t) for t in zip(*documents_and_metadatas)]
|
283 |
|
284 |
+
dense_embeddings = dense_model(documents, 32, convert_to_numpy=True)
|
285 |
sparse_embeddings = list(sparse_model.embed(documents, 32, 0))
|
286 |
|
287 |
return documents, metadatas_docs, dense_embeddings, sparse_embeddings
|