Spaces:

capradeepgujaran
/

ChatWithDocuments

Running

capradeepgujaran committed 5 days ago

Commit

3303167

•

1 Parent(s): ea34aa6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -128,17 +128,19 @@ def process_upload(api_key, files):
         return f"No valid documents were indexed. Errors: {'; '.join(error_messages)}", None
 def calculate_similarity(response, ground_truth):
     response_embedding = sentence_model.encode(response, convert_to_tensor=True)
     truth_embedding = sentence_model.encode(ground_truth, convert_to_tensor=True)
-    # Normalize the embeddings
-    response_embedding = response_embedding / np.linalg.norm(response_embedding)
-    truth_embedding = truth_embedding / np.linalg.norm(truth_embedding)
     # Calculate cosine similarity using sklearn's cosine_similarity function
     similarity = cosine_similarity(response_embedding.reshape(1, -1), truth_embedding.reshape(1, -1))[0][0]
     return similarity * 100  # Convert to percentage
 def query_app(query, model_name, use_similarity_check, openai_api_key):
     global vector_index, query_log

         return f"No valid documents were indexed. Errors: {'; '.join(error_messages)}", None
 def calculate_similarity(response, ground_truth):
+    # Encode the response and ground truth
     response_embedding = sentence_model.encode(response, convert_to_tensor=True)
     truth_embedding = sentence_model.encode(ground_truth, convert_to_tensor=True)
+    # Explicitly normalize the embeddings (should result in unit vectors)
+    response_embedding = response_embedding / response_embedding.norm(p=2)
+    truth_embedding = truth_embedding / truth_embedding.norm(p=2)
     # Calculate cosine similarity using sklearn's cosine_similarity function
     similarity = cosine_similarity(response_embedding.reshape(1, -1), truth_embedding.reshape(1, -1))[0][0]
     return similarity * 100  # Convert to percentage
 def query_app(query, model_name, use_similarity_check, openai_api_key):
     global vector_index, query_log