Spaces:
Runtime error
Runtime error
thankrandomness
committed on
Commit
·
ef72046
1
Parent(s):
f8a90e7
lower the similarity threshold
Browse files
app.py
CHANGED
@@ -78,7 +78,7 @@ def upsert_data(dataset_split):
|
|
78 |
upsert_data(dataset['train'])
|
79 |
|
80 |
# Define retrieval function with similarity threshold
|
81 |
-
def retrieve_relevant_text(input_text, similarity_threshold=0.1): # Lower threshold to capture more results
|
82 |
input_embedding = embed_text([input_text])[0]
|
83 |
results = collection.query(
|
84 |
query_embeddings=[input_embedding],
|
@@ -103,7 +103,7 @@ def retrieve_relevant_text(input_text, similarity_threshold=0.1): # Lower thres
|
|
103 |
return output
|
104 |
|
105 |
# Evaluate retrieval efficiency on the validation/test set
|
106 |
-
def evaluate_efficiency(dataset_split, similarity_threshold=0
|
107 |
y_true = []
|
108 |
y_pred = []
|
109 |
total_similarity = 0
|
|
|
78 |
upsert_data(dataset['train'])
|
79 |
|
80 |
# Define retrieval function with similarity threshold
|
81 |
+
def retrieve_relevant_text(input_text, similarity_threshold=1.0): # Lower threshold to capture more results
|
82 |
input_embedding = embed_text([input_text])[0]
|
83 |
results = collection.query(
|
84 |
query_embeddings=[input_embedding],
|
|
|
103 |
return output
|
104 |
|
105 |
# Evaluate retrieval efficiency on the validation/test set
|
106 |
+
def evaluate_efficiency(dataset_split, similarity_threshold=1.0):
|
107 |
y_true = []
|
108 |
y_pred = []
|
109 |
total_similarity = 0
|