Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -16,10 +16,10 @@ def load_model():
|
|
| 16 |
|
| 17 |
# Cache corpus embedding generation
|
| 18 |
@st.cache_data
|
| 19 |
-
def generate_embeddings(_model,
|
| 20 |
# Prepare paper texts by combining query and answer fields
|
| 21 |
paper_texts = [
|
| 22 |
-
record['query'] + '[SEP]' + record['answer'] for record in
|
| 23 |
]
|
| 24 |
# Compute embeddings for all paper texts
|
| 25 |
return paper_texts, _model.encode(paper_texts, convert_to_tensor=True, show_progress_bar=True)
|
|
|
|
| 16 |
|
| 17 |
# Cache corpus embedding generation
|
| 18 |
@st.cache_data
def generate_embeddings(_model, _dataset_file, sample_size=32):
    """Build the combined query/answer texts and encode them with ``_model``.

    ``_model`` and ``_dataset_file`` carry a leading underscore so that
    ``st.cache_data`` skips hashing them; the cached result is therefore
    keyed on ``sample_size`` alone.

    Args:
        _model: Encoder exposing ``encode(texts, convert_to_tensor=...,
            show_progress_bar=...)`` (presumably the SentenceTransformer
            returned by ``load_model`` -- confirm against the caller).
        _dataset_file: Dataset supporting ``len()`` and ``select(indices)``
            whose records have ``'query'`` and ``'answer'`` fields
            (presumably a Hugging Face ``datasets.Dataset`` -- confirm).
        sample_size: Maximum number of leading records to embed.

    Returns:
        A ``(paper_texts, embeddings)`` tuple: the list of combined texts
        and whatever ``_model.encode`` returns for that list.
    """
    # Clamp to the number of available records so that asking for more rows
    # than the dataset holds does not hand out-of-range indices to select().
    row_count = min(sample_size, len(_dataset_file))
    sampled_records = _dataset_file.select(range(row_count))

    # Prepare paper texts by combining query and answer fields
    paper_texts = [
        record['query'] + '[SEP]' + record['answer']
        for record in sampled_records
    ]

    # Compute embeddings for all paper texts
    embeddings = _model.encode(
        paper_texts,
        convert_to_tensor=True,
        show_progress_bar=True,
    )
    return paper_texts, embeddings
|