Spaces:
Running
Running
File size: 1,252 Bytes
3d745f2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 |
from strive.reranker import Reranker, EmbeddingType, deduplicate_results
import gradio as gr
def rerank_and_deduplicate(query, corpus_text):
corpus = [line.strip() for line in corpus_text.split("\n") if line.strip()]
textual_reranker = Reranker(embedding_type=EmbeddingType.textual)
semantic_reranker = Reranker(embedding_type=EmbeddingType.semantic)
textual_results = textual_reranker.rerank_documents(query, corpus, top_k=len(corpus))
semantic_results = semantic_reranker.rerank_documents(query, corpus, top_k=len(corpus))
merged_results = textual_results + semantic_results
deduplicated_results = deduplicate_results(merged_results, top_k=50)
return "\n".join([f"{text} (Score: {score:.4f})" for text, score in deduplicated_results])
app = gr.Interface(
fn=rerank_and_deduplicate,
inputs=[
gr.Textbox(label="Query", placeholder="Enter your query here"),
gr.Textbox(label="Corpus", placeholder="Enter one sentence per line", lines=10)
],
outputs=gr.Textbox(label="Top Ranked Results"),
title="STRIVE: Semantic Tokenized Ranking via Vectorization & Embeddings",
description="Enter a query and multiple sentences to test the reranking algorithm."
)
app.launch()
|