File size: 1,252 Bytes
3d745f2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
from strive.reranker import Reranker, EmbeddingType, deduplicate_results
import gradio as gr

def rerank_and_deduplicate(query, corpus_text):
    corpus = [line.strip() for line in corpus_text.split("\n") if line.strip()]
    textual_reranker = Reranker(embedding_type=EmbeddingType.textual)
    semantic_reranker = Reranker(embedding_type=EmbeddingType.semantic)
    
    textual_results = textual_reranker.rerank_documents(query, corpus, top_k=len(corpus))
    semantic_results = semantic_reranker.rerank_documents(query, corpus, top_k=len(corpus))
    
    merged_results = textual_results + semantic_results
    deduplicated_results = deduplicate_results(merged_results, top_k=50)
    
    return "\n".join([f"{text} (Score: {score:.4f})" for text, score in deduplicated_results])

app = gr.Interface(
    fn=rerank_and_deduplicate,
    inputs=[
        gr.Textbox(label="Query", placeholder="Enter your query here"),
        gr.Textbox(label="Corpus", placeholder="Enter one sentence per line", lines=10)
    ],
    outputs=gr.Textbox(label="Top Ranked Results"),
    title="STRIVE: Semantic Tokenized Ranking via Vectorization & Embeddings",
    description="Enter a query and multiple sentences to test the reranking algorithm."
)

app.launch()