File size: 1,037 Bytes
eb5fab4
 
 
 
ada59c2
 
 
 
eb5fab4
 
 
9247534
 
046dab3
eb5fab4
 
 
d5c70ed
eb5fab4
ada59c2
eb5fab4
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
import functools

import gradio as gr
from chonky import ParagraphSplitter


@functools.lru_cache(maxsize=8)
def _load_splitter(model_id):
    """Return the ParagraphSplitter for ``model_id``, building it only once.

    Constructing a splitter presumably loads the model behind ``model_id``,
    so instances are memoized and reused across requests instead of being
    rebuilt on every click. The cache is bounded so the number of splitters
    kept alive at the same time stays capped.
    """
    return ParagraphSplitter(model_id=model_id)


def run(text, model_id):
    """Split ``text`` into chunks and render them as one Markdown string.

    Args:
        text: The input text to split. May be empty or ``None``.
        model_id: Model identifier forwarded to ``ParagraphSplitter``.

    Returns:
        The chunks produced by the splitter, separated by a Markdown
        horizontal rule (``---`` surrounded by blank lines). An empty
        string is returned for empty or missing input.
    """
    # Nothing to split: skip constructing a splitter altogether.
    if not text:
        return ""
    splitter = _load_splitter(model_id)
    return "\n\n---\n\n".join(splitter(text))

with gr.Blocks() as demo:
    # Page title plus the note about the input size limit of this Space.
    gr.Markdown(
        "# Semantic Chunking Demo\n"
        "  **Note**: This Space runs on CPU only, so input is limited to max. 50000 characters."
    )

    # Models offered in the dropdown; the first entry is the preselected one.
    model_choices = [
        "mamei16/chonky_distilbert-base-multilingual-cased",
        "mamei16/chonky_distilbert_base_uncased_1.1",
        "mamei16/chonky_mdistilbert-base-english-cased",
        "mirth/chonky_distilbert_base_uncased_1",
        "mirth/chonky_modernbert_base_1",
    ]
    model = gr.Dropdown(
        choices=model_choices,
        value=model_choices[0],
        label="Choose model",
    )
    button = gr.Button("Run", variant="primary")
    text = gr.Textbox(max_length=50000, label="Input Text")

    # Output area: a heading followed by the Markdown component that
    # receives the joined chunks.
    gr.Markdown("## Result chunks:")
    chunks = gr.Markdown("---")

    # Clicking the button feeds the text and the chosen model to run().
    button.click(fn=run, inputs=[text, model], outputs=chunks)


if __name__ == "__main__":
    # Script entry point: configure the request queue (max_size=20), then
    # start the app. queue() hands back the Blocks object, so the calls chain.
    demo.queue(max_size=20).launch()