Spaces:
Sleeping
Sleeping
import gradio as gr | |
import polars as pl | |
# Load every parquet shard matched by the glob into a single polars DataFrame.
# NOTE: this runs at import time, so the module cannot be imported without
# access to the `hf://` dataset path.
data = pl.read_parquet("hf://datasets/polinaeterna/text_unnested/data/*.parquet")

# Smallest and largest values found in the "min" column; the UI sliders use
# these as their lower and upper bounds.
min_min = data["min"].min()
min_max = data["min"].max()
# Upper bound on the number of rows handed back to the UI table.
MAX_ROWS = 100


def filter(min_value: float, max_value: float):  # noqa: A001 - name kept for existing callers
    """Return the first rows of ``data`` whose "min" value is in the given range.

    Note: the function name shadows the builtin ``filter``; it is kept because
    the click handler in this file refers to it by that name.

    Args:
        min_value: Inclusive lower bound for the "min" column.
        max_value: Inclusive upper bound for the "min" column.

    Returns:
        A pandas DataFrame (via ``to_pandas()``) holding at most ``MAX_ROWS``
        matching rows, in their original order. The frame is empty when no row
        matches, which includes the case ``min_value > max_value``.
    """
    in_range = (pl.col("min") >= min_value) & (pl.col("min") <= max_value)
    # Truncate in polars first so that at most MAX_ROWS rows are converted to
    # pandas; head() already copes with frames shorter than the limit.
    return data.filter(in_range).head(MAX_ROWS).to_pandas()
# Build the UI: two sliders select an inclusive range over the "min" column,
# and the button runs `filter` and shows the result in the table.
with gr.Blocks() as demo:
    gr.Markdown("# π« Filter text datasets by string lengths distribution π«")
    # Both sliders share the data-derived bounds. Their initial values are the
    # bounds themselves (instead of a hard-coded 0) so they always start inside
    # the slider range and the default selection covers the whole range.
    min_value = gr.Slider(min_min, min_max, min_min, step=1, label="Min min value")
    max_value = gr.Slider(min_min, min_max, min_max, step=1, label="Max min value")
    btn = gr.Button("Get datasets ")
    datasets = gr.DataFrame()
    # On click, pass the two slider values to `filter` and render its return
    # value in the `datasets` table.
    btn.click(filter, inputs=[min_value, max_value], outputs=[datasets])

# Start the Gradio server with debug mode enabled.
demo.launch(debug=True)