File size: 1,757 Bytes
3f6f474 cf575f8 3f6f474 cf575f8 3f6f474 cf575f8 3f6f474 cf575f8 3f6f474 cf575f8 3f6f474 cf575f8 3f6f474 cf575f8 3f6f474 cf575f8 3f6f474 cf575f8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 |
from io import StringIO
from typing import Optional
import gradio as gr
import pandas as pd
from utils.similarity import batch_cos_sim
def read_data(filepath: str) -> Optional[pd.DataFrame]:
if filepath.endswith('.xlsx'):
df = pd.read_csv(filepath)
elif filepath.endswith('.csv'):
df = pd.read_csv(filepath)
else:
raise Exception('File type not supported')
return df
def process(model_name: str,
text: str,
file=None,
):
if file:
df = read_data(file.name)
elif text:
string_io = StringIO(text)
df = pd.read_csv(string_io)
else:
raise Exception('No input provided')
df = batch_cos_sim(df, model_name)
path = 'output.csv'
df.to_csv(path, index=False, encoding='utf-8-sig')
return str(df), path
model_name_input = gr.components.Textbox(
value='paraphrase-multilingual-MiniLM-L12-v2',
lines=1,
type='text'
)
model_name_option = gr.components.Dropdown(
label='Model Name',
value='paraphrase-multilingual-MiniLM-L12-v2',
choices=[
'paraphrase-multilingual-MiniLM-L12-v2',
'paraphrase-multilingual-mpnet-base-v2',
'cyclone/simcse-chinese-roberta-wwm-ext'
]
)
text_input = gr.components.Textbox(
value='prompt,response\n',
lines=10,
type='text'
)
text_output = gr.components.Textbox(
label='Output',
type='text'
)
file_output = gr.components.File(label='Output File',
file_count='single',
file_types=['', '.', '.csv', '.xls', '.xlsx'])
app = gr.Interface(
fn=process,
inputs=[model_name_option, text_input, 'file'],
outputs=[text_output, file_output]
)
app.launch()
|