Spaces:

curtpond
/

mle10-glg-demo

Sleeping

File size: 2,030 Bytes

925e416
 
 
cbd3f4c
0f34ca3
 
 
 
 
 
438fdb3
925e416
2aa7ddb
e84b099
2aa7ddb
438fdb3
e84b099
438fdb3
5a7c4c9
0f34ca3
438fdb3
0f34ca3
438fdb3
0f34ca3
 
 
 
 
 
 
 
e84b099
 
0f34ca3
e84b099
 
 
 
0f34ca3
4a02fcc
925e416
e84b099
 
 
 
0e46e88
e84b099
87806b7
2aa7ddb
e84b099
 
 
 
 
 
 
925e416
 
733f064
7862c87
 
 
f7170b6
925e416
c71ee2b
 
733f064
925e416

# Imports
import gradio as gr
from sklearn.linear_model import LogisticRegression
import pickle5 as pickle
import re
import string
import nltk
from nltk.corpus import stopwords
nltk.download('stopwords')
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.feature_extraction.text import TfidfVectorizer

# file name
#lr_filename = 'lr_021223.pkl'

# Load model from pickle file
# model = pickle.load(open(lr_filename, 'rb'))


# Process input text, including removing stopwords, converting to lowercase, and removing punctuation
stop = stopwords.words('english')
def process_text(text):
    text = [word for word in text.split() if word not in stop]
    text = str(text).lower()
    text = re.sub(
        f"[{re.escape(string.punctuation)}]", " ", text
    )
    text = " ".join(text.split())
    return text

# Vectorize input text
vec = CountVectorizer()
'''
def vectorize_text(text):
    #text = process_text(text)
    #text = vectorizer.fit_transform([text])
    #return text
'''

# Valid input for the model so number of features match
def predict(text):
    # Load the pickled model
    filename = 'lr_021223.pkl'
    loaded_model = pickle.load(open(filename, 'rb'))
    text = vec.transform([text])
    text = process_text(text)
    prediction = loaded_model.predict(text)
    return prediction

'''
Prediction function
#def predict(text):
    #text = vectorize_text(text)
    #prediction = model.predict(text)
    #return prediction
'''

# Define interface
demo = gr.Interface(fn=predict,
                        title="Text Classification Demo",
                        description="This is a demo of a text classification model using Logistic Regression.",
                        inputs=gr.Textbox(lines=10, placeholder='Input text here...', label="Input Text"),
                        outputs=gr.Textbox(label="Predicted Label: Other: 0, Healthcare: 1, Technology: 2", lines=2, placeholder='Predicted label will appear here...'),
                        allow_flagging='never'
)

demo.launch()