import gradio as gr
import joblib
import pandas as pd
import datasets
import json
import numpy as np
# Load the model
pipe = joblib.load("./model.pkl")
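# NOTE (assumption): model.pkl is expected to be a scikit-learn pipeline serialized
# with joblib, trained on the column set listed in config.json.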
title = "Premium Amount Prediction"
description = "This model predicts the Premium Amount. Drag and drop any slice from the dataset or edit values as you wish in the dataframe component below."
# Load and prepare dataset
df = datasets.load_dataset("silvaKenpachi/mental_health")["train"].to_pandas()
df.dropna(axis=0, inplace=True)
# Load configuration
with open("./config.json") as f:
    config_dict = json.load(f)
all_headers = config_dict["sklearn"]["columns"]
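# Expected config.json layout (an assumption for illustration):
# {"sklearn": {"columns": ["Name", "<feature_1>", "<feature_2>", "..."]}}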
# Filter headers to only include those present in the dataset
headers = [col for col in all_headers if col in df.columns]
# Earlier interface definitions, kept for reference (these returned only 2 rows in the output):
# inputs = [gr.Dataframe(headers=headers, row_count=(2, "dynamic"), col_count=(len(headers), "fixed"), label="Input Data", interactive=True)]
# inputs = [gr.Dataframe(headers=all_headers, row_count=(2, "dynamic"), col_count=(len(all_headers), "fixed"), label="Input Data", interactive=True)]
# outputs = [gr.Dataframe(row_count=(2, "dynamic"), col_count=(1, "fixed"), label="Predictions", headers=["Depression"])]
# Define input and output interfaces with dynamic row counts
inputs = [gr.Dataframe(
    headers=headers,
    row_count=(10, "dynamic"),  # tuple format: (min_rows, "dynamic")
    col_count=(len(headers), "fixed"),
    label="Input Data",
    interactive=True
)]
outputs = [gr.Dataframe(
    row_count=(10, "dynamic"),  # tuple format: (min_rows, "dynamic")
    col_count=(2, "fixed"),
    label="Predictions",
    headers=["Name", "Depression"]
)]
# Previous infer versions, kept for reference:
#
# def infer(inputs):
#     data = pd.DataFrame(inputs, columns=headers)
#     predictions = pipe.predict(data)
#     return pd.DataFrame(predictions, columns=["Depression"])
#
# Version that fixes missing columns:
# def infer(inputs):
#     data = pd.DataFrame(inputs, columns=headers)
#     # Add missing columns with default values (e.g., 0)
#     for col in all_headers:
#         if col not in data.columns:
#             data[col] = 0
#     # Ensure the order of columns matches the training data
#     data = data[all_headers]
#     predictions = pipe.predict(data)
#     return pd.DataFrame(predictions, columns=["Depression"])
#
# Version that also replaces empty strings, fills NaN, and casts to float:
# def infer(inputs):
#     data = pd.DataFrame(inputs, columns=headers)
#     # Replace empty strings with NaN
#     data = data.replace('', np.nan)
#     # Add missing columns with default values (e.g., 0)
#     for col in all_headers:
#         if col not in data.columns:
#             data[col] = 0
#     # Ensure the order of columns matches the training data
#     data = data[all_headers]
#     # Fill NaN values with default values (e.g., 0)
#     data = data.fillna(0)
#     # Convert all data to float
#     data = data.astype(float)
#     predictions = pipe.predict(data)
#     # return pd.DataFrame(predictions, columns=["Name", "Depression"])
#     return pd.DataFrame({
#         'Name': data['Name'],
#         'Depression': predictions
#     })
def infer(inputs):
    data = pd.DataFrame(inputs, columns=headers)
    # Replace empty strings with NaN
    data = data.replace('', np.nan)
    # Store the Name column
    names = data['Name'].copy()
    # Add missing columns with default values
    for col in all_headers:
        if col not in data.columns:
            data[col] = 0
    # Ensure the order of columns matches the training data
    data = data[all_headers]
    # Fill NaN values
    data = data.fillna(0)
    # Convert numeric columns to float, excluding 'Name'
    numeric_columns = [col for col in all_headers if col != 'Name']
    data[numeric_columns] = data[numeric_columns].astype(float)
    # Make predictions
    predictions = pipe.predict(data)
    # Create output DataFrame with original names and predictions
    return pd.DataFrame({
        'Name': names,
        'Depression': predictions
    })
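# Quick local sanity check (assumption: the Dataframe component passes a pandas
# DataFrame, so a slice of the dataset mirrors what the UI sends):
# sample = df[headers].head(3)
# print(infer(sample))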
gr.Interface(
    fn=infer,
    inputs=inputs,
    outputs=outputs,
    title=title,
    description=description,
    examples=[df[headers].head(3).values.tolist()],
    cache_examples=False
).launch(debug=True)