Spaces:

saifhmb
/

Credit-Card-Risk-Assessment-ML-App

Sleeping

Credit-Card-Risk-Assessment-ML-App / app.py

saifhmb

added indented block after 'with' statement on line 91 and subsequent lines

16e7cd6 unverified about 1 year ago

5.28 kB

	# importing libraries
	from datasets import load_dataset, load_dataset_builder
	import numpy as np
	import matplotlib.pyplot as plt
	import pandas as pd
	import sklearn
	from sklearn.compose import ColumnTransformer
	from sklearn.model_selection import train_test_split
	from sklearn.preprocessing import OneHotEncoder, LabelEncoder, StandardScaler
	from sklearn.linear_model import LogisticRegression
	from sklearn.metrics import confusion_matrix, ConfusionMatrixDisplay, accuracy_score, precision_score, recall_score, classification_report
	from transformers import Trainer, TrainingArguments
	from skops import hub_utils
	import pickle
	from skops.card import Card, metadata_from_config
	from pathlib import Path
	from tempfile import mkdtemp, mkstemp
	import streamlit as st
	from PIL import Image

	# Loading the dataset
	dataset_name = "saifhmb/CreditCardRisk"
	dataset = load_dataset(dataset_name, split = 'train')
	dataset = pd.DataFrame(dataset)
	X = dataset.iloc[:, :-1].values
	y = dataset.iloc[:, -1].values

	# Encoding the Independent Variables
	ct = ColumnTransformer(transformers = [('encoder', OneHotEncoder(), [2, 3, 6, 7])], remainder = 'passthrough')
	X = np.array(ct.fit_transform(X))

	# Encoding the Dependent Variable
	le = LabelEncoder()
	y = le.fit_transform(y)

	# Spliting the datset into Training and Test set
	X_train, X_test, y_train, y_test = train_test_split(X, y, test_size = 0.15, random_state = 0)

	# Feature Scaling
	sc = StandardScaler()
	X_train = sc.fit_transform(X_train)
	X_test = sc.transform(X_test)

	# Training Logit Reg Model using the Training set
	model = LogisticRegression()
	model.fit(X_train, y_train)

	# Predicting the Test result
	y_pred = model.predict(X_test)

	# Making the Confusion Matrix and evaluating performance
	cm = confusion_matrix(y_pred, y_test, labels=model.classes_)
	display_labels = np.array(['bad loss', 'bad profit', 'good risk'])
	disp = ConfusionMatrixDisplay(confusion_matrix=cm, display_labels=display_labels)
	disp.plot()
	plt.show()
	acc = accuracy_score(y_test, y_pred)
	ps = precision_score(y_test, y_pred, average ='micro')
	rs = recall_score(y_test, y_pred, average ='micro')

	# Pickling the model
	pickle_out = open("model.pkl", "wb")
	pickle.dump(model, pickle_out)
	pickle_out.close()

	# Loading the model to predict on the data
	pickle_in = open('model.pkl', 'rb')
	model = pickle.load(pickle_in)

	def welcome():
	return 'welcome all'

	# defining the function which will make the prediction using the data which the user inputs
	def prediction(AGE, INCOME, GENDER, MARITAL, NUMKIDS, NUMCARDS, HOWPAID, MORTGAGE, STORECAR, LOANS):
	prediction = model.predict(sc.transform([[AGE, INCOME, GENDER, MARITAL, NUMKIDS, NUMCARDS, HOWPAID, MORTGAGE, STORECAR, LOANS]]))
	print(prediction)
	return prediction

	# this is the main function in which we define our webpage
	def main():
	# giving the webpage a title
	st.title("Credit Card Risk Assessment ML App")
	st.header("Model Description", divider = "gray")
	multi = '''This is a logistic regression model trained on customers' credit card risk dataset in a bank using sklearn library.
	The model predicts whether a customer is worth issuing a credit card or not.
	For more details on the model please refer to the model card at https://huggingface.co/saifhmb/Credit-Card-Risk-Model
	'''
	st.markdown(multi)
	st.markdown("To determine whether a customer is worth issuing a credit card or not, please ENTER the AGE INCOME, GENDER, MARITAL, NUMKIDS, NUMCARDS, HOWPAID, MORTGAGE, STORECAR, and LOANS:")
	col1, col2, col3 = st.columns(3)
	with col1:
	AGE = st.number_input("AGE")
	with col2:
	INCOME = st.number_input("INCOME")
	with col3:
	GENDER = st.text_input("GENDER (Please enter 'm' for male and 'f' for female)")

	col4, col5, col6 = st.columns(3)
	with col4:
	MARITAL = st.text_input("MARITAL STATUS (Please enter one of the following options: 'single', 'married', or 'divsepwid')")
	with col5:
	NUMKIDS = st.number_input("Number of dependent children")
	with col6:
	NUMCARDS = st.number_input("Number of credit cards excluding store credit cards")

	col7, col8, col9 =st.columns(3)
	with col7:
	HOWPAID = st.text_input("How often is customer paid by employer (weekly or monthly)")
	with col8:
	MORTGAGE = st.text_input("Does customer have a mortgage? please enter 'y' for yes or 'n' for no")
	with col9:
	STORECAR = st.number_input("Number of store credit cards")

	LOANS = st.number_input("Number of outstanding loans")
	result = ""
	if st.button("Predict"):
	result = prediction(AGE, INCOME, GENDER, MARITAL, NUMKIDS, NUMCARDS, HOWPAID, MORTGAGE, STORECAR, LOANS)
	if result == 0:
	st.success("The output is {}".format(result) + " which falls under 'bad loss' and thus the customer is NOT worth issuing a credit card")
	if result == 1:
	st.success("The output is {}".format(result) + " which falls under 'bad profit' and thus the customer MAYBE worth issuing a credit card")
	if result == 2:
	st.success("The output is {}".format(result) + " which falls under 'good risk' and thus the customer worth issuing a credit card")

	if __name__=='__main__':
	main()