import numpy as np
import pandas as pd
import matplotlib as plt
import seaborn as sns
# Exploratory pass over the loan-status CSV: load it, inspect columns and
# missing values, plot a few count distributions, and cross-tabulate two
# columns against `loan_status`.
#
# NOTE(review): the bare expressions below only display a result when run
# interactively (notebook / REPL); executed as a plain script their values
# are computed and discarded.

# --- Load ---------------------------------------------------------------
data_filepath = "/work/loan_status.csv"
data = pd.read_csv(data_filepath)

# --- First look at the frame --------------------------------------------
data.head(n=10)
data.columns

# Distinct values present in each of these columns.
data["grade"].unique()
data["sub_grade"].unique()
data["loan_status"].unique()
data["purpose"].unique()

# Per-column count of missing values, then summary statistics.
data.isna().sum()
data.describe()

# --- Distributions ------------------------------------------------------
# NOTE(review): no `ax` is passed, so each call draws on the current
# matplotlib Axes; outside a cell-per-plot notebook the three histograms
# would presumably land on the same Axes -- confirm how this file is run.
# NOTE(review): `plt` at the top of the file is bound to the `matplotlib`
# package itself, not `matplotlib.pyplot`, so `plt.figure()` / `plt.show()`
# would not be available through that alias.
sns.histplot(x=data["grade"])
sns.histplot(x=data["loan_status"])
sns.histplot(x=data["grade"], hue=data["loan_status"])

# Column dtypes and non-null counts (printed by `info` itself).
data.info()

# --- Cross-tabulations against loan_status ------------------------------
# Frequency tables without row/column totals (margins disabled).
data_crosstab1 = pd.crosstab(
    index=data["grade"],
    columns=data["loan_status"],
    margins=False,
)
data_crosstab1

data_crosstab2 = pd.crosstab(
    index=data["purpose"],
    columns=data["loan_status"],
    margins=False,
)
data_crosstab2