# Traditional Credit Scoring Using Logistic Regression
#
# End-to-end scorecard example on the German credit data set bundled with
# scorecardpy: variable filtering -> train/test split -> WOE binning ->
# L1-regularised logistic regression -> KS/ROC evaluation -> scorecard
# points -> population stability index (PSI) between train and test.
import scorecardpy as sc
from sklearn.linear_model import LogisticRegression

# Name of the binary target column; every step below needs it.
TARGET = "creditability"

# data prepare ------
# load germancredit data
dat = sc.germancredit()

# filter variable via missing rate, iv, identical value rate
dt_s = sc.var_filter(dat, y=TARGET)

# breaking dt into train and test
train, test = sc.split_df(dt_s, TARGET).values()

# woe binning ------
# Automatic binning. `bins` is only consumed by the optional inspection /
# interactive-adjustment steps shown in the comments below.
# NOTE(review): the bins are fitted on the full filtered data set (dt_s),
# not on the training split only, so the test rows influence the binning.
bins = sc.woebin(dt_s, y=TARGET)
# Optional: plot the automatic bins.
#   sc.woebin_plot(bins)

# binning adjustment
# Optional: adjust the breaks interactively instead of specifying them by hand.
#   breaks_adj = sc.woebin_adj(dt_s, TARGET, bins)
# Manually specified breaks. In the categorical entry, "%,%" appears to be
# scorecardpy's separator for merging several levels into a single bin --
# confirm against the scorecardpy documentation.
breaks_adj = {
    'age.in.years': [26, 35, 40],
    'other.debtors.or.guarantors': ["none", "co-applicant%,%guarantor"],
}
bins_adj = sc.woebin(dt_s, y=TARGET, breaks_list=breaks_adj)

# converting train and test into woe values
train_woe = sc.woebin_ply(train, bins_adj)
test_woe = sc.woebin_ply(test, bins_adj)

# Split each WOE frame into target vector and feature matrix.
y_train = train_woe.loc[:, TARGET]
X_train = train_woe.loc[:, train_woe.columns != TARGET]
y_test = test_woe.loc[:, TARGET]
# Select the test features by the training feature names rather than by a
# boolean mask computed on train_woe: this guarantees the test matrix has
# exactly the columns (and column order) the model is fitted on, and raises
# a KeyError if the test frame is missing one of them.
X_test = test_woe.loc[:, X_train.columns]

# logistic regression ------
# NOTE: 'saga' is a stochastic solver and no random_state is set, so the
# fitted coefficients may differ slightly from run to run.
lr = LogisticRegression(penalty='l1', C=0.9, solver='saga', n_jobs=-1)
lr.fit(X_train, y_train)
# Fitted parameters can be inspected via lr.coef_ and lr.intercept_.

# predicted probability (column 1 of predict_proba)
train_pred = lr.predict_proba(X_train)[:, 1]
test_pred = lr.predict_proba(X_test)[:, 1]

# performance ks & roc ------
train_perf = sc.perf_eva(y_train, train_pred, title="train")
test_perf = sc.perf_eva(y_test, test_pred, title="test")

# score ------
# Build the scorecard from the adjusted bins and the fitted model.
card = sc.scorecard(bins_adj, lr, X_train.columns)
# credit score (computed from the raw, un-WOE'd train/test frames)
train_score = sc.scorecard_ply(train, card, print_step=0)
test_score = sc.scorecard_ply(test, card, print_step=0)

# psi
sc.perf_psi(
    score={'train': train_score, 'test': test_score},
    label={'train': y_train, 'test': y_test},
)

猜你喜欢

学习SQL语句(强大的groupby与selectfrom模式)
[NetWork] 路由聚合与CIDR
photoshop 2021 直装版,PS2021mac版
如何在Linux下进行Lua调试（linux调试lua）
优化Oracle减少关联查询的编程实践（oracle减少关联查询）
Java实现Sybase数据库连接详解编程语言
构建基于Redis的可靠镜像（构建redis镜像）
微软Office 2019 批量授权版
为什么Foxmail接收不了邮件？
Vlan的概念以及配置

相关主题

Ubuntu系统安装
安装Python
Mac 上安装maven
PHP5安装方法
go 安装方法
oracle-rac安装
安装zookeeper
安装Anaconda
PostgreSQL安装使用
python安装，pycharm安装
python安装、pycharm安装
Pycharm下载与安装教程
ubuntu安装gcc
Linux SVN安装
插件安装方法
60安装方法
Redis安装部署
ubuntu mysql 安装
安装IIS
Mac M1 安装 Redis

zl程序教程

当前栏目

Py之scorecardpy：scorecardpy的简介、安装、使用方法之详细攻略

scorecardpy的简介

scorecardpy的安装

scorecardpy的使用方法

1、基础案例

相关文章