my-vignette
library(autoScorecard)
#Quick Modeling
##step 1: Import Data
accepts <- read.csv(system.file("extdata", "accepts.csv", package = "autoScorecard" ))
##step 2: Create scorecard
##Considering efficiency and readability, many parameters of this automatic modeling function
##are default, which requires high-precision modeling and needs to be manually established step by step
auto_scorecard1 <- auto_scorecard( feature = accepts[1:2000,], key_var= "application_id",
y_var = "bad_ind",sample_rate = 0.7, points0 = 600, odds0=1/20, pdo = 50,
max_depth =3,tree_p = 0.1, missing_rate = 0, single_var_rate = 1, iv_set=0.02,
char_to_number = TRUE , na.omit = TRUE)
#> Start: AIC=873.27
#> bad_ind ~ application_id + vehicle_year + vehicle_make + tot_derog +
#> tot_tr + age_oldest_tr + tot_open_tr + tot_rev_tr + tot_rev_debt +
#> tot_rev_line + rev_util + fico_score + purch_price + msrp +
#> down_pyt + loan_term + loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - application_id 1 831.27 871.27
#> - purch_price 1 831.40 871.40
#> - msrp 1 832.05 872.05
#> - tot_tr 1 832.12 872.12
#> - tot_open_tr 1 832.40 872.40
#> - vehicle_year 1 832.95 872.95
#> - tot_rev_line 1 833.09 873.09
#> <none> 831.27 873.27
#> - tot_income 1 833.94 873.94
#> - vehicle_make 1 834.31 874.31
#> - down_pyt 1 834.90 874.90
#> - loan_term 1 835.25 875.25
#> - tot_rev_tr 1 836.28 876.28
#> - veh_mileage 1 836.68 876.68
#> - loan_amt 1 836.72 876.72
#> - age_oldest_tr 1 837.63 877.63
#> - tot_derog 1 838.33 878.33
#> - tot_rev_debt 1 839.33 879.33
#> - rev_util 1 844.21 884.21
#> - ltv 1 848.13 888.13
#> - fico_score 1 853.94 893.94
#>
#> Step: AIC=871.27
#> bad_ind ~ vehicle_year + vehicle_make + tot_derog + tot_tr +
#> age_oldest_tr + tot_open_tr + tot_rev_tr + tot_rev_debt +
#> tot_rev_line + rev_util + fico_score + purch_price + msrp +
#> down_pyt + loan_term + loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - purch_price 1 831.40 869.40
#> - msrp 1 832.05 870.05
#> - tot_tr 1 832.12 870.12
#> - tot_open_tr 1 832.40 870.40
#> - vehicle_year 1 832.95 870.95
#> - tot_rev_line 1 833.09 871.09
#> <none> 831.27 871.27
#> - tot_income 1 833.94 871.94
#> - vehicle_make 1 834.31 872.31
#> - down_pyt 1 834.90 872.90
#> - loan_term 1 835.25 873.25
#> + application_id 1 831.27 873.27
#> - tot_rev_tr 1 836.29 874.29
#> - veh_mileage 1 836.68 874.68
#> - loan_amt 1 836.72 874.72
#> - age_oldest_tr 1 837.63 875.63
#> - tot_derog 1 838.33 876.33
#> - tot_rev_debt 1 839.34 877.34
#> - rev_util 1 844.23 882.23
#> - ltv 1 848.17 886.17
#> - fico_score 1 853.98 891.98
#>
#> Step: AIC=869.4
#> bad_ind ~ vehicle_year + vehicle_make + tot_derog + tot_tr +
#> age_oldest_tr + tot_open_tr + tot_rev_tr + tot_rev_debt +
#> tot_rev_line + rev_util + fico_score + msrp + down_pyt +
#> loan_term + loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - tot_tr 1 832.30 868.30
#> - tot_open_tr 1 832.56 868.56
#> - msrp 1 832.67 868.67
#> - vehicle_year 1 833.01 869.01
#> - tot_rev_line 1 833.23 869.23
#> <none> 831.40 869.40
#> - tot_income 1 834.19 870.19
#> - vehicle_make 1 834.44 870.44
#> - down_pyt 1 835.01 871.01
#> + purch_price 1 831.27 871.27
#> + application_id 1 831.40 871.40
#> - loan_term 1 835.48 871.48
#> - tot_rev_tr 1 836.36 872.36
#> - veh_mileage 1 836.91 872.91
#> - age_oldest_tr 1 837.75 873.75
#> - tot_derog 1 838.40 874.40
#> - loan_amt 1 838.49 874.49
#> - tot_rev_debt 1 839.57 875.57
#> - rev_util 1 844.38 880.38
#> - ltv 1 848.45 884.45
#> - fico_score 1 854.27 890.27
#>
#> Step: AIC=868.3
#> bad_ind ~ vehicle_year + vehicle_make + tot_derog + age_oldest_tr +
#> tot_open_tr + tot_rev_tr + tot_rev_debt + tot_rev_line +
#> rev_util + fico_score + msrp + down_pyt + loan_term + loan_amt +
#> ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - tot_open_tr 1 833.16 867.16
#> - msrp 1 833.62 867.62
#> - vehicle_year 1 833.94 867.94
#> <none> 832.30 868.30
#> - vehicle_make 1 835.20 869.20
#> + tot_tr 1 831.40 869.40
#> - tot_income 1 835.52 869.52
#> - tot_rev_line 1 835.68 869.68
#> - down_pyt 1 835.93 869.93
#> + purch_price 1 832.12 870.12
#> + application_id 1 832.30 870.30
#> - loan_term 1 836.40 870.40
#> - tot_rev_tr 1 837.03 871.03
#> - veh_mileage 1 837.89 871.89
#> - tot_derog 1 838.45 872.45
#> - loan_amt 1 839.30 873.30
#> - age_oldest_tr 1 840.67 874.67
#> - tot_rev_debt 1 840.80 874.80
#> - rev_util 1 845.37 879.37
#> - ltv 1 849.58 883.58
#> - fico_score 1 854.62 888.62
#>
#> Step: AIC=867.16
#> bad_ind ~ vehicle_year + vehicle_make + tot_derog + age_oldest_tr +
#> tot_rev_tr + tot_rev_debt + tot_rev_line + rev_util + fico_score +
#> msrp + down_pyt + loan_term + loan_amt + ltv + tot_income +
#> veh_mileage
#>
#> Df Deviance AIC
#> - msrp 1 834.49 866.49
#> - vehicle_year 1 835.01 867.01
#> <none> 833.16 867.16
#> - tot_income 1 836.11 868.11
#> - vehicle_make 1 836.14 868.14
#> - tot_rev_line 1 836.20 868.20
#> + tot_open_tr 1 832.30 868.30
#> + tot_tr 1 832.56 868.56
#> - down_pyt 1 836.77 868.77
#> + purch_price 1 832.96 868.96
#> - tot_rev_tr 1 837.03 869.03
#> + application_id 1 833.16 869.16
#> - loan_term 1 837.25 869.25
#> - veh_mileage 1 838.82 870.82
#> - tot_derog 1 839.20 871.20
#> - loan_amt 1 839.94 871.94
#> - tot_rev_debt 1 841.17 873.17
#> - age_oldest_tr 1 841.29 873.29
#> - rev_util 1 847.28 879.28
#> - ltv 1 850.90 882.90
#> - fico_score 1 855.29 887.29
#>
#> Step: AIC=866.49
#> bad_ind ~ vehicle_year + vehicle_make + tot_derog + age_oldest_tr +
#> tot_rev_tr + tot_rev_debt + tot_rev_line + rev_util + fico_score +
#> down_pyt + loan_term + loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - vehicle_year 1 835.55 865.55
#> <none> 834.49 866.49
#> + msrp 1 833.16 867.16
#> + tot_open_tr 1 833.62 867.62
#> - vehicle_make 1 837.66 867.66
#> - tot_rev_line 1 837.67 867.67
#> - tot_income 1 837.68 867.68
#> + purch_price 1 833.71 867.71
#> + tot_tr 1 833.85 867.85
#> - tot_rev_tr 1 838.25 868.25
#> + application_id 1 834.49 868.49
#> - down_pyt 1 838.76 868.76
#> - loan_term 1 839.15 869.15
#> - veh_mileage 1 840.23 870.23
#> - tot_derog 1 840.24 870.24
#> - age_oldest_tr 1 842.58 872.58
#> - tot_rev_debt 1 842.89 872.89
#> - loan_amt 1 843.20 873.20
#> - rev_util 1 848.45 878.45
#> - ltv 1 851.91 881.91
#> - fico_score 1 857.15 887.15
#>
#> Step: AIC=865.55
#> bad_ind ~ vehicle_make + tot_derog + age_oldest_tr + tot_rev_tr +
#> tot_rev_debt + tot_rev_line + rev_util + fico_score + down_pyt +
#> loan_term + loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> <none> 835.55 865.55
#> + vehicle_year 1 834.49 866.49
#> + tot_open_tr 1 834.51 866.51
#> - vehicle_make 1 838.58 866.58
#> - tot_rev_line 1 838.60 866.60
#> - tot_income 1 838.75 866.75
#> + tot_tr 1 834.93 866.93
#> + msrp 1 835.01 867.01
#> + purch_price 1 835.15 867.15
#> - tot_rev_tr 1 839.49 867.49
#> + application_id 1 835.55 867.55
#> - down_pyt 1 839.62 867.62
#> - loan_term 1 840.07 868.07
#> - veh_mileage 1 840.39 868.39
#> - tot_derog 1 841.35 869.35
#> - loan_amt 1 843.51 871.51
#> - age_oldest_tr 1 843.60 871.60
#> - tot_rev_debt 1 843.94 871.94
#> - rev_util 1 849.68 877.68
#> - ltv 1 853.00 881.00
#> - fico_score 1 857.67 885.67
data:image/s3,"s3://crabby-images/e5856/e5856f195ddb00984fa044ceef4a2258f153dabe" alt=""
data:image/s3,"s3://crabby-images/d3488/d3488d9ab760b0cb285d1c2494a5d22254c6d0b2" alt=""
data:image/s3,"s3://crabby-images/5f98c/5f98c0325f4a7d5ce2ac9183e4d7b45488f0ba60" alt=""
data:image/s3,"s3://crabby-images/f9154/f9154497c9115079441a653ce34054ff07ade887" alt=""
data:image/s3,"s3://crabby-images/e7c26/e7c2615068980028031d9d67272ec8cbf1dff7da" alt=""
data:image/s3,"s3://crabby-images/fdaad/fdaadf51fd7077a22e24c1d0e6bc7febd1626c20" alt=""
data:image/s3,"s3://crabby-images/5b36b/5b36ba2915aef23e0f5f9695f284f8e5b170bed6" alt=""
#Step-by-Step Modeling
##step 1: Import Data
accepts <- read.csv(system.file("extdata", "accepts.csv", package = "autoScorecard" ))
##step 2: Data Description
data_detect1 <- data_detect( df = accepts, key_var = c("application_id","account_number") ,
y_var = "bad_ind" )
head(data_detect1)
#> variable class nrow missing_rate unique_count identical_rate min
#> 1 vehicle_year integer 5845 0.0001710864 21 0.356372968 0
#> 2 vehicle_make character 5845 0.0000000000 155 0.190248075 NA
#> 3 bankruptcy_ind character 5845 0.0000000000 3 0.886227545 NA
#> 4 tot_derog integer 5845 0.0364414029 30 0.488793841 0
#> 5 tot_tr integer 5845 0.0364414029 68 0.039349872 0
#> 6 age_oldest_tr integer 5845 0.0369546621 461 0.007869974 1
#> p25 p50 p75 max mean sd cv
#> 1 1997 1999 2000 9999 1901.793634 488.024392 0.2566127
#> 2 NA NA NA NA NA NA NA
#> 3 NA NA NA NA NA NA NA
#> 4 0 0 2 32 1.910156 3.274744 1.7143852
#> 5 9 16 24 77 17.084695 10.814056 0.6329675
#> 6 78 137 205 588 154.304317 99.940540 0.6476847
##step 3: Data Filtering
feature<- filter_var( df = accepts , key_var = c("application_id","account_number"), y_var = "bad_ind" ,
missing_rate = 0 , single_var_rate = 1 ,
iv_set = 0.02, char_to_number = TRUE , na.omit = TRUE )
##step 4: Select Training Sample
d = sort( sample( nrow( feature ), nrow( feature )*0.7))
train <- feature[d,]
test <- feature[-d,]
##step 5: Data Distribution Comparison
comparison_two_data( df1 = train , df2 = test ,key_var = c("application_id","account_number"), y_var="bad_ind")
data:image/s3,"s3://crabby-images/c9814/c9814ba4f7612fe49753a1e96334557af036a62e" alt=""
data:image/s3,"s3://crabby-images/f83b0/f83b0c1dcafcf2cee314167604515f2ad2e3614a" alt=""
data:image/s3,"s3://crabby-images/a329e/a329eb88608aa426e7060e4bcb37d5eb66eb13a3" alt=""
data:image/s3,"s3://crabby-images/8722b/8722b8d6e188892af887414da9ea263d1f6961f3" alt=""
data:image/s3,"s3://crabby-images/1b45c/1b45c8e769e0ac23cd1eee84e657daa6b2c548ca" alt=""
data:image/s3,"s3://crabby-images/48073/480731d6d7151cf21a99b68ddc24f1663dfb4c57" alt=""
data:image/s3,"s3://crabby-images/393d5/393d57093a01b9c58eaeb77ba4ae056fa9e973cc" alt=""
data:image/s3,"s3://crabby-images/86bdb/86bdbecc93d3788dfce9f34bdec293de1dc1debc" alt=""
data:image/s3,"s3://crabby-images/623bd/623bda6e87a611f10d65d5c6f984aec57fe2e0e9" alt=""
data:image/s3,"s3://crabby-images/28534/28534288d5764495ac952dee5a4bc430813d972c" alt=""
data:image/s3,"s3://crabby-images/403c5/403c50f70a578dfaac84b764e0aeccadffd67b94" alt=""
data:image/s3,"s3://crabby-images/c6488/c6488157a7308a03751fec8effc4f83e81d4442c" alt=""
data:image/s3,"s3://crabby-images/d0e16/d0e164aa1788a652ad54cced980422d09c528ff2" alt=""
data:image/s3,"s3://crabby-images/2bf11/2bf11f2ac78c9a49ac0b9567033c8592b7b6094a" alt=""
data:image/s3,"s3://crabby-images/00eb4/00eb4cbb03597f047fd2f72bcb336a51c7ba9c7b" alt=""
data:image/s3,"s3://crabby-images/d5e65/d5e659aa159457f49d3dda5adb131d2135c0fe85" alt=""
data:image/s3,"s3://crabby-images/765bf/765bf47473dc0e34e30758561dd5af37041fc528" alt=""
data:image/s3,"s3://crabby-images/268a9/268a9d8ecc08474c00536d822b292c7acb8fe4b3" alt=""
data:image/s3,"s3://crabby-images/93af6/93af620392924fd9a151902e2dff045dc1800a83" alt=""
data:image/s3,"s3://crabby-images/2f8e8/2f8e870d4088945c91fb17472767fa9446420e6c" alt=""
data:image/s3,"s3://crabby-images/fe4b4/fe4b42d499cac814e98d8abbabfe12aa60ec31fc" alt=""
data:image/s3,"s3://crabby-images/a42ae/a42aeb19af6171b5ce358698907b692ea6bae47b" alt=""
data:image/s3,"s3://crabby-images/21898/218980b37b7f38feb3c8cfb79fd4f0e253827ba1" alt=""
data:image/s3,"s3://crabby-images/84fdb/84fdbe0fb50329b227a45069f756cdee89238aa6" alt=""
data:image/s3,"s3://crabby-images/62ba3/62ba3a83786a505c62b2a203499e880f8f0f8ecc" alt=""
data:image/s3,"s3://crabby-images/3f533/3f533d6349fdd60c773376dde997a63e7ecc95f2" alt=""
data:image/s3,"s3://crabby-images/a4732/a4732a20a719a3cb95532d7e1fbe3ae685dba797" alt=""
data:image/s3,"s3://crabby-images/0eeae/0eeaec9d07673c711a24625b3b0c32049fd51636" alt=""
data:image/s3,"s3://crabby-images/b99cc/b99ccc10e5d2dd492fa49ca5504c689e532b70e0" alt=""
data:image/s3,"s3://crabby-images/53f7b/53f7bae5750191dcda33c3308c4333fe0449641c" alt=""
data:image/s3,"s3://crabby-images/7fc73/7fc73ea44a701f86b78fe7e1183a226d01ff3f87" alt=""
data:image/s3,"s3://crabby-images/5e4bc/5e4bc7018660199bd7b60475d646ad1561cba2a9" alt=""
data:image/s3,"s3://crabby-images/abde5/abde547239f4c60be01562e1c081733b6b25f46c" alt=""
data:image/s3,"s3://crabby-images/7a1d1/7a1d106f666cc814357f6a0340bf5dec105339ac" alt=""
data:image/s3,"s3://crabby-images/03e8f/03e8fb4cf7fdf2f2eb2f0f7eead2e03c820e0c5f" alt=""
data:image/s3,"s3://crabby-images/a0c3e/a0c3e0419bb39a0197a49d00d7a6ede2c37e7953" alt=""
data:image/s3,"s3://crabby-images/509b4/509b4c781700560591cc4e1a77c5a9c80eaadfe1" alt=""
data:image/s3,"s3://crabby-images/78635/78635ed68eca78a3bbee57201583a842f67bf0d0" alt=""
data:image/s3,"s3://crabby-images/4378e/4378e4fb5ebead936aa8b0337e4ad77aad43416f" alt=""
data:image/s3,"s3://crabby-images/5a202/5a2024d115a8bec1c078e01148d58e822f2e1ee7" alt=""
data:image/s3,"s3://crabby-images/5c534/5c53456ecb829ea7d6135462bad8ad2774a46364" alt=""
data:image/s3,"s3://crabby-images/0dd52/0dd52f3e62d4fac4c567c7fb8a15582ff91a7d9e" alt=""
data:image/s3,"s3://crabby-images/d8075/d8075c063c2c20d34f07236c56d112963a07a917" alt=""
data:image/s3,"s3://crabby-images/f13be/f13bea7e055988229ad75f5e235058cd088a3f27" alt=""
data:image/s3,"s3://crabby-images/5d6d9/5d6d9612aec1ce78c63cbb88c133eca35e2eed61" alt=""
data:image/s3,"s3://crabby-images/40a58/40a58830acc75ebe2dc721e228b3ed71a412f002" alt=""
data:image/s3,"s3://crabby-images/1e787/1e787c3ecdcaa2120698681abf06ff7a6ce448dd" alt=""
data:image/s3,"s3://crabby-images/e0b64/e0b64d5200d0e776c8e6f567cc49dc6eeadc0a99" alt=""
data:image/s3,"s3://crabby-images/30822/308226f1c96c2b9501ad6b2b173ab158c8a7c34a" alt=""
data:image/s3,"s3://crabby-images/ea6bd/ea6bdd308a292460e8a90dee3ebe16605202b4eb" alt=""
data:image/s3,"s3://crabby-images/35ca5/35ca5ccd8302042b9a115ee582f31bebe5453f93" alt=""
data:image/s3,"s3://crabby-images/f4a9e/f4a9eed7753533fe19266f33b107aea8f8681721" alt=""
data:image/s3,"s3://crabby-images/ebdd3/ebdd3d7176f314e63b0bd524979c24d12e0146b2" alt=""
data:image/s3,"s3://crabby-images/5357c/5357c83064e6ec3d2695595cde4639959b1928c5" alt=""
data:image/s3,"s3://crabby-images/2246f/2246f3f04e849f303f84774c2ab3b767ec103397" alt=""
data:image/s3,"s3://crabby-images/7423f/7423f5d2202312eaa37eea384f323e922b896031" alt=""
data:image/s3,"s3://crabby-images/b895f/b895f4f73dcfb9b29c3277f053e796629b7367cf" alt=""
data:image/s3,"s3://crabby-images/45b3b/45b3b92dc6850a797018728dba89df56cd2f7505" alt=""
data:image/s3,"s3://crabby-images/7c7d3/7c7d3740250fe78bc3adbd3dcf2e0e340292afff" alt=""
data:image/s3,"s3://crabby-images/14a10/14a107c2daa7d25566795f80189a03314a2a5ddb" alt=""
data:image/s3,"s3://crabby-images/f1035/f10355539485dc76910b96027ba3be321110c7ad" alt=""
data:image/s3,"s3://crabby-images/70c3d/70c3d9dd7ae1533fa6e0eba91071425ed2da531f" alt=""
data:image/s3,"s3://crabby-images/99920/99920040a070cf704c11c7623f564d5e8d55f631" alt=""
data:image/s3,"s3://crabby-images/449c1/449c1eb2588fa40c881b07fcbbddb33acb1d211d" alt=""
data:image/s3,"s3://crabby-images/7d584/7d58426b3563feb477c7652d1a5358341ebb6073" alt=""
data:image/s3,"s3://crabby-images/874bf/874bfea422e28ff5a77321b51a2b750f3171b314" alt=""
data:image/s3,"s3://crabby-images/5f05f/5f05f22df3cb9bf2e5a2f49c875a03657061673f" alt=""
data:image/s3,"s3://crabby-images/68c7f/68c7f49d17a77c1ff9f853c95ffdf3724e811df5" alt=""
data:image/s3,"s3://crabby-images/90901/90901f44fd01d40f7b92dcb63d7e9a1a631b2f0c" alt=""
data:image/s3,"s3://crabby-images/11af1/11af128ae294b0069d791fb6fb47efa4b656a502" alt=""
data:image/s3,"s3://crabby-images/fe336/fe3363d5f5934e9055783485972eac31cf0980b4" alt=""
data:image/s3,"s3://crabby-images/e34d3/e34d39e79ab5253dd5b55f65e4f7beea4eef1626" alt=""
data:image/s3,"s3://crabby-images/fc069/fc0694127bf50895823e4e5ed24bc64161c5865d" alt=""
data:image/s3,"s3://crabby-images/842b9/842b909188c0fbeef019b62f36de8f046be5ee80" alt=""
data:image/s3,"s3://crabby-images/58b03/58b03f6b072e45acb01592eeca933d0f7197b27e" alt=""
data:image/s3,"s3://crabby-images/5ea72/5ea72407af4aa410d12e540d8b695b1e5fd93764" alt=""
data:image/s3,"s3://crabby-images/de683/de683ec064ee64d69129ccbe680689af102ed2e5" alt=""
data:image/s3,"s3://crabby-images/a2d75/a2d7568818e8479a6643da7a2341bb6da85873b9" alt=""
data:image/s3,"s3://crabby-images/c386f/c386f3be2ba2c59090c92701f0988e23e287b4d8" alt=""
data:image/s3,"s3://crabby-images/245de/245deb613087814c4145ba335f6501bd5a8fd553" alt=""
data:image/s3,"s3://crabby-images/b7ceb/b7ceba00af2af8c578cebd6e64829b38fec47d69" alt=""
data:image/s3,"s3://crabby-images/0dc2d/0dc2dd9019bb0408a2fc45129e78913e3e7c96c1" alt=""
data:image/s3,"s3://crabby-images/c29ed/c29ed1f93900f31e2c94c28fb9434fc0111e7528" alt=""
data:image/s3,"s3://crabby-images/24ac8/24ac8b007dd4dfc20e6221522a55a09625304768" alt=""
data:image/s3,"s3://crabby-images/36b11/36b115e590d589498b7821999171d811449e4869" alt=""
data:image/s3,"s3://crabby-images/7a39b/7a39bda4af11b16e1bd018f4d13c26b6ba7d2c91" alt=""
data:image/s3,"s3://crabby-images/c53d7/c53d745ec88a545e6aa672e4664f583ab9ee349d" alt=""
data:image/s3,"s3://crabby-images/ce416/ce4169ef81157803c36060b4e7c44dbdc1c3ca9f" alt=""
data:image/s3,"s3://crabby-images/42087/42087b70183f6756ac72c4d15d9459ec0797b2dc" alt=""
data:image/s3,"s3://crabby-images/d2413/d2413ba2a057d3ae694894b5e376a09ed1627826" alt=""
data:image/s3,"s3://crabby-images/9f2a4/9f2a4261c12ed243ef48b41f77d35186afd2b94b" alt=""
data:image/s3,"s3://crabby-images/7d455/7d455570774f305d32332e39fcf397583bea8164" alt=""
data:image/s3,"s3://crabby-images/2a28a/2a28abf6de3d2b4b1ebfe23ff4c9c1756b04929c" alt=""
data:image/s3,"s3://crabby-images/eb50d/eb50ddb8774577a186987b7db34af4575af6f3dd" alt=""
data:image/s3,"s3://crabby-images/31d37/31d37874be371e4e92e8f7fde2bcb6cc39686451" alt=""
##step 6: Automatic binning of data
##Decision Tree Binning
treebins_train <- bins_tree(df= train, key_var= c("application_id","account_number"), y_var="bad_ind",
max_depth=3, p=0.1)
##Equal Frequency Binning
binning_eqfreq1 <- binning_eqfreq( df= train, feat= 'tot_derog', label = 'bad_ind', nbins = 3)
##Equal Width Binning
binning_eqwid1 <- binning_eqwid( df = train, feat = 'tot_derog', label = 'bad_ind', nbins = 3)
##The K-means Binning
binning_kmean1 <- binning_kmean( df = train, feat= 'loan_term', label = 'bad_ind', nbins = 3)
##Chi-Square Binning
bins_chim1 <- bins_chim( df = train[1:200,], key_var = "application_id", y_var = "bad_ind" , alpha=0.1 )
##Unsupervised Automatic Binning Function
f_1 <-bins_unsupervised( df = feature[1:200,] , id="application_id" , label="bad_ind" ,
methods = c("k_means", "equal_width","equal_freq") , bin_nums=5 )
##The Combination of Two Bins Produces the Best Binning Result
best1 <- best_iv( df=f_1 ,bin=c('bins') , method = c('method') ,variable= c( "variable" ) ,label_iv='miv' )
vs1 <- best_vs( df1 = treebins_train[,-c(3)], df2 = best1[,-c(1:2)] ,variable="variable" ,label_iv='miv' )
##step 7: Replace Feature Data by Binning Template
woe_train <- rep_woe( df= train ,key_var="application_id", y_var="bad_ind" , tool=treebins_train ,
var_label= "variable",col_woe='woe', lower='lower' ,upper ='upper' )
woe_test <- rep_woe( df= test ,key_var="application_id", y_var="bad_ind" , tool=treebins_train ,
var_label= "variable",col_woe='woe', lower='lower' ,upper ='upper' )
##step 8: Modeling
lg<-stats::glm(bad_ind~.,family=stats::binomial(link='logit'),data= woe_train)
lg_both<-stats::step(lg,direction = "both")
#> Start: AIC=2478.97
#> bad_ind ~ application_id + account_number + vehicle_year + vehicle_make +
#> tot_derog + tot_tr + age_oldest_tr + tot_open_tr + tot_rev_tr +
#> tot_rev_debt + tot_rev_line + rev_util + fico_score + purch_price +
#> msrp + down_pyt + loan_term + loan_amt + ltv + tot_income +
#> veh_mileage
#>
#> Df Deviance AIC
#> - account_number 1 2435.0 2477.0
#> - vehicle_make 1 2435.0 2477.0
#> - tot_rev_tr 1 2435.0 2477.0
#> - msrp 1 2435.3 2477.3
#> - tot_income 1 2436.3 2478.3
#> - application_id 1 2436.9 2478.9
#> <none> 2435.0 2479.0
#> - tot_tr 1 2437.0 2479.0
#> - age_oldest_tr 1 2437.4 2479.4
#> - tot_rev_debt 1 2437.6 2479.6
#> - tot_open_tr 1 2438.4 2480.4
#> - tot_rev_line 1 2438.5 2480.5
#> - loan_term 1 2438.6 2480.6
#> - purch_price 1 2439.1 2481.1
#> - loan_amt 1 2440.4 2482.4
#> - rev_util 1 2441.5 2483.5
#> - tot_derog 1 2442.1 2484.1
#> - vehicle_year 1 2442.4 2484.4
#> - down_pyt 1 2443.7 2485.7
#> - veh_mileage 1 2451.1 2493.1
#> - ltv 1 2475.7 2517.7
#> - fico_score 1 2513.7 2555.7
#>
#> Step: AIC=2476.98
#> bad_ind ~ application_id + vehicle_year + vehicle_make + tot_derog +
#> tot_tr + age_oldest_tr + tot_open_tr + tot_rev_tr + tot_rev_debt +
#> tot_rev_line + rev_util + fico_score + purch_price + msrp +
#> down_pyt + loan_term + loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - vehicle_make 1 2435.0 2475.0
#> - tot_rev_tr 1 2435.0 2475.0
#> - msrp 1 2435.3 2475.3
#> - tot_income 1 2436.3 2476.3
#> - application_id 1 2436.9 2476.9
#> <none> 2435.0 2477.0
#> - tot_tr 1 2437.0 2477.0
#> - age_oldest_tr 1 2437.4 2477.4
#> - tot_rev_debt 1 2437.6 2477.6
#> - tot_open_tr 1 2438.4 2478.4
#> - tot_rev_line 1 2438.6 2478.6
#> - loan_term 1 2438.7 2478.7
#> + account_number 1 2435.0 2479.0
#> - purch_price 1 2439.2 2479.2
#> - loan_amt 1 2440.5 2480.5
#> - rev_util 1 2441.6 2481.6
#> - tot_derog 1 2442.1 2482.1
#> - vehicle_year 1 2442.4 2482.4
#> - down_pyt 1 2443.7 2483.7
#> - veh_mileage 1 2451.1 2491.1
#> - ltv 1 2475.8 2515.8
#> - fico_score 1 2513.9 2553.9
#>
#> Step: AIC=2475
#> bad_ind ~ application_id + vehicle_year + tot_derog + tot_tr +
#> age_oldest_tr + tot_open_tr + tot_rev_tr + tot_rev_debt +
#> tot_rev_line + rev_util + fico_score + purch_price + msrp +
#> down_pyt + loan_term + loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - tot_rev_tr 1 2435.0 2473.0
#> - msrp 1 2435.3 2473.3
#> - tot_income 1 2436.3 2474.3
#> - application_id 1 2437.0 2475.0
#> <none> 2435.0 2475.0
#> - tot_tr 1 2437.0 2475.0
#> - age_oldest_tr 1 2437.4 2475.4
#> - tot_rev_debt 1 2437.6 2475.6
#> - tot_open_tr 1 2438.5 2476.5
#> - tot_rev_line 1 2438.6 2476.6
#> - loan_term 1 2438.7 2476.7
#> + vehicle_make 1 2435.0 2477.0
#> + account_number 1 2435.0 2477.0
#> - purch_price 1 2439.2 2477.2
#> - loan_amt 1 2440.5 2478.5
#> - rev_util 1 2441.6 2479.6
#> - tot_derog 1 2442.1 2480.1
#> - vehicle_year 1 2442.6 2480.6
#> - down_pyt 1 2443.7 2481.7
#> - veh_mileage 1 2451.2 2489.2
#> - ltv 1 2476.1 2514.1
#> - fico_score 1 2514.1 2552.1
#>
#> Step: AIC=2473.04
#> bad_ind ~ application_id + vehicle_year + tot_derog + tot_tr +
#> age_oldest_tr + tot_open_tr + tot_rev_debt + tot_rev_line +
#> rev_util + fico_score + purch_price + msrp + down_pyt + loan_term +
#> loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - msrp 1 2435.4 2471.4
#> - tot_income 1 2436.3 2472.3
#> - tot_tr 1 2437.0 2473.0
#> - application_id 1 2437.0 2473.0
#> <none> 2435.0 2473.0
#> - age_oldest_tr 1 2437.5 2473.5
#> - tot_rev_debt 1 2437.7 2473.7
#> - tot_open_tr 1 2438.6 2474.6
#> - tot_rev_line 1 2438.7 2474.7
#> - loan_term 1 2438.8 2474.8
#> + tot_rev_tr 1 2435.0 2475.0
#> + vehicle_make 1 2435.0 2475.0
#> + account_number 1 2435.0 2475.0
#> - purch_price 1 2439.2 2475.2
#> - loan_amt 1 2440.5 2476.5
#> - tot_derog 1 2442.1 2478.1
#> - rev_util 1 2442.4 2478.4
#> - vehicle_year 1 2442.6 2478.6
#> - down_pyt 1 2443.8 2479.8
#> - veh_mileage 1 2451.2 2487.2
#> - ltv 1 2476.2 2512.2
#> - fico_score 1 2515.8 2551.8
#>
#> Step: AIC=2471.39
#> bad_ind ~ application_id + vehicle_year + tot_derog + tot_tr +
#> age_oldest_tr + tot_open_tr + tot_rev_debt + tot_rev_line +
#> rev_util + fico_score + purch_price + down_pyt + loan_term +
#> loan_amt + ltv + tot_income + veh_mileage
#>
#> Df Deviance AIC
#> - tot_income 1 2436.6 2470.6
#> - tot_tr 1 2437.3 2471.3
#> - application_id 1 2437.4 2471.4
#> <none> 2435.4 2471.4
#> - age_oldest_tr 1 2437.8 2471.8
#> - tot_rev_debt 1 2438.0 2472.0
#> - tot_open_tr 1 2438.9 2472.9
#> - loan_term 1 2439.0 2473.0
#> + msrp 1 2435.0 2473.0
#> - tot_rev_line 1 2439.1 2473.1
#> - purch_price 1 2439.3 2473.3
#> + tot_rev_tr 1 2435.3 2473.3
#> + vehicle_make 1 2435.4 2473.4
#> + account_number 1 2435.4 2473.4
#> - loan_amt 1 2440.6 2474.6
#> - tot_derog 1 2442.5 2476.5
#> - rev_util 1 2442.7 2476.7
#> - vehicle_year 1 2443.3 2477.3
#> - down_pyt 1 2444.3 2478.3
#> - veh_mileage 1 2451.7 2485.7
#> - ltv 1 2476.2 2510.2
#> - fico_score 1 2515.9 2549.9
#>
#> Step: AIC=2470.6
#> bad_ind ~ application_id + vehicle_year + tot_derog + tot_tr +
#> age_oldest_tr + tot_open_tr + tot_rev_debt + tot_rev_line +
#> rev_util + fico_score + purch_price + down_pyt + loan_term +
#> loan_amt + ltv + veh_mileage
#>
#> Df Deviance AIC
#> <none> 2436.6 2470.6
#> - application_id 1 2438.7 2470.7
#> - tot_tr 1 2438.8 2470.8
#> - age_oldest_tr 1 2439.3 2471.3
#> - tot_rev_debt 1 2439.3 2471.3
#> + tot_income 1 2435.4 2471.4
#> - tot_open_tr 1 2440.2 2472.2
#> - loan_term 1 2440.3 2472.3
#> + msrp 1 2436.3 2472.3
#> + tot_rev_tr 1 2436.6 2472.6
#> + vehicle_make 1 2436.6 2472.6
#> + account_number 1 2436.6 2472.6
#> - tot_rev_line 1 2440.8 2472.8
#> - purch_price 1 2441.0 2473.0
#> - loan_amt 1 2441.6 2473.6
#> - tot_derog 1 2443.6 2475.6
#> - rev_util 1 2443.6 2475.6
#> - vehicle_year 1 2444.1 2476.1
#> - down_pyt 1 2445.6 2477.6
#> - veh_mileage 1 2452.8 2484.8
#> - ltv 1 2478.4 2510.4
#> - fico_score 1 2517.9 2549.9
logit<-stats::predict(lg_both,woe_test)
woe_test$lg_both_p<-exp(logit)/(1+exp(logit))
pred_both <- ROCR::prediction(woe_test$lg_both_p, woe_test$bad_ind)
perf_both <- ROCR::performance(pred_both,"tpr","fpr")
##step 9: Correlation Diagram
coe = (lg_both$coefficients)
cor1<-stats::cor( Xvar_df<- woe_train[-which(colnames(feature) %in% c("application_id","account_number","bad_ind"))])
corrplot::corrplot(cor1)
corrplot::corrplot(cor1,method = "number")
data:image/s3,"s3://crabby-images/2ce22/2ce2243754f24976f4047cfb09e9dbd8ab126f34" alt=""
##step 10: Manually Input Parameters to Generate Scorecards
##scorecard
Score<-noauto_scorecard( bins_card= woe_test, fit= lg_both,bins_woe=treebins_train ,points0 = 600,
odds0 = 1/20, pdo = 50 ,k = 2)
Score_2<-noauto_scorecard( bins_card= woe_train, fit= lg_both,bins_woe=treebins_train ,points0 = 600,
odds0 = 1/20, pdo = 50 ,k = 3)
##scorecard2
Score<-noauto_scorecard2( bins_card= woe_test, fit= lg_both,bins_woe=treebins_train ,points0 = 600,
odds0 = 1/20, pdo = 50 ,k = 2)
Score_2<-noauto_scorecard2( bins_card= woe_train, fit= lg_both,bins_woe=treebins_train ,points0 = 600,
odds0 = 1/20, pdo = 50 ,k = 3)
##step 11: PSI
data_train <- Score_2$data_score
data_test <- Score$data_score
psi_1<-psi_cal( df_train = data_train , df_test = data_test,feat='Score',label='bad_ind' , nbins=10)
data:image/s3,"s3://crabby-images/6ea95/6ea95579c7b3b2b06fbec05d81f39232ce6c2a9c" alt=""
##step 12: Data Painter
plot_board( label= woe_test$bad_ind, pred = woe_test$lg_both_p )
data:image/s3,"s3://crabby-images/eb530/eb530630b8f90793116daed0562b2445025cfdbe" alt=""
data:image/s3,"s3://crabby-images/37ec5/37ec59257ddd071f4d86a1409efd9993d2107ad7" alt=""