In [10]:
# Project directories. Both values end in "/" because the cells that use them
# build file names by plain string concatenation.
ModelsDir <- "/home/kate/Research/Property/Models/"
DataDir <- "/home/kate/Research/Property/Data/"

# NOTE(review): presumably toggles reuse of previously saved results; nothing
# in the visible part of this notebook reads it -- confirm it is still needed.
UseSavedIfExists <- FALSE
In [11]:
# Load shared helper functions from the personal utilities script.
# NOTE(review): NormalizedWeightedGini() is called later in this notebook but
# is not defined in it; presumably it comes from this file -- confirm.
source('/home/kate/code/Utils/MyFunctions.R')
In [12]:
# Training sample: CSV with a header row, read from DataDir.
training_data <- read.csv(
  file = paste0(DataDir, "property_wcf_training", ".csv"),
  header = TRUE
)
In [13]:
# Hold-out sample: CSV with a header row, read from DataDir.
testing_data <- read.csv(
  file = paste0(DataDir, "property_wcf_testing", ".csv"),
  header = TRUE
)

formulas <- list() formulas[[1]] <- cova_ic_nc_water ~ 1 formulas[[2]] <- cova_ic_nc_water ~ ecy formulas[[3]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit formulas[[4]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible formulas[[5]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft formulas[[6]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd formulas[[7]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk formulas[[8]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk formulas[[9]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk formulas[[10]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk formulas[[11]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk formulas[[12]] <- cova_ic_nc_water ~ log_cova_limit + cova_deductible + log_water_risk_3_blk formulas[[13]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + log_water_risk_3_blk formulas[[14]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + water_risk_3_blk formulas[[15]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk formulas[[16]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + cova_deductible + log_water_risk_3_blk formulas[[17]] <- cova_ic_nc_water ~ ecy + usagetype + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk formulas[[18]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk formulas[[19]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk

formulas[[20]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded formulas[[21]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + log_yearbuilt + log_sqft formulas[[22]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + log_yearbuilt + log_sqft + roofcd formulas[[23]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk formulas[[24]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + log_yearbuilt + log_sqft + log_water_risk_3_blk formulas[[25]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + log_yearbuilt + log_water_risk_3_blk formulas[[26]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + log_water_risk_3_blk formulas[[27]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + waterded + log_water_risk_3_blk formulas[[28]] <- cova_ic_nc_water ~ log_cova_limit + waterded + log_water_risk_3_blk formulas[[29]] <- cova_ic_nc_water ~ cova_limit + waterded + log_water_risk_3_blk formulas[[30]] <- cova_ic_nc_water ~ cova_limit + waterded + water_risk_3_blk formulas[[31]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk formulas[[32]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + waterded + log_water_risk_3_blk formulas[[33]] <- cova_ic_nc_water ~ ecy + usagetype + waterded + log_yearbuilt + log_sqft + log_water_risk_3_blk formulas[[34]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk formulas[[35]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + log_yearbuilt + log_water_risk_3_blk

formulas[[36]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + waterded formulas[[37]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + waterded formulas[[38]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + waterded formulas[[39]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk + waterded formulas[[40]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded formulas[[41]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterded formulas[[42]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterded formulas[[43]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterded formulas[[44]] <- cova_ic_nc_water ~ log_cova_limit + cova_deductible + log_water_risk_3_blk + waterded formulas[[45]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + log_water_risk_3_blk + waterded formulas[[46]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + water_risk_3_blk + waterded formulas[[47]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk + waterded formulas[[48]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + cova_deductible + log_water_risk_3_blk + waterded formulas[[49]] <- cova_ic_nc_water ~ ecy + usagetype + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded formulas[[50]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded formulas[[51]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterded

formulas[[52]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + waterded + waterdetectiondevice formulas[[53]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + waterded + waterdetectiondevice formulas[[54]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + waterded + waterdetectiondevice formulas[[55]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[56]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[57]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[58]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[59]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[60]] <- cova_ic_nc_water ~ log_cova_limit + cova_deductible + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[61]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[62]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + water_risk_3_blk + waterded + waterdetectiondevice formulas[[63]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[64]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + cova_deductible + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[65]] <- cova_ic_nc_water ~ ecy + usagetype + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + 
waterded + waterdetectiondevice formulas[[66]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[67]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterded + waterdetectiondevice

formulas[[52]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + waterdetectiondevice formulas[[53]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + waterdetectiondevice formulas[[54]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + waterdetectiondevice formulas[[55]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk + waterdetectiondevice formulas[[56]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterdetectiondevice formulas[[57]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterdetectiondevice formulas[[58]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice formulas[[59]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice formulas[[60]] <- cova_ic_nc_water ~ log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice formulas[[61]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice formulas[[62]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + water_risk_3_blk + waterdetectiondevice formulas[[63]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk + waterdetectiondevice formulas[[64]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice formulas[[65]] <- cova_ic_nc_water ~ ecy + usagetype + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterdetectiondevice formulas[[66]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + 
waterdetectiondevice formulas[[67]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterdetectiondevice

formulas[[68]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + waterdetectiondevice formulas[[69]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + waterded + waterdetectiondevice formulas[[70]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + roofcd + waterded + waterdetectiondevice formulas[[71]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[72]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[73]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[74]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[75]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[76]] <- cova_ic_nc_water ~ log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[77]] <- cova_ic_nc_water ~ cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[78]] <- cova_ic_nc_water ~ cova_limit + water_risk_3_blk + waterded + waterdetectiondevice formulas[[79]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[80]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[81]] <- cova_ic_nc_water ~ ecy + usagetype + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[82]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice formulas[[83]] <- 
cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_water_risk_3_blk + waterded + waterdetectiondevice

formulas[[84]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + waterdetectiondevice + sprinklersystem formulas[[85]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + waterdetectiondevice + sprinklersystem formulas[[86]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + waterdetectiondevice + sprinklersystem formulas[[87]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[88]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[89]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[90]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[91]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[92]] <- cova_ic_nc_water ~ log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[93]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[94]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[95]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[96]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[97]] <- cova_ic_nc_water 
~ ecy + usagetype + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[98]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem formulas[[99]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem

formulas[[100]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + waterdetectiondevice + sprinklersystem formulas[[101]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + waterded + waterdetectiondevice + sprinklersystem formulas[[102]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + roofcd + waterded + waterdetectiondevice + sprinklersystem formulas[[103]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[104]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[105]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[106]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[107]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[108]] <- cova_ic_nc_water ~ log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[109]] <- cova_ic_nc_water ~ cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[110]] <- cova_ic_nc_water ~ cova_limit + water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[111]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[112]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[113]] <- cova_ic_nc_water ~ ecy + usagetype + cova_deductible + log_yearbuilt + 
log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[114]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem formulas[[115]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem

formulas[[116]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + waterdetectiondevice + sprinklersystem + landlordind formulas[[117]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + waterdetectiondevice + sprinklersystem + landlordind formulas[[118]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + waterdetectiondevice + sprinklersystem + landlordind formulas[[119]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[120]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[121]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[122]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[123]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[124]] <- cova_ic_nc_water ~ log_cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[125]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[126]] <- cova_ic_nc_water ~ cova_limit + cova_deductible + water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[127]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind 
formulas[[128]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + cova_deductible + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[129]] <- cova_ic_nc_water ~ ecy + usagetype + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[130]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind formulas[[131]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + cova_deductible + log_yearbuilt + log_water_risk_3_blk + waterdetectiondevice + sprinklersystem + landlordind

formulas[[132]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[133]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[134]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + roofcd + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[135]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + roofcd + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[136]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[137]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[138]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[139]] <- cova_ic_nc_water ~ log_ecy + usagetype + log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[140]] <- cova_ic_nc_water ~ log_cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[141]] <- cova_ic_nc_water ~ cova_limit + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[142]] <- cova_ic_nc_water ~ cova_limit + water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[143]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit+ log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[144]] <- cova_ic_nc_water ~ ecy + usagetype + cova_limit + 
log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[145]] <- cova_ic_nc_water ~ ecy + usagetype + cova_deductible + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[146]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_sqft + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[147]] <- cova_ic_nc_water ~ ecy + usagetype + log_cova_limit + log_yearbuilt + log_water_risk_3_blk + waterded + waterdetectiondevice + sprinklersystem + landlordind formulas[[148]] <- cova_ic_nc_water ~ log_ecy + log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk

In [14]:
# Candidate model formulas for the response cova_ic_nc_water.
# Entry 1 is the baseline; entries 2-6 add different combinations of the
# indicator variables landlordind, poolind and multipolicyind to it.
formulas <- list(
  # 1: baseline
  cova_ic_nc_water ~ log_ecy + log_sqft + log_yearbuilt + roofcd +
    usagetype + cova_deductible + log_water_risk_3_blk,
  # 2: baseline + landlordind
  cova_ic_nc_water ~ landlordind + log_ecy + log_sqft + log_yearbuilt +
    roofcd + usagetype + cova_deductible + log_water_risk_3_blk,
  # 3: baseline + landlordind + poolind
  cova_ic_nc_water ~ landlordind + poolind + log_ecy + log_sqft +
    log_yearbuilt + roofcd + usagetype + cova_deductible +
    log_water_risk_3_blk,
  # 4: baseline + landlordind + poolind + multipolicyind
  cova_ic_nc_water ~ landlordind + poolind + multipolicyind + log_ecy +
    log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible +
    log_water_risk_3_blk,
  # 5: baseline + poolind + multipolicyind
  cova_ic_nc_water ~ poolind + multipolicyind + log_ecy + log_sqft +
    log_yearbuilt + roofcd + usagetype + cova_deductible +
    log_water_risk_3_blk,
  # 6: baseline + landlordind + multipolicyind
  cova_ic_nc_water ~ landlordind + multipolicyind + log_ecy + log_sqft +
    log_yearbuilt + roofcd + usagetype + cova_deductible +
    log_water_risk_3_blk
)
In [15]:
# Render every candidate formula as a single-line string for the results table.
#
# deparse() wraps long expressions over several lines and indents the
# continuation lines; pasting those pieces together verbatim leaves runs of
# spaces inside the text. Deparse at the widest allowed cutoff and collapse
# any remaining whitespace so each formula is stored with single spaces.
# The result stays a list with one string per formula, in the same order.
formulas_s <- lapply(formulas, function(candidate) {
  pieces <- deparse(candidate, width.cutoff = 500L)
  gsub("\\s+", " ", paste(pieces, collapse = " "))
})
In [16]:
# Fit one Poisson GLM per candidate formula on the training data and record,
# for each fit: rounded AIC and BIC, the log-likelihood object, its degrees of
# freedom, and the normalized weighted Gini on the training and testing data.
#
# Results are kept in parallel lists (one element per formula, same order as
# `formulas`). The lists are preallocated and indexed by the loop position
# instead of being grown with a hand-maintained counter.
n_models <- length(formulas)
AIC_l <- vector("list", n_models)
BIC_l <- vector("list", n_models)
LogLik_l <- vector("list", n_models)
df_l <- vector("list", n_models)
trn_gini_l <- vector("list", n_models)
test_gini_l <- vector("list", n_models)

for (i in seq_along(formulas)) {
  formula <- formulas[[i]]
  print(formula)

  # Modeling
  model <- glm(formula, family = "poisson", data = training_data)

  # Prediction on the response scale (expected counts); the generic
  # dispatches to predict.glm for a glm fit.
  test_pred_loss <- predict(model, newdata = testing_data, type = "response")
  train_pred_loss <- predict(model, newdata = training_data, type = "response")

  # Scores. logLik() is evaluated once and reused for its "df" attribute.
  model_loglik <- logLik(model)
  AIC_l[[i]] <- round(AIC(model), digits = 0)
  BIC_l[[i]] <- round(BIC(model), digits = 0)
  LogLik_l[[i]] <- model_loglik
  df_l[[i]] <- attr(model_loglik, "df")

  # NOTE(review): NormalizedWeightedGini is not defined in this notebook;
  # the call passes observed response, prediction, and ecy (presumably used
  # as the weight) -- confirm the argument order against its definition.
  trn_gini_l[[i]] <- NormalizedWeightedGini(
    training_data$cova_ic_nc_water, train_pred_loss, training_data$ecy
  )
  test_gini_l[[i]] <- NormalizedWeightedGini(
    testing_data$cova_ic_nc_water, test_pred_loss, testing_data$ecy
  )
}
cova_ic_nc_water ~ log_ecy + log_sqft + log_yearbuilt + roofcd + 
    usagetype + cova_deductible + log_water_risk_3_blk
cova_ic_nc_water ~ landlordind + log_ecy + log_sqft + log_yearbuilt + 
    roofcd + usagetype + cova_deductible + log_water_risk_3_blk
cova_ic_nc_water ~ landlordind + poolind + log_ecy + log_sqft + 
    log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk
cova_ic_nc_water ~ landlordind + poolind + multipolicyind + log_ecy + 
    log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + 
    log_water_risk_3_blk
cova_ic_nc_water ~ poolind + multipolicyind + log_ecy + log_sqft + 
    log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk
cova_ic_nc_water ~ landlordind + multipolicyind + log_ecy + log_sqft + 
    log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk
In [18]:
# Collect the per-model results into one table: one row per candidate formula,
# columns in the order they are written to disk.
Log <- data.frame(
  formulas   = unlist(formulas_s),
  AIC        = unlist(AIC_l),
  BIC        = unlist(BIC_l),
  logLik     = unlist(LogLik_l),
  df         = unlist(df_l),
  train_gini = unlist(trn_gini_l),
  test_gini  = unlist(test_gini_l)
)

# Save the table as comma-separated text with a header row and no row names.
write.table(
  Log,
  paste0(ModelsDir, "frequency_tuning.csv"),
  sep = ",",
  row.names = FALSE,
  col.names = TRUE
)
In [19]:
# Display the tuning table (one row per candidate formula) in the cell output.
Log
formulas AIC BIC logLik df train_gini test_gini
cova_ic_nc_water ~ log_ecy + log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk 114058 114278 -57011.06 18 0.3794492 0.3972265
cova_ic_nc_water ~ landlordind + log_ecy + log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk 114047 114279 -57004.27 19 0.3802589 0.4041143
cova_ic_nc_water ~ landlordind + poolind + log_ecy + log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk 114015 114259 -56987.37 20 0.3821256 0.4075710
cova_ic_nc_water ~ landlordind + poolind + multipolicyind + log_ecy + log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk 114013 114270 -56985.70 21 0.3821588 0.4076518
cova_ic_nc_water ~ poolind + multipolicyind + log_ecy + log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk 114025 114270 -56992.47 20 0.3813627 0.4011727
cova_ic_nc_water ~ landlordind + multipolicyind + log_ecy + log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + log_water_risk_3_blk 114046 114290 -57002.85 20 0.3802821 0.4042483
In [20]:
# Refit the third candidate (baseline terms plus landlordind and poolind) as a
# Poisson GLM on the training data and print its coefficient summary.
# NOTE(review): log_ecy enters as an ordinary covariate with an estimated
# coefficient rather than as offset(log_ecy) -- confirm this is intended.
Model <- glm(
  cova_ic_nc_water ~ landlordind + poolind + log_ecy + log_sqft +
    log_yearbuilt + roofcd + usagetype + cova_deductible +
    log_water_risk_3_blk,
  family = "poisson",
  data = training_data
)
summary(Model)
Call:
glm(formula = cova_ic_nc_water ~ landlordind + poolind + log_ecy + 
    log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible + 
    log_water_risk_3_blk, family = "poisson", data = training_data)

Deviance Residuals: 
    Min       1Q   Median       3Q      Max  
-0.3675  -0.1351  -0.1002  -0.0683   5.4848  

Coefficients:
                       Estimate Std. Error z value Pr(>|z|)    
(Intercept)          -1.157e+02  8.565e+00 -13.508  < 2e-16 ***
landlordind          -2.395e-01  6.510e-02  -3.678 0.000235 ***
poolind               2.930e-01  4.849e-02   6.042 1.52e-09 ***
log_ecy               9.423e-01  1.917e-02  49.159  < 2e-16 ***
log_sqft              5.665e-01  2.928e-02  19.349  < 2e-16 ***
log_yearbuilt         1.348e+01  1.133e+00  11.902  < 2e-16 ***
roofcdMEMBRANE       -1.250e-02  9.594e-02  -0.130 0.896370    
roofcdMETAL           1.922e-01  1.902e-01   1.011 0.312089    
roofcdOTHER           9.125e-02  3.237e-02   2.819 0.004812 ** 
roofcdTAR            -3.050e-03  7.853e-02  -0.039 0.969019    
roofcdTILE            9.665e-02  2.783e-02   3.473 0.000514 ***
roofcdWOOD            1.466e-01  9.753e-02   1.503 0.132924    
usagetypePRIMARY      2.357e+00  5.777e-01   4.080 4.50e-05 ***
usagetypeRENTAL       2.038e+00  5.778e-01   3.526 0.000421 ***
usagetypeSEASONAL     2.100e+00  6.012e-01   3.492 0.000479 ***
usagetypeSECONDARY    1.161e+00  7.304e-01   1.590 0.111908    
usagetypeUNOCCUPIED  -6.227e+00  4.507e+01  -0.138 0.890121    
usagetypeVACANT      -1.127e+00  1.155e+00  -0.976 0.329060    
cova_deductible      -3.243e-04  1.435e-05 -22.602  < 2e-16 ***
log_water_risk_3_blk  5.493e-01  2.331e-02  23.564  < 2e-16 ***
---
Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1

(Dispersion parameter for poisson family taken to be 1)

    Null deviance: 101039  on 1517325  degrees of freedom
Residual deviance:  94301  on 1517306  degrees of freedom
AIC: 114015

Number of Fisher Scoring iterations: 12
In [21]:
# Refit the fourth candidate (baseline terms plus landlordind, poolind and
# multipolicyind) as a Poisson GLM on the training data and print its
# coefficient summary. This reassigns `Model`, replacing any earlier fit
# stored under that name.
Model <- glm(
  cova_ic_nc_water ~ landlordind + poolind + multipolicyind + log_ecy +
    log_sqft + log_yearbuilt + roofcd + usagetype + cova_deductible +
    log_water_risk_3_blk,
  family = "poisson",
  data = training_data
)
summary(Model)
Call:
glm(formula = cova_ic_nc_water ~ landlordind + poolind + multipolicyind + 
    log_ecy + log_sqft + log_yearbuilt + roofcd + usagetype + 
    cova_deductible + log_water_risk_3_blk, family = "poisson", 
    data = training_data)

Deviance Residuals: 
    Min       1Q   Median       3Q      Max  
-0.3609  -0.1351  -0.1001  -0.0683   5.4851  

Coefficients:
                       Estimate Std. Error z value Pr(>|z|)    
(Intercept)          -1.163e+02  8.569e+00 -13.569  < 2e-16 ***
landlordind          -2.321e-01  6.523e-02  -3.558 0.000373 ***
poolind               2.953e-01  4.850e-02   6.088 1.15e-09 ***
multipolicyind       -4.933e-02  2.712e-02  -1.819 0.068932 .  
log_ecy               9.422e-01  1.917e-02  49.159  < 2e-16 ***
log_sqft              5.656e-01  2.928e-02  19.320  < 2e-16 ***
log_yearbuilt         1.356e+01  1.133e+00  11.965  < 2e-16 ***
roofcdMEMBRANE       -1.316e-02  9.594e-02  -0.137 0.890895    
roofcdMETAL           1.977e-01  1.902e-01   1.039 0.298619    
roofcdOTHER           9.105e-02  3.237e-02   2.813 0.004907 ** 
roofcdTAR            -2.419e-03  7.853e-02  -0.031 0.975431    
roofcdTILE            9.656e-02  2.783e-02   3.470 0.000521 ***
roofcdWOOD            1.480e-01  9.753e-02   1.517 0.129145    
usagetypePRIMARY      2.368e+00  5.777e-01   4.099 4.15e-05 ***
usagetypeRENTAL       2.038e+00  5.778e-01   3.526 0.000421 ***
usagetypeSEASONAL     2.106e+00  6.012e-01   3.503 0.000460 ***
usagetypeSECONDARY    1.177e+00  7.305e-01   1.611 0.107263    
usagetypeUNOCCUPIED  -6.227e+00  4.507e+01  -0.138 0.890116    
usagetypeVACANT      -1.127e+00  1.155e+00  -0.976 0.328986    
cova_deductible      -3.253e-04  1.436e-05 -22.646  < 2e-16 ***
log_water_risk_3_blk  5.480e-01  2.333e-02  23.491  < 2e-16 ***
---
Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1

(Dispersion parameter for poisson family taken to be 1)

    Null deviance: 101039  on 1517325  degrees of freedom
Residual deviance:  94298  on 1517305  degrees of freedom
AIC: 114013

Number of Fisher Scoring iterations: 12