HousePrices|TrainTest|FE
Feature engineered dataset for House Price forecast to be used to train models
@kaggle.ravi20076_housepricestraintestfe
Feature engineered dataset for House Price forecast to be used to train models
@kaggle.ravi20076_housepricestraintestfe
This dataset was created by privately running the public kernel for the House Price forecast starter competition. The reference notebook is linked below:
https://www.kaggle.com/code/venkatapadavala/house-prices-advanced-regression-practice
I will use this dataset directly in my training kernel to train ML models and produce my submission. The dataset is quite comprehensive, with null imputation and secondary feature creation already applied, and even a simple model trained on it yields a good public score in the original kernel.
-- Table xtest: feature columns for the test split.
-- A trailing "-- ..." comment on a column appears to record the original
-- column header before it was normalized into the quoted identifier
-- (TODO confirm against the source files).
-- The separating comma must come BEFORE such a comment; a comma written
-- inside the comment is invisible to the parser and fuses two columns.
CREATE TABLE xtest (
    "unnamed_0" BIGINT, -- Unnamed: 0
    "lotfrontage" DOUBLE,
    "lotarea" DOUBLE,
    "overallqual" BIGINT,
    "overallcond" DOUBLE,
    "yearbuilt" BIGINT,
    "yearremod_add" DOUBLE,
    "masvnrarea" DOUBLE,
    "bsmtfinsf1" DOUBLE,
    "bsmtfinsf2" DOUBLE,
    "bsmtunfsf" DOUBLE,
    "totalbsmtsf" DOUBLE,
    "n_1stflrsf" DOUBLE, -- 1stFlrSF
    "n_2ndflrsf" DOUBLE, -- 2ndFlrSF
    "lowqualfinsf" DOUBLE,
    "grlivarea" DOUBLE,
    "bsmtfullbath" DOUBLE,
    "bsmthalfbath" DOUBLE,
    "fullbath" BIGINT,
    "halfbath" DOUBLE,
    "bedroomabvgr" BIGINT,
    "kitchenabvgr" DOUBLE,
    "totrmsabvgrd" DOUBLE,
    "fireplaces" DOUBLE,
    "garagecars" DOUBLE,
    "garagearea" DOUBLE,
    "wooddecksf" DOUBLE,
    "openporchsf" DOUBLE,
    "enclosedporch" DOUBLE,
    "n_3ssnporch" DOUBLE, -- 3SsnPorch
    "screenporch" DOUBLE,
    "poolarea" DOUBLE,
    "miscval" DOUBLE,
    "sqftperroom" DOUBLE,
    "total_home_quality" BIGINT,
    "total_bathrooms" DOUBLE,
    "highqualsf" DOUBLE,
    "age" DOUBLE,
    "renovate" DOUBLE,
    "mssubclass_120" DOUBLE,
    "mssubclass_150" DOUBLE,
    "mssubclass_160" DOUBLE,
    "mssubclass_180" DOUBLE,
    "mssubclass_190" DOUBLE,
    "mssubclass_20" DOUBLE,
    "mssubclass_30" DOUBLE,
    "mssubclass_40" DOUBLE,
    "mssubclass_45" DOUBLE,
    "mssubclass_50" DOUBLE,
    "mssubclass_60" DOUBLE,
    "mssubclass_70" DOUBLE,
    "mssubclass_75" DOUBLE,
    "mssubclass_80" DOUBLE,
    "mssubclass_85" DOUBLE,
    "mssubclass_90" DOUBLE,
    "mszoning_a_agr" DOUBLE, -- MSZoning A (agr)
    "mszoning_c_all" DOUBLE, -- MSZoning C (all)
    "mszoning_fv" DOUBLE,
    "mszoning_i_all" DOUBLE, -- MSZoning I (all)
    "mszoning_none" DOUBLE,
    "mszoning_rh" DOUBLE,
    "mszoning_rl" BIGINT,
    "mszoning_rm" DOUBLE,
    "street_grvl" DOUBLE,
    "street_pave" BIGINT,
    "alley_grvl" DOUBLE,
    "alley_none" BIGINT,
    "alley_pave" DOUBLE,
    "lotshape_ir1" DOUBLE,
    "lotshape_ir2" DOUBLE,
    "lotshape_ir3" DOUBLE,
    "lotshape_reg" BIGINT,
    "landcontour_bnk" DOUBLE,
    "landcontour_hls" DOUBLE,
    "landcontour_low" DOUBLE,
    "landcontour_lvl" BIGINT,
    "utilities_allpub" BIGINT,
    "utilities_nosewa" DOUBLE,
    "utilities_nosewr" DOUBLE,
    "utilities_none" DOUBLE,
    "lotconfig_corner" DOUBLE,
    "lotconfig_culdsac" DOUBLE,
    "lotconfig_fr2" DOUBLE,
    "lotconfig_fr3" DOUBLE,
    "lotconfig_inside" BIGINT,
    "landslope_gtl" BIGINT,
    "landslope_mod" DOUBLE,
    "landslope_sev" DOUBLE,
    "neighborhood_blmngtn" DOUBLE,
    "neighborhood_blueste" DOUBLE,
    "neighborhood_brdale" DOUBLE,
    "neighborhood_brkside" DOUBLE,
    "neighborhood_clearcr" DOUBLE,
    "neighborhood_collgcr" DOUBLE,
    "neighborhood_crawfor" DOUBLE,
    "neighborhood_edwards" DOUBLE,
    "neighborhood_gilbert" DOUBLE,
    "neighborhood_greens" DOUBLE,
    "neighborhood_grnhill" DOUBLE,
    "neighborhood_idotrr" DOUBLE
);

-- Table xytrain: training split; the columns listed here match xtest one-for-one.
-- NOTE(review): no target column (e.g. a sale price) appears in this
-- listing — confirm whether the column list shown here is truncated.
CREATE TABLE xytrain (
    "unnamed_0" BIGINT, -- Unnamed: 0
    "lotfrontage" DOUBLE,
    "lotarea" DOUBLE,
    "overallqual" BIGINT,
    "overallcond" DOUBLE,
    "yearbuilt" BIGINT,
    "yearremod_add" DOUBLE,
    "masvnrarea" DOUBLE,
    "bsmtfinsf1" DOUBLE,
    "bsmtfinsf2" DOUBLE,
    "bsmtunfsf" DOUBLE,
    "totalbsmtsf" DOUBLE,
    "n_1stflrsf" DOUBLE, -- 1stFlrSF
    "n_2ndflrsf" DOUBLE, -- 2ndFlrSF
    "lowqualfinsf" DOUBLE,
    "grlivarea" DOUBLE,
    "bsmtfullbath" DOUBLE,
    "bsmthalfbath" DOUBLE,
    "fullbath" BIGINT,
    "halfbath" DOUBLE,
    "bedroomabvgr" BIGINT,
    "kitchenabvgr" DOUBLE,
    "totrmsabvgrd" DOUBLE,
    "fireplaces" DOUBLE,
    "garagecars" DOUBLE,
    "garagearea" DOUBLE,
    "wooddecksf" DOUBLE,
    "openporchsf" DOUBLE,
    "enclosedporch" DOUBLE,
    "n_3ssnporch" DOUBLE, -- 3SsnPorch
    "screenporch" DOUBLE,
    "poolarea" DOUBLE,
    "miscval" DOUBLE,
    "sqftperroom" DOUBLE,
    "total_home_quality" BIGINT,
    "total_bathrooms" DOUBLE,
    "highqualsf" DOUBLE,
    "age" DOUBLE,
    "renovate" DOUBLE,
    "mssubclass_120" DOUBLE,
    "mssubclass_150" DOUBLE,
    "mssubclass_160" DOUBLE,
    "mssubclass_180" DOUBLE,
    "mssubclass_190" DOUBLE,
    "mssubclass_20" DOUBLE,
    "mssubclass_30" DOUBLE,
    "mssubclass_40" DOUBLE,
    "mssubclass_45" DOUBLE,
    "mssubclass_50" DOUBLE,
    "mssubclass_60" DOUBLE,
    "mssubclass_70" DOUBLE,
    "mssubclass_75" DOUBLE,
    "mssubclass_80" DOUBLE,
    "mssubclass_85" DOUBLE,
    "mssubclass_90" DOUBLE,
    "mszoning_a_agr" DOUBLE, -- MSZoning A (agr)
    "mszoning_c_all" DOUBLE, -- MSZoning C (all)
    "mszoning_fv" DOUBLE,
    "mszoning_i_all" DOUBLE, -- MSZoning I (all)
    "mszoning_none" DOUBLE,
    "mszoning_rh" DOUBLE,
    "mszoning_rl" BIGINT,
    "mszoning_rm" DOUBLE,
    "street_grvl" DOUBLE,
    "street_pave" BIGINT,
    "alley_grvl" DOUBLE,
    "alley_none" BIGINT,
    "alley_pave" DOUBLE,
    "lotshape_ir1" DOUBLE,
    "lotshape_ir2" DOUBLE,
    "lotshape_ir3" DOUBLE,
    "lotshape_reg" BIGINT,
    "landcontour_bnk" DOUBLE,
    "landcontour_hls" DOUBLE,
    "landcontour_low" DOUBLE,
    "landcontour_lvl" BIGINT,
    "utilities_allpub" BIGINT,
    "utilities_nosewa" DOUBLE,
    "utilities_nosewr" DOUBLE,
    "utilities_none" DOUBLE,
    "lotconfig_corner" DOUBLE,
    "lotconfig_culdsac" DOUBLE,
    "lotconfig_fr2" DOUBLE,
    "lotconfig_fr3" DOUBLE,
    "lotconfig_inside" BIGINT,
    "landslope_gtl" BIGINT,
    "landslope_mod" DOUBLE,
    "landslope_sev" DOUBLE,
    "neighborhood_blmngtn" DOUBLE,
    "neighborhood_blueste" DOUBLE,
    "neighborhood_brdale" DOUBLE,
    "neighborhood_brkside" DOUBLE,
    "neighborhood_clearcr" DOUBLE,
    "neighborhood_collgcr" DOUBLE,
    "neighborhood_crawfor" DOUBLE,
    "neighborhood_edwards" DOUBLE,
    "neighborhood_gilbert" DOUBLE,
    "neighborhood_greens" DOUBLE,
    "neighborhood_grnhill" DOUBLE,
    "neighborhood_idotrr" DOUBLE
);
Anyone who has the link will be able to view this.