DEVELOPMENT... { "data_id": "43443", "name": "Filipino-Family-Income-and-Expenditure", "exact_name": "Filipino-Family-Income-and-Expenditure", "version": 1, "version_label": "v1.0", "description": "Context\nThe Philippine Statistics Authority (PSA) spearheads the conduct of the Family Income and Expenditure Survey (FIES) nationwide. The survey, which is undertaken every three (3) years, is aimed at providing data on family income and expenditure, including, among others, levels of consumption by item of expenditure, sources of income in cash, and related information affecting income and expenditure levels and patterns in the Philippines.\nContent\nInside this data set is some selected variables from the latest Family Income and Expenditure Survey (FIES) in the Philippines. It contains more than 40k observations and 60 variables which is primarily comprised of the household income and expenditures of that specific household\nAcknowledgements\nThe Philippine Statistics Authority for providing the publisher with their raw data\nInspiration\nSocio-economic classification models in the Philippines has been very problematic. In fact, not one SEC model has been widely accepted. Government bodies uses their own SEC models and private research entities uses their own. We all know that household income is the greatest indicator of one's socio-economic classification that's why the publisher would like to find out the following:\n1) Best model in predicting household income\n2) Key drivers of household income, we want to make the model as sparse as possible\n3) Some exploratory analysis in the data would also be useful", "format": "arff", "uploader": " Stewart", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-23 13:21:21", "update_comment": null, "last_update": "2022-03-23 13:21:21", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102268\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Filipino-Family-Income-and-Expenditure", "Context The Philippine Statistics Authority (PSA) spearheads the conduct of the Family Income and Expenditure Survey (FIES) nationwide. The survey, which is undertaken every three (3) years, is aimed at providing data on family income and expenditure, including, among others, levels of consumption by item of expenditure, sources of income in cash, and related information affecting income and expenditure levels and patterns in the Philippines. Content Inside this data set is some selected variabl " ], "weight": 5 }, "qualities": { "NumberOfInstances": 41544, "NumberOfFeatures": 60, "NumberOfClasses": null, "NumberOfMissingValues": 15072, "NumberOfInstancesWithMissingValues": 7536, "NumberOfNumericFeatures": 45, "NumberOfSymbolicFeatures": 0, "PercentageOfSymbolicFeatures": 0, "AutoCorrelation": null, "PercentageOfNumericFeatures": 75, "PercentageOfMissingValues": 0.6046601193914886, "PercentageOfInstancesWithMissingValues": 18.13980358174466, "PercentageOfBinaryFeatures": 0, "NumberOfBinaryFeatures": 0, "MinorityClassSize": null, "MinorityClassPercentage": null, "MajorityClassSize": null, "MajorityClassPercentage": null, "Dimensionality": 0.0014442518775274408 }, "tags": [], "features": [ { "name": "Electricity", "index": "45", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "Household_Head_Class_of_Worker", "index": "31", "type": "string", "distinct": "7", "missing": "7536" }, { "name": "Type_of_Household", "index": "32", "type": "string", "distinct": "3", "missing": "0" }, { "name": "Total_Number_of_Family_members", "index": "33", "type": "numeric", "distinct": "21", "missing": "0", "min": "1", "max": "26", "mean": "5", "stdev": "2" }, { "name": "Members_with_age_less_than_5_year_old", "index": "34", "type": "numeric", "distinct": "6", "missing": "0", "min": "0", "max": "5", "mean": "0", "stdev": "1" }, { "name": "Members_with_age_5_-_17_years_old", "index": "35", "type": "numeric", "distinct": "9", "missing": "0", "min": "0", "max": "8", "mean": "1", "stdev": "1" }, { "name": "Total_number_of_family_members_employed", "index": "36", "type": "numeric", "distinct": "9", "missing": "0", "min": "0", "max": "8", "mean": "1", "stdev": "1" }, { "name": "Type_of_Building\/House", "index": "37", "type": "string", "distinct": "6", "missing": "0" }, { "name": "Type_of_Roof", "index": "38", "type": "string", "distinct": "7", "missing": "0" }, { "name": "Type_of_Walls", "index": "39", "type": "string", "distinct": "6", "missing": "0" }, { "name": "House_Floor_Area", "index": "40", "type": "numeric", "distinct": "313", "missing": "0", "min": "5", "max": "998", "mean": "56", "stdev": "55" }, { "name": "House_Age", "index": "41", "type": "numeric", "distinct": "111", "missing": "0", "min": "0", "max": "200", "mean": "20", "stdev": "14" }, { "name": "Number_of_bedrooms", "index": "42", "type": "numeric", "distinct": "10", "missing": "0", "min": "0", "max": "9", "mean": "2", "stdev": "1" }, { "name": "Tenure_Status", "index": "43", "type": "string", "distinct": "8", "missing": "0" }, { "name": "Toilet_Facilities", "index": "44", "type": "string", "distinct": "8", "missing": "0" }, { "name": "Household_Head_Occupation", "index": "30", "type": "string", "distinct": "378", "missing": "7536" }, { "name": "Main_Source_of_Water_Supply", "index": "46", "type": "string", "distinct": "11", "missing": "0" }, { "name": "Number_of_Television", "index": "47", "type": "numeric", "distinct": "7", "missing": "0", "min": "0", "max": "6", "mean": "1", "stdev": "1" }, { "name": "Number_of_CD\/VCD\/DVD", "index": "48", "type": "numeric", "distinct": "6", "missing": "0", "min": "0", "max": "5", "mean": "0", "stdev": "1" }, { "name": "Number_of_Component\/Stereo_set", "index": "49", "type": "numeric", "distinct": "6", "missing": "0", "min": "0", "max": "5", "mean": "0", "stdev": "0" }, { "name": "Number_of_Refrigerator\/Freezer", "index": "50", "type": "numeric", "distinct": "6", "missing": "0", "min": "0", "max": "5", "mean": "0", "stdev": "1" }, { "name": "Number_of_Washing_Machine", "index": "51", "type": "numeric", "distinct": "4", "missing": "0", "min": "0", "max": "3", "mean": "0", "stdev": "0" }, { "name": "Number_of_Airconditioner", "index": "52", "type": "numeric", "distinct": "6", "missing": "0", "min": "0", "max": "5", "mean": "0", "stdev": "0" }, { "name": "Number_of_Car,_Jeep,_Van", "index": "53", "type": "numeric", "distinct": "6", "missing": "0", "min": "0", "max": "5", "mean": "0", "stdev": "0" }, { "name": "Number_of_Landline\/wireless_telephones", "index": "54", "type": "numeric", "distinct": "5", "missing": "0", "min": "0", "max": "4", "mean": "0", "stdev": "0" }, { "name": "Number_of_Cellular_phone", "index": "55", "type": "numeric", "distinct": "11", "missing": "0", "min": "0", "max": "10", "mean": "2", "stdev": "2" }, { "name": "Number_of_Personal_Computer", "index": "56", "type": "numeric", "distinct": "7", "missing": "0", "min": "0", "max": "6", "mean": "0", "stdev": "1" }, { "name": "Number_of_Stove_with_Oven\/Gas_Range", "index": "57", "type": "numeric", "distinct": "4", "missing": "0", "min": "0", "max": "3", "mean": "0", "stdev": "0" }, { "name": "Number_of_Motorized_Banca", "index": "58", "type": "numeric", "distinct": "4", "missing": "0", "min": "0", "max": "3", "mean": "0", "stdev": "0" }, { "name": "Number_of_Motorcycle\/Tricycle", "index": "59", "type": "numeric", "distinct": "6", "missing": "0", "min": "0", "max": "5", "mean": "0", "stdev": "1" }, { "name": "Housing_and_water_Expenditure", "index": "15", "type": "numeric", "distinct": "13243", "missing": "0", "min": "1950", "max": "2188560", "mean": "38375", "stdev": "53112" }, { "name": "Region", "index": "1", "type": "string", "distinct": "17", "missing": "0" }, { "name": "Total_Food_Expenditure", "index": "2", "type": "numeric", "distinct": "35776", "missing": "0", "min": "2947", "max": "827565", "mean": "85099", "stdev": "51638" }, { "name": "Main_Source_of_Income", "index": "3", "type": "string", "distinct": "3", "missing": "0" }, { "name": "Agricultural_Household_indicator", "index": "4", "type": "numeric", "distinct": "3", "missing": "0", "min": "0", "max": "2", "mean": "0", "stdev": "1" }, { "name": "Bread_and_Cereals_Expenditure", "index": "5", "type": "numeric", "distinct": "26082", "missing": "0", "min": "0", "max": "765864", "mean": "25134", "stdev": "13466" }, { "name": "Total_Rice_Expenditure", "index": "6", "type": "numeric", "distinct": "16145", "missing": "0", "min": "0", "max": "758326", "mean": "18196", "stdev": "11727" }, { "name": "Meat_Expenditure", "index": "7", "type": "numeric", "distinct": "18619", "missing": "0", "min": "0", "max": "261566", "mean": "10540", "stdev": "10498" }, { "name": "Total_Fish_and__marine_products_Expenditure", "index": "8", "type": "numeric", "distinct": "18014", "missing": "0", "min": "0", "max": "188208", "mean": "10529", "stdev": "7812" }, { "name": "Fruit_Expenditure", "index": "9", "type": "numeric", "distinct": "7140", "missing": "0", "min": "0", "max": "273769", "mean": "2550", "stdev": "2970" }, { "name": "Vegetables_Expenditure", "index": "10", "type": "numeric", "distinct": "10599", "missing": "0", "min": "0", "max": "74800", "mean": "5007", "stdev": "3300" }, { "name": "Restaurant_and_hotels_Expenditure", "index": "11", "type": "numeric", "distinct": "12367", "missing": "0", "min": "0", "max": "725296", "mean": "15437", "stdev": "23705" }, { "name": "Alcoholic_Beverages_Expenditure", "index": "12", "type": "numeric", "distinct": "4084", "missing": "0", "min": "0", "max": "59592", "mean": "1085", "stdev": "2174" }, { "name": "Tobacco_Expenditure", "index": "13", "type": "numeric", "distinct": "3118", "missing": "0", "min": "0", "max": "139370", "mean": "2295", "stdev": "3999" }, { "name": "Clothing,_Footwear_and_Other_Wear_Expenditure", "index": "14", "type": "numeric", "distinct": "9819", "missing": "0", "min": "0", "max": "356750", "mean": "4955", "stdev": "7497" }, { "name": "Total_Household_Income", "index": "0", "type": "numeric", "distinct": "38670", "missing": "0", "min": "11285", "max": "11815988", "mean": "247556", "stdev": "286881" }, { "name": "Imputed_House_Rental_Value", "index": "16", "type": "numeric", "distinct": "266", "missing": "0", "min": "0", "max": "1920000", "mean": "20922", "stdev": "39372" }, { "name": "Medical_Care_Expenditure", "index": "17", "type": "numeric", "distinct": "11887", "missing": "0", "min": "0", "max": "1049275", "mean": "7160", "stdev": "26902" }, { "name": "Transportation_Expenditure", "index": "18", "type": "numeric", "distinct": "7435", "missing": "0", "min": "0", "max": "834996", "mean": "11806", "stdev": "19351" }, { "name": "Communication_Expenditure", "index": "19", "type": "numeric", "distinct": "3826", "missing": "0", "min": "0", "max": "149940", "mean": "4095", "stdev": "7299" }, { "name": "Education_Expenditure", "index": "20", "type": "numeric", "distinct": "6893", "missing": "0", "min": "0", "max": "731000", "mean": "7474", "stdev": "21219" }, { "name": "Miscellaneous_Goods_and_Services_Expenditure", "index": "21", "type": "numeric", "distinct": "7669", "missing": "0", "min": "0", "max": "553560", "mean": "12522", "stdev": "17547" }, { "name": "Special_Occasions_Expenditure", "index": "22", "type": "numeric", "distinct": "3412", "missing": "0", "min": "0", "max": "556700", "mean": "5266", "stdev": "13280" }, { "name": "Crop_Farming_and_Gardening_expenses", "index": "23", "type": "numeric", "distinct": "9961", "missing": "0", "min": "0", "max": "3729973", "mean": "13817", "stdev": "47644" }, { "name": "Total_Income_from_Entrepreneurial_Acitivites", "index": "24", "type": "numeric", "distinct": "20204", "missing": "0", "min": "0", "max": "9234485", "mean": "54376", "stdev": "147143" }, { "name": "Household_Head_Sex", "index": "25", "type": "string", "distinct": "2", "missing": "0" }, { "name": "Household_Head_Age", "index": "26", "type": "numeric", "distinct": "89", "missing": "0", "min": "9", "max": "99", "mean": "51", "stdev": "14" }, { "name": "Household_Head_Marital_Status", "index": "27", "type": "string", "distinct": "6", "missing": "0" }, { "name": "Household_Head_Highest_Grade_Completed", "index": "28", "type": "string", "distinct": "46", "missing": "0" }, { "name": "Household_Head_Job_or_Business_Indicator", "index": "29", "type": "string", "distinct": "2", "missing": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }