DEVELOPMENT... { "data_id": "787", "name": "witmer_census_1980", "exact_name": "witmer_census_1980", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Felicia West", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:33:29", "update_comment": null, "last_update": "2014-10-06 03:31:44", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53321\/witmer_census_1980.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": "\"STATE\"", "runs": 117, "suggest": { "input": [ "witmer_census_1980", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 50, "NumberOfFeatures": 5, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 4, "NumberOfSymbolicFeatures": 1, "AutoCorrelation": 0.8367346938775511, "CfsSubsetEval_DecisionStumpAUC": 0.6834935897435898, "CfsSubsetEval_DecisionStumpErrRate": 0.32, "CfsSubsetEval_DecisionStumpKappa": 0.34853420195439744, "CfsSubsetEval_NaiveBayesAUC": 0.6834935897435898, "CfsSubsetEval_NaiveBayesErrRate": 0.32, "CfsSubsetEval_NaiveBayesKappa": 0.34853420195439744, "CfsSubsetEval_kNN1NAUC": 0.6834935897435898, "CfsSubsetEval_kNN1NErrRate": 0.32, "CfsSubsetEval_kNN1NKappa": 0.34853420195439744, "ClassEntropy": 0.9988455359952018, "DecisionStumpAUC": 0.6578525641025641, "DecisionStumpErrRate": 0.34, "DecisionStumpKappa": 0.3089430894308944, "Dimensionality": 0.1, "EquivalentNumberOfAtts": null, "J48.00001.AUC": 0.6498397435897436, "J48.00001.ErrRate": 0.36, "J48.00001.Kappa": 0.26948051948051954, "J48.0001.AUC": 0.6498397435897436, "J48.0001.ErrRate": 0.36, "J48.0001.Kappa": 0.26948051948051954, "J48.001.AUC": 0.6498397435897436, "J48.001.ErrRate": 0.36, "J48.001.Kappa": 0.26948051948051954, "MajorityClassPercentage": 52, "MajorityClassSize": 26, "MaxAttributeEntropy": null, "MaxKurtosisOfNumericAtts": 3.673380835740347, "MaxMeansOfNumericAtts": 9140.58, "MaxMutualInformation": null, "MaxNominalAttDistinctValues": 2, "MaxSkewnessOfNumericAtts": 0.43846074201772367, "MaxStdDevOfNumericAtts": 1289.5023892326583, "MeanAttributeEntropy": null, "MeanKurtosisOfNumericAtts": 1.5135788914315085, "MeanMeansOfNumericAtts": 2299.2974999999997, "MeanMutualInformation": null, "MeanNoiseToSignalRatio": null, "MeanNominalAttDistinctValues": 2, "MeanSkewnessOfNumericAtts": -0.03413477483522419, "MeanStdDevOfNumericAtts": 324.0958799688384, "MinAttributeEntropy": null, "MinKurtosisOfNumericAtts": -0.3030233784453502, "MinMeansOfNumericAtts": 10.958, "MinMutualInformation": null, "MinNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -0.6620636381204995, "MinStdDevOfNumericAtts": 1.6934447443128509, "MinorityClassPercentage": 48, "MinorityClassSize": 24, "NaiveBayesAUC": 0.6538461538461539, "NaiveBayesErrRate": 0.46, "NaiveBayesKappa": 0.09162717219589268, "NumberOfBinaryFeatures": 1, "PercentageOfBinaryFeatures": 20, "PercentageOfInstancesWithMissingValues": 0, "PercentageOfMissingValues": 0, "PercentageOfNumericFeatures": 80, "PercentageOfSymbolicFeatures": 20, "Quartile1AttributeEntropy": null, "Quartile1KurtosisOfNumericAtts": -0.14646403309477674, "Quartile1MeansOfNumericAtts": 12.2465, "Quartile1MutualInformation": null, "Quartile1SkewnessOfNumericAtts": -0.5269332481526318, "Quartile1StdDevOfNumericAtts": 1.8115547683913475, "Quartile2AttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 1.3419790542155183, "Quartile2MeansOfNumericAtts": 22.826, "Quartile2MutualInformation": null, "Quartile2SkewnessOfNumericAtts": 0.04353189838093953, "Quartile2StdDevOfNumericAtts": 2.5938429491912354, "Quartile3AttributeEntropy": null, "Quartile3KurtosisOfNumericAtts": 3.3452216531737835, "Quartile3MeansOfNumericAtts": 6862.819999999999, "Quartile3MutualInformation": null, "Quartile3SkewnessOfNumericAtts": 0.38099702526601964, "Quartile3StdDevOfNumericAtts": 967.8822421889325, "REPTreeDepth1AUC": 0.5825320512820513, "REPTreeDepth1ErrRate": 0.46, "REPTreeDepth1Kappa": 0.09448818897637803, "REPTreeDepth2AUC": 0.5825320512820513, "REPTreeDepth2ErrRate": 0.46, "REPTreeDepth2Kappa": 0.09448818897637803, "REPTreeDepth3AUC": 0.5825320512820513, "REPTreeDepth3ErrRate": 0.46, "REPTreeDepth3Kappa": 0.09448818897637803, "RandomTreeDepth1AUC": 0.6362179487179486, "RandomTreeDepth1ErrRate": 0.36, "RandomTreeDepth1Kappa": 0.2741935483870968, "RandomTreeDepth2AUC": 0.6362179487179486, "RandomTreeDepth2ErrRate": 0.36, "RandomTreeDepth2Kappa": 0.2741935483870968, "RandomTreeDepth3AUC": 0.6362179487179486, "RandomTreeDepth3ErrRate": 0.36, "RandomTreeDepth3Kappa": 0.2741935483870968, "StdvNominalAttDistinctValues": 0, "kNN1NAUC": 0.5785256410256411, "kNN1NErrRate": 0.42, "kNN1NKappa": 0.15730337078651668 }, "tags": [ { "tag": "binarized", "uploader": "1" }, { "tag": "mythbusting_1", "uploader": "1" }, { "tag": "study_1", "uploader": "2" }, { "tag": "study_123", "uploader": "3886" }, { "tag": "study_15", "uploader": "939" }, { "tag": "study_20", "uploader": "939" } ], "features": [ { "name": "binaryClass", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "24", "0" ], [ "0", "26" ] ] ] }, { "name": "STATE", "index": "0", "type": "nominal", "distinct": "50", "missing": "0", "ignore": "1", "distr": [ [ "Alabama", "Alaska", "Arizona", "Arkansas", "California", "Colorado", "Connecticut", "Delaware", "Florida", "Georgia", "Hawaii", "Idaho", "Illinios", "Indiana", "Iowa", "Kansas", "Kentucky", "Louisiana", "Maine", "Maryland", "Massachusetts", "Michigan", "Minnesota", "Mississippi", "Missouri", "Montana", "Nebraska", "Neveda", "New_Hampshire", "New_Jersey", "New_Mexico", "New_York", "North_Carolina", "North_Dakota", "Ohio", "Oklahoma", "Oregon", "Pennsylvania", "Rhode_Island", "South_Carolina", "South_Dakota", "Tennessee", "Texas", "Utah", "Vermont", "Virginia", "Washington", "West_Virginia", "Wisconsin", "Wyoming" ], [ [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ] ] ] }, { "name": "OVER65Perc", "index": "1", "type": "numeric", "distinct": "39", "missing": "0", "min": "3", "max": "17", "mean": "11", "stdev": "2" }, { "name": "MEDAGE", "index": "2", "type": "numeric", "distinct": "37", "missing": "0", "min": "24", "max": "35", "mean": "30", "stdev": "2" }, { "name": "PERCAP$", "index": "3", "type": "numeric", "distinct": "50", "missing": "0", "min": "6614", "max": "13007", "mean": "9141", "stdev": "1290" }, { "name": "COLLEGEPerc", "index": "4", "type": "numeric", "distinct": "39", "missing": "0", "min": "10", "max": "23", "mean": "16", "stdev": "3" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 4, "total_downloads": 5, "reach": 4, "reuse": 14, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 14 }