DEVELOPMENT... { "data_id": "45656", "name": "simulated_adult", "exact_name": "simulated_adult", "version": 1, "version_label": null, "description": "See [https:\/\/github.com\/slds-lmu\/paper_2023_ci_for_ge](https:\/\/github.com\/slds-lmu\/paper_2023_ci_for_ge) for a description.", "format": "arff", "uploader": "Shirley ", "uploader_id": 30127, "visibility": "public", "creator": "\"Sebastian Fischer\"", "contributor": null, "date": "2023-08-30 09:56:28", "update_comment": null, "last_update": "2023-08-30 09:56:28", "licence": "CC BY 4.0", "status": "active", "error_message": null, "url": "https:\/\/api.openml.org\/data\/download\/22117141\/dataset", "default_target_attribute": "class", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "simulated_adult", "See [https:\/\/github.com\/slds-lmu\/paper_2023_ci_for_ge](https:\/\/github.com\/slds-lmu\/paper_2023_ci_for_ge) for a description. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 5100000, "NumberOfFeatures": 15, "NumberOfClasses": 2, "NumberOfMissingValues": 68, "NumberOfInstancesWithMissingValues": 68, "NumberOfNumericFeatures": 6, "NumberOfSymbolicFeatures": 9, "PercentageOfSymbolicFeatures": 60, "AutoCorrelation": 0.6262273776916427, "PercentageOfNumericFeatures": 40, "PercentageOfMissingValues": 8.888888888888889e-5, "PercentageOfInstancesWithMissingValues": 0.0013333333333333333, "PercentageOfBinaryFeatures": 13.333333333333334, "NumberOfBinaryFeatures": 2, "MinorityClassSize": 1267954, "MinorityClassPercentage": 24.8618431372549, "MajorityClassSize": 3832046, "MajorityClassPercentage": 75.13815686274509, "Dimensionality": 2.9411764705882355e-6 }, "tags": [ { "tag": "study_396", "uploader": "0" } ], "features": [ { "name": "class", "index": "14", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "<=50K", ">50K" ], [ [ "3832046", "0" ], [ "0", "1267954" ] ] ] }, { "name": "age", "index": "0", "type": "numeric", "distinct": "76", "missing": "0", "min": "0", "max": "99", "mean": "36", "stdev": "12" }, { "name": "workclass", "index": "1", "type": "nominal", "distinct": "7", "missing": "2", "distr": [ [ "Federal-gov", "Local-gov", "Private", "Self-emp-inc", "Self-emp-not-inc", "State-gov", "Without-pay" ], [ [ "32379", "31240" ], [ "113962", "64270" ], [ "3416786", "994159" ], [ "33211", "75419" ], [ "169205", "75156" ], [ "66314", "27701" ], [ "189", "7" ] ] ] }, { "name": "fnlwgt", "index": "2", "type": "numeric", "distinct": "34775", "missing": "0", "min": "2", "max": "27999996", "mean": "182280", "stdev": "94293" }, { "name": "education", "index": "3", "type": "nominal", "distinct": "16", "missing": "29", "distr": [ [ "10th", "11th", "12th", "1st-4th", "5th-6th", "7th-8th", "9th", "Assoc-acdm", "Assoc-voc", "Bachelors", "Doctorate", "HS-grad", "Masters", "Preschool", "Prof-school", "Some-college" ], [ [ "58995", "2431" ], [ "99073", "2572" ], [ "19738", "702" ], [ "3980", "134" ], [ "13855", "336" ], [ "30075", "1295" ], [ "25001", "883" ], [ "62431", "24385" ], [ "102385", "32455" ], [ "446904", "467319" ], [ "4210", "23204" ], [ "1953378", "301969" ], [ "63084", "147815" ], [ "951", "17" ], [ "7421", "40708" ], [ "940539", "221726" ] ] ] }, { "name": "education-num", "index": "4", "type": "numeric", "distinct": "19", "missing": "0", "min": "0", "max": "18", "mean": "10", "stdev": "2" }, { "name": "marital-status", "index": "5", "type": "nominal", "distinct": "7", "missing": "4", "distr": [ [ "Divorced", "Married-AF-spouse", "Married-civ-spouse", "Married-spouse-absent", "Never-married", "Separated", "Widowed" ], [ [ "579972", "24505" ], [ "232", "80" ], [ "1407973", "1207046" ], [ "13644", "628" ], [ "1715436", "32456" ], [ "63324", "1510" ], [ "51462", "1728" ] ] ] }, { "name": "occupation", "index": "6", "type": "nominal", "distinct": "14", "missing": "23", "distr": [ [ "Adm-clerical", "Armed-Forces", "Craft-repair", "Exec-managerial", "Farming-fishing", "Handlers-cleaners", "Machine-op-inspct", "Other-service", "Priv-house-serv", "Prof-specialty", "Protective-serv", "Sales", "Tech-support", "Transport-moving" ], [ [ "637888", "55346" ], [ "97", "12" ], [ "785872", "203544" ], [ "313294", "401488" ], [ "75576", "8610" ], [ "212854", "7860" ], [ "332304", "37723" ], [ "468239", "6693" ], [ "6157", "49" ], [ "286434", "291298" ], [ "36070", "16738" ], [ "429845", "169385" ], [ "65301", "27572" ], [ "182096", "41632" ] ] ] }, { "name": "relationship", "index": "7", "type": "nominal", "distinct": "6", "missing": "6", "distr": [ [ "Husband", "Not-in-family", "Other-relative", "Own-child", "Unmarried", "Wife" ], [ [ "1336944", "1143536" ], [ "1177003", "51655" ], [ "64167", "429" ], [ "810283", "1849" ], [ "378332", "7386" ], [ "65311", "63099" ] ] ] }, { "name": "race", "index": "8", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "Amer-Indian-Eskimo", "Asian-Pac-Islander", "Black", "Other", "White" ], [ [ "7687", "650" ], [ "31699", "10104" ], [ "228321", "18673" ], [ "4803", "387" ], [ "3559536", "1238140" ] ] ] }, { "name": "sex", "index": "9", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "Female", "Male" ], [ [ "1330045", "85711" ], [ "2502001", "1182243" ] ] ] }, { "name": "capital-gain", "index": "10", "type": "numeric", "distinct": "121", "missing": "0", "min": "0", "max": "99999", "mean": "375", "stdev": "4375" }, { "name": "capital-loss", "index": "11", "type": "numeric", "distinct": "91", "missing": "0", "min": "0", "max": "99999", "mean": "21", "stdev": "205" }, { "name": "hours-per-week", "index": "12", "type": "numeric", "distinct": "91", "missing": "0", "min": "1", "max": "99", "mean": "41", "stdev": "8" }, { "name": "native-country", "index": "13", "type": "nominal", "distinct": "41", "missing": "4", "distr": [ [ "Cambodia", "Canada", "China", "Columbia", "Cuba", "Dominican-Republic", "Ecuador", "El-Salvador", "England", "France", "Germany", "Greece", "Guatemala", "Haiti", "Holand-Netherlands", "Honduras", "Hong", "Hungary", "India", "Iran", "Ireland", "Italy", "Jamaica", "Japan", "Laos", "Mexico", "Nicaragua", "Outlying-US(Guam-USVI-etc)", "Peru", "Philippines", "Poland", "Portugal", "Puerto-Rico", "Scotland", "South", "Taiwan", "Thailand", "Trinadad&Tobago", "United-States", "Vietnam", "Yugoslavia" ], [ [ "423", "74" ], [ "1637", "1082" ], [ "1624", "890" ], [ "1513", "44" ], [ "1430", "399" ], [ "1911", "40" ], [ "530", "77" ], [ "3672", "105" ], [ "726", "786" ], [ "136", "161" ], [ "2146", "728" ], [ "435", "479" ], [ "2317", "22" ], [ "1140", "58" ], [ "2", "0" ], [ "418", "1" ], [ "383", "94" ], [ "114", "86" ], [ "1618", "1532" ], [ "390", "398" ], [ "653", "230" ], [ "1030", "461" ], [ "1595", "151" ], [ "641", "637" ], [ "247", "34" ], [ "30625", "643" ], [ "431", "28" ], [ "184", "10" ], [ "438", "44" ], [ "4972", "1850" ], [ "1294", "352" ], [ "2310", "566" ], [ "3164", "275" ], [ "185", "33" ], [ "1975", "334" ], [ "538", "646" ], [ "201", "37" ], [ "355", "32" ], [ "3756627", "1254287" ], [ "1827", "121" ], [ "185", "127" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }