{ "data_id": "42164", "name": "dating_profile", "exact_name": "dating_profile", "version": 1, "version_label": "0.1", "description": "Anonymized data of dating profiles from OkCupid", "format": "arff", "uploader": "Thomas Schmitt", "uploader_id": 3422, "visibility": "public", "creator": "\"OkCupid\"", "contributor": null, "date": "2019-10-04 12:46:11", "update_comment": null, "last_update": "2019-10-04 12:46:11", "licence": "NA", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/21754538\/dataset", "default_target_attribute": "age", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "dating_profile", "Anonymized data of dating profiles from OkCupid " ], "weight": 5 }, "qualities": { "NumberOfInstances": 59946, "NumberOfFeatures": 31, "NumberOfClasses": 0, "NumberOfMissingValues": 273249, "NumberOfInstancesWithMissingValues": 55542, "NumberOfNumericFeatures": 3, "NumberOfSymbolicFeatures": 0, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": 1.2657731208364558, "MajorityClassSize": null, "MinKurtosisOfNumericAtts": 1.572517755530649, "PercentageOfBinaryFeatures": 0, "Quartile2StdDevOfNumericAtts": 9.452779096971241, "MaxAttributeEntropy": null, "MaxKurtosisOfNumericAtts": 86.87016313687228, "MinMeansOfNumericAtts": 32.340289593967825, "PercentageOfInstancesWithMissingValues": 92.65338804924433, "Quartile3AttributeEntropy": null, "MaxMeansOfNumericAtts": 20033.222533613683, "MinMutualInformation": null, "PercentageOfMissingValues": 14.704040087691824, "Quartile3KurtosisOfNumericAtts": 86.87016313687228, "MaxMutualInformation": null, "MinNominalAttDistinctValues": null, "PercentageOfNumericFeatures": 9.67741935483871, "Quartile3MeansOfNumericAtts": 20033.222533613683, "MaxNominalAttDistinctValues": null, "MinSkewnessOfNumericAtts": -0.4630608834485455, "PercentageOfSymbolicFeatures": 0, "Quartile3MutualInformation": null, "MaxSkewnessOfNumericAtts": 9.03615695641967, "MinStdDevOfNumericAtts": 3.994803134655349, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 9.03615695641967, "MaxStdDevOfNumericAtts": 97346.19210364216, "MinorityClassPercentage": null, "Quartile1KurtosisOfNumericAtts": 1.572517755530649, "Quartile3StdDevOfNumericAtts": 97346.19210364216, "MeanAttributeEntropy": null, "MinorityClassSize": null, "Quartile1MeansOfNumericAtts": 32.340289593967825, "StdvNominalAttDistinctValues": null, "MeanKurtosisOfNumericAtts": 32.06791444630804, "NumberOfBinaryFeatures": 0, "Quartile1MutualInformation": null, "MeanMeansOfNumericAtts": 6711.286034574714, "Quartile1SkewnessOfNumericAtts": -0.4630608834485455, "MeanMutualInformation": null, "Quartile1StdDevOfNumericAtts": 3.994803134655349, "AutoCorrelation": -8.740745683543247, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "ClassEntropy": null, "MeanNominalAttDistinctValues": null, "Quartile2KurtosisOfNumericAtts": 7.76106244652118, "Dimensionality": 0.0005171320855436559, "MeanSkewnessOfNumericAtts": 3.279623064602527, "Quartile2MeansOfNumericAtts": 68.29528051649076, "EquivalentNumberOfAtts": null, "MeanStdDevOfNumericAtts": 32453.213228624594, "Quartile2MutualInformation": null, "MajorityClassPercentage": null }, "tags": [], "features": [ { "name": "age", "index": "0", "type": "numeric", "distinct": "54", "missing": "0", "target": "1", "min": "18", "max": "110", "mean": "32", "stdev": "9" }, { "name": "body_type", "index": "1", "type": "string", "distinct": "12", "missing": "5296" }, { "name": "diet", "index": "2", "type": "string", "distinct": "18", "missing": "24395" }, { "name": "drinks", "index": "3", "type": "string", "distinct": "6", "missing": "2985" }, { "name": "drugs", "index": "4", "type": "string", "distinct": "3", "missing": "14080" }, { "name": "education", "index": "5", "type": "string", "distinct": "32", "missing": "6628" }, { "name": "essay0", "index": "6", "type": "string", "distinct": "54349", "missing": "5490" }, { "name": "essay1", "index": "7", "type": "string", "distinct": "51516", "missing": "7572" }, { "name": "essay2", "index": "8", "type": "string", "distinct": "48634", "missing": "9639" }, { "name": "essay3", "index": "9", "type": "string", "distinct": "43532", "missing": "11496" }, { "name": "essay4", "index": "10", "type": "string", "distinct": "49260", "missing": "10537" }, { "name": "essay5", "index": "11", "type": "string", "distinct": "48962", "missing": "10852" }, { "name": "essay6", "index": "12", "type": "string", "distinct": "43602", "missing": "13773" }, { "name": "essay7", "index": "13", "type": "string", "distinct": "45553", "missing": "12456" }, { "name": "essay8", "index": "14", "type": "string", "distinct": "39323", "missing": "19238" }, { "name": "essay9", "index": "15", "type": "string", "distinct": "45442", "missing": "12605" }, { "name": "ethnicity", "index": "16", "type": "string", "distinct": "217", "missing": "5680" }, { "name": "height", "index": "17", "type": "numeric", "distinct": "60", "missing": "3", "min": "1", "max": "95", "mean": "68", "stdev": "4" }, { "name": "income", "index": "18", "type": "numeric", "distinct": "13", "missing": "0", "min": "-1", "max": "1000000", "mean": "20033", "stdev": "97346" }, { "name": "job", "index": "19", "type": "string", "distinct": "21", "missing": "8198" }, { "name": "last_online", "index": "20", "type": "string", "distinct": "30123", "missing": "0" }, { "name": "location", "index": "21", "type": "string", "distinct": "199", "missing": "0" }, { "name": "offspring", "index": "22", "type": "string", "distinct": "15", "missing": "35561" }, { "name": "orientation", "index": "23", "type": "string", "distinct": "3", "missing": "0" }, { "name": "pets", "index": "24", "type": "string", "distinct": "15", "missing": "19921" }, { "name": "religion", "index": "25", "type": "string", "distinct": "45", "missing": "20226" }, { "name": "sex", "index": "26", "type": "string", "distinct": "2", "missing": "0" }, { "name": "sign", "index": "27", "type": "string", "distinct": "48", "missing": "11056" }, { "name": "smokes", "index": "28", "type": "string", "distinct": "5", "missing": "5512" }, { "name": "speaks", "index": "29", "type": "string", "distinct": "7647", "missing": "50" }, { "name": "status", "index": "30", "type": "string", "distinct": "5", "missing": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 1, "total_downloads": 1, "reach": 1, "reuse": 1, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 1 }