{ "data_id": "23", "name": "cmc", "exact_name": "cmc", "version": 1, "version_label": "1", "description": "**Author**: [Tjen-Sien Lim](limt@stat.wisc.edu) \r\n**Source**: [As obtained from UCI](https:\/\/archive.ics.uci.edu\/ml\/datasets\/Contraceptive+Method+Choice)\r\n**Please cite**: [UCI citation](https:\/\/archive.ics.uci.edu\/ml\/citation_policy.html)\r\n\r\n1. Title: Contraceptive Method Choice\r\n \r\n 2. Sources:\r\n (a) Origin: This dataset is a subset of the 1987 National Indonesia\r\n Contraceptive Prevalence Survey\r\n (b) Creator: Tjen-Sien Lim (limt@stat.wisc.edu)\r\n (c) Donor: Tjen-Sien Lim (limt@stat.wisc.edu)\r\n (c) Date: June 7, 1997\r\n \r\n 3. Past Usage:\r\n Lim, T.-S., Loh, W.-Y. & Shih, Y.-S. (1999). A Comparison of\r\n Prediction Accuracy, Complexity, and Training Time of Thirty-three\r\n Old and New Classification Algorithms. Machine Learning. Forthcoming.\r\n (ftp:\/\/ftp.stat.wisc.edu\/pub\/loh\/treeprogs\/quest1.7\/mach1317.pdf or\r\n (http:\/\/www.stat.wisc.edu\/~limt\/mach1317.pdf)\r\n \r\n 4. Relevant Information:\r\n This dataset is a subset of the 1987 National Indonesia Contraceptive\r\n Prevalence Survey. The samples are married women who were either not \r\n pregnant or do not know if they were at the time of interview. The \r\n problem is to predict the current contraceptive method choice \r\n (no use, long-term methods, or short-term methods) of a woman based \r\n on her demographic and socio-economic characteristics.\r\n \r\n 5. Number of Instances: 1473\r\n \r\n 6. Number of Attributes: 10 (including the class attribute)\r\n \r\n 7. Attribute Information:\r\n \r\n 1. Wife's age (numerical)\r\n 2. Wife's education (categorical) 1=low, 2, 3, 4=high\r\n 3. Husband's education (categorical) 1=low, 2, 3, 4=high\r\n 4. Number of children ever born (numerical)\r\n 5. Wife's religion (binary) 0=Non-Islam, 1=Islam\r\n 6. Wife's now working? (binary) 0=Yes, 1=No\r\n 7. Husband's occupation (categorical) 1, 2, 3, 4\r\n 8. Standard-of-living index (categorical) 1=low, 2, 3, 4=high\r\n 9. Media exposure (binary) 0=Good, 1=Not good\r\n 10. Contraceptive method used (class attribute) 1=No-use \r\n 2=Long-term\r\n 3=Short-term\r\n \r\n 8. Missing Attribute Values: None\r\n\r\n Information about the dataset\r\n CLASSTYPE: nominal\r\n CLASSINDEX: last", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": null, "contributor": null, "date": "2014-04-06 23:21:03", "update_comment": null, "last_update": "2014-04-06 23:21:03", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/23\/dataset_23_cmc.arff", "default_target_attribute": "Contraceptive_method_used", "row_id_attribute": null, "ignore_attribute": null, "runs": 22723, "suggest": { "input": [ "cmc", "1. Title: Contraceptive Method Choice 2. Sources: (a) Origin: This dataset is a subset of the 1987 National Indonesia Contraceptive Prevalence Survey (b) Creator: Tjen-Sien Lim (limt@stat.wisc.edu) (c) Donor: Tjen-Sien Lim (limt@stat.wisc.edu) (c) Date: June 7, 1997 3. Past Usage: Lim, T.-S., Loh, W.-Y. & Shih, Y.-S. (1999). A Comparison of Prediction Accuracy, Complexity, and Training Time of Thirty-three Old and New Classification Algorithms. Machine Learning. Forthcoming. (ftp:\/\/ftp.stat.wisc " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1473, "NumberOfFeatures": 10, "NumberOfClasses": 3, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 2, "NumberOfSymbolicFeatures": 8, "MinAttributeEntropy": 0.380671663040156, "Quartile2KurtosisOfNumericAtts": 0.2928560302339025, "REPTreeDepth2Kappa": 0.24500740673149984, "ClassEntropy": 1.5390345832497478, "kNN1NKappa": 0.14890873693558304, "MajorityClassSize": 629, "MinKurtosisOfNumericAtts": -0.9438944908638565, "Quartile2MeansOfNumericAtts": 17.899864222674818, "REPTreeDepth3AUC": 0.6719876165083715, "DecisionStumpAUC": 0.5552950487800741, "MaxAttributeEntropy": 1.8667550694041894, "MinMeansOfNumericAtts": 3.2613713509843865, "Quartile2MutualInformation": 0.03047421456026, "REPTreeDepth3ErrRate": 0.4881194840461643, "DecisionStumpErrRate": 0.572980312287848, "MaxKurtosisOfNumericAtts": 1.5296065513316615, "MinMutualInformation": 0.00258233237972, "Quartile2SkewnessOfNumericAtts": 0.6777315757939906, "REPTreeDepth3Kappa": 0.24500740673149984, "DecisionStumpKappa": 0, "MaxMeansOfNumericAtts": 32.53835709436525, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 30, "Quartile2StdDevOfNumericAtts": 5.2928968090790125, "RandomTreeDepth1AUC": 0.6012886776675508, "Dimensionality": 0.006788866259334691, "MaxMutualInformation": 0.07090633894894, "MinSkewnessOfNumericAtts": 0.25644920548189276, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 1.757839343635201, "RandomTreeDepth1ErrRate": 0.5207060420909708, "EquivalentNumberOfAtts": 53.274885238451205, "MaxNominalAttDistinctValues": 4, "MinStdDevOfNumericAtts": 2.3585488626874125, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 1.5296065513316615, "AutoCorrelation": 0.9966032608695652, "RandomTreeDepth1Kappa": 0.19342354382447932, "J48.00001.AUC": 0.6520164081542908, "MaxSkewnessOfNumericAtts": 1.0990139461060884, "MinorityClassPercentage": 22.606924643584524, "PercentageOfNumericFeatures": 20, "Quartile3MeansOfNumericAtts": 32.53835709436525, "CfsSubsetEval_DecisionStumpAUC": 0.6599986009904834, "RandomTreeDepth2AUC": 0.6012886776675508, "J48.00001.ErrRate": 0.5044127630685675, "MaxStdDevOfNumericAtts": 8.227244755470613, "MinorityClassSize": 333, "PercentageOfSymbolicFeatures": 80, "Quartile3MutualInformation": 0.04013859922938, "CfsSubsetEval_DecisionStumpErrRate": 0.4894772572980312, "RandomTreeDepth2ErrRate": 0.5207060420909708, "J48.00001.Kappa": 0.21816403682727648, "MeanAttributeEntropy": 1.2208122969788784, "NaiveBayesAUC": 0.6798006519603141, "Quartile1AttributeEntropy": 0.6082239803272842, "Quartile3SkewnessOfNumericAtts": 1.0990139461060884, "CfsSubsetEval_DecisionStumpKappa": 0.2302758889602379, "RandomTreeDepth2Kappa": 0.19342354382447932, "J48.0001.AUC": 0.6520164081542908, "MeanKurtosisOfNumericAtts": 0.2928560302339025, "NaiveBayesErrRate": 0.506449422946368, "Quartile1KurtosisOfNumericAtts": -0.9438944908638565, "Quartile3StdDevOfNumericAtts": 8.227244755470613, "CfsSubsetEval_NaiveBayesAUC": 0.6599986009904834, "RandomTreeDepth3AUC": 0.6012886776675508, "J48.0001.ErrRate": 0.5044127630685675, "MeanMeansOfNumericAtts": 17.89986422267482, "NaiveBayesKappa": 0.2336054769068532, "Quartile1MeansOfNumericAtts": 3.2613713509843865, "REPTreeDepth1AUC": 0.6719876165083715, "CfsSubsetEval_NaiveBayesErrRate": 0.4894772572980312, "RandomTreeDepth3ErrRate": 0.5207060420909708, "J48.0001.Kappa": 0.21816403682727648, "MeanMutualInformation": 0.028888557457444283, "NumberOfBinaryFeatures": 3, "Quartile1MutualInformation": 0.00982050143438, "REPTreeDepth1ErrRate": 0.4881194840461643, "CfsSubsetEval_NaiveBayesKappa": 0.2302758889602379, "RandomTreeDepth3Kappa": 0.19342354382447932, "J48.001.AUC": 0.6520164081542908, "MeanNoiseToSignalRatio": 41.259372029124556, "Quartile1SkewnessOfNumericAtts": 0.25644920548189276, "REPTreeDepth1Kappa": 0.24500740673149984, "CfsSubsetEval_kNN1NAUC": 0.6599986009904834, "StdvNominalAttDistinctValues": 0.9910312089651149, "J48.001.ErrRate": 0.5044127630685675, "MeanNominalAttDistinctValues": 3.125, "Quartile1StdDevOfNumericAtts": 2.3585488626874125, "REPTreeDepth2AUC": 0.6719876165083715, "CfsSubsetEval_kNN1NErrRate": 0.4894772572980312, "kNN1NAUC": 0.5810647503679196, "J48.001.Kappa": 0.21816403682727648, "MeanSkewnessOfNumericAtts": 0.6777315757939906, "MeanStdDevOfNumericAtts": 5.2928968090790125, "Quartile2AttributeEntropy": 1.4479885111323352, "REPTreeDepth2ErrRate": 0.4881194840461643, "CfsSubsetEval_kNN1NKappa": 0.2302758889602379, "kNN1NErrRate": 0.551255940257977, "MajorityClassPercentage": 42.701968771215206 }, "tags": [ { "tag": "OpenML-CC18", "uploader": "1" }, { "tag": "OpenML100", "uploader": "348" }, { "tag": "study_1", "uploader": "2" }, { "tag": "study_123", "uploader": "3886" }, { "tag": "study_14", "uploader": "64" }, { "tag": "study_34", "uploader": "1" }, { "tag": "study_37", "uploader": "1" }, { "tag": "study_41", "uploader": "1" }, { "tag": "study_50", "uploader": "64" }, { "tag": "study_7", "uploader": "64" }, { "tag": "study_70", "uploader": "1856" }, { "tag": "study_98", "uploader": "1935" }, { "tag": "study_99", "uploader": "1" }, { "tag": "uci", "uploader": "1" } ], "features": [ { "name": "Contraceptive_method_used", "index": "9", "type": "nominal", "distinct": "3", "missing": "0", "target": "1", "distr": [ [ "1", "2", "3" ], [ [ "629", "0", "0" ], [ "0", "333", "0" ], [ "0", "0", "511" ] ] ] }, { "name": "Wifes_age", "index": "0", "type": "numeric", "distinct": "34", "missing": "0", "min": "16", "max": "49", "mean": "33", "stdev": "8" }, { "name": "Wifes_education", "index": "1", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "1", "2", "3", "4" ], [ [ "103", "9", "40" ], [ "176", "37", "121" ], [ "175", "80", "155" ], [ "175", "207", "195" ] ] ] }, { "name": "Husbands_education", "index": "2", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "1", "2", "3", "4" ], [ [ "31", "10", "3" ], [ "99", "16", "63" ], [ "161", "50", "141" ], [ "338", "257", "304" ] ] ] }, { "name": "Number_of_children_ever_born", "index": "3", "type": "numeric", "distinct": "15", "missing": "0", "min": "0", "max": "16", "mean": "3", "stdev": "2" }, { "name": "Wifes_religion", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "75", "76", "69" ], [ "554", "257", "442" ] ] ] }, { "name": "Wifes_now_working%3F", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "170", "89", "110" ], [ "459", "244", "401" ] ] ] }, { "name": "Husbands_occupation", "index": "6", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "1", "2", "3", "4" ], [ [ "158", "156", "122" ], [ "200", "79", "146" ], [ "258", "93", "234" ], [ "13", "5", "9" ] ] ] }, { "name": "Standard-of-living_index", "index": "7", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "1", "2", "3", "4" ], [ [ "80", "9", "40" ], [ "117", "30", "82" ], [ "184", "90", "157" ], [ "248", "204", "232" ] ] ] }, { "name": "Media_exposure", "index": "8", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "555", "323", "486" ], [ "74", "10", "25" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 19, "total_downloads": 21, "reach": 19, "reuse": 1, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 1 }