{ "data_id": "1003", "name": "primary-tumor", "exact_name": "primary-tumor", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun.", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 22:44:55", "update_comment": null, "last_update": "2014-10-04 22:44:55", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53537\/primary-tumor.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 752, "suggest": { "input": [ "primary-tumor", "Binarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 339, "NumberOfFeatures": 18, "NumberOfClasses": 2, "NumberOfMissingValues": 225, "NumberOfInstancesWithMissingValues": 207, "NumberOfNumericFeatures": 0, "NumberOfSymbolicFeatures": 18, "kNN1NErrRate": 0.1887905604719764, "MajorityClassPercentage": 75.22123893805309, "MeanStdDevOfNumericAtts": null, "Quartile2AttributeEntropy": 0.8434470496889677, "REPTreeDepth2ErrRate": 0.19469026548672566, "CfsSubsetEval_kNN1NKappa": 0.3347653142402547, "kNN1NKappa": 0.4543534027463407, "MajorityClassSize": 255, "MinAttributeEntropy": 0.14506896855940504, "Quartile2KurtosisOfNumericAtts": null, "REPTreeDepth2Kappa": 0.41725269573370855, "ClassEntropy": 0.8077527023327316, "MaxAttributeEntropy": 1.2337942126841774, "MinKurtosisOfNumericAtts": null, "Quartile2MeansOfNumericAtts": null, "REPTreeDepth3AUC": 0.7811157796451914, "DecisionStumpAUC": 0.717203548085901, "DecisionStumpErrRate": 0.2536873156342183, "MaxKurtosisOfNumericAtts": null, "MinMeansOfNumericAtts": null, "Quartile2MutualInformation": 0.01515423696897, "REPTreeDepth3ErrRate": 0.19469026548672566, "DecisionStumpKappa": 0.38345387641162276, "MaxMeansOfNumericAtts": null, "MinMutualInformation": 0.00060704494722, "Quartile2SkewnessOfNumericAtts": null, "REPTreeDepth3Kappa": 0.41725269573370855, "Dimensionality": 0.05309734513274336, "MaxMutualInformation": 0.17643399591969, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 83.33333333333334, "Quartile2StdDevOfNumericAtts": null, "RandomTreeDepth1AUC": 0.7556187666807136, "EquivalentNumberOfAtts": 22.563961877340635, "MaxNominalAttDistinctValues": 3, "MinSkewnessOfNumericAtts": null, "PercentageOfInstancesWithMissingValues": 61.06194690265486, "Quartile3AttributeEntropy": 0.9613350601400221, "RandomTreeDepth1ErrRate": 0.22123893805309736, "RandomTreeDepth1Kappa": 0.38439747221616916, "J48.00001.AUC": 0.786624649859944, "MaxSkewnessOfNumericAtts": null, "MinStdDevOfNumericAtts": null, "PercentageOfMissingValues": 3.687315634218289, "Quartile3KurtosisOfNumericAtts": null, "AutoCorrelation": 0.6124260355029586, "RandomTreeDepth2AUC": 0.7556187666807136, "J48.00001.ErrRate": 0.2153392330383481, "MaxStdDevOfNumericAtts": null, "MinorityClassPercentage": 24.778761061946902, "PercentageOfNumericFeatures": 0, "Quartile3MeansOfNumericAtts": null, "CfsSubsetEval_DecisionStumpAUC": 0.7508169934640523, "RandomTreeDepth2ErrRate": 0.22123893805309736, "J48.00001.Kappa": 0.32853072853072834, "MeanAttributeEntropy": 0.7611060837128614, "MinorityClassSize": 84, "PercentageOfSymbolicFeatures": 100, "Quartile3MutualInformation": 0.029905266185039997, "CfsSubsetEval_DecisionStumpErrRate": 0.2182890855457227, "RandomTreeDepth2Kappa": 0.38439747221616916, "J48.0001.AUC": 0.786624649859944, "MeanKurtosisOfNumericAtts": null, "NaiveBayesAUC": 0.8547267874701502, "Quartile1AttributeEntropy": 0.513400796066442, "Quartile3SkewnessOfNumericAtts": null, "CfsSubsetEval_DecisionStumpKappa": 0.3347653142402547, "RandomTreeDepth3AUC": 0.7556187666807136, "J48.0001.ErrRate": 0.2153392330383481, "MeanMeansOfNumericAtts": null, "NaiveBayesErrRate": 0.18289085545722714, "Quartile1KurtosisOfNumericAtts": null, "Quartile3StdDevOfNumericAtts": null, "CfsSubsetEval_NaiveBayesAUC": 0.7508169934640523, "RandomTreeDepth3ErrRate": 0.22123893805309736, "J48.0001.Kappa": 0.32853072853072834, "MeanMutualInformation": 0.03579835432818647, "NaiveBayesKappa": 0.4803441625871532, "Quartile1MeansOfNumericAtts": null, "REPTreeDepth1AUC": 0.7811157796451914, "CfsSubsetEval_NaiveBayesErrRate": 0.2182890855457227, "RandomTreeDepth3Kappa": 0.38439747221616916, "J48.001.AUC": 0.786624649859944, "MeanNoiseToSignalRatio": 20.26092380491332, "NumberOfBinaryFeatures": 15, "Quartile1MutualInformation": 0.003641247931365, "REPTreeDepth1ErrRate": 0.19469026548672566, "CfsSubsetEval_NaiveBayesKappa": 0.3347653142402547, "StdvNominalAttDistinctValues": 0.38348249442368515, "J48.001.ErrRate": 0.2153392330383481, "MeanNominalAttDistinctValues": 2.1666666666666665, "Quartile1SkewnessOfNumericAtts": null, "REPTreeDepth1Kappa": 0.41725269573370855, "CfsSubsetEval_kNN1NAUC": 0.7508169934640523, "kNN1NAUC": 0.7877917833800187, "J48.001.Kappa": 0.32853072853072834, "MeanSkewnessOfNumericAtts": null, "Quartile1StdDevOfNumericAtts": null, "REPTreeDepth2AUC": 0.7811157796451914, "CfsSubsetEval_kNN1NErrRate": 0.2182890855457227 }, "tags": [ { "tag": "mythbusting_1", "uploader": "1" }, { "tag": "study_1", "uploader": "2" }, { "tag": "study_144", "uploader": "5824" }, { "tag": "study_15", "uploader": "939" }, { "tag": "study_20", "uploader": "939" }, { "tag": "study_41", "uploader": "1" } ], "features": [ { "name": "binaryClass", "index": "17", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "84", "0" ], [ "0", "255" ] ] ] }, { "name": "age", "index": "0", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "<30", "30-59", ">=60" ], [ [ "6", "17" ], [ "57", "152" ], [ "21", "86" ] ] ] }, { "name": "sex", "index": "1", "type": "nominal", "distinct": "2", "missing": "1", "distr": [ [ "male", "female" ], [ [ "55", "106" ], [ "29", "148" ] ] ] }, { "name": "histologic-type", "index": "2", "type": "nominal", "distinct": "3", "missing": "67", "distr": [ [ "epidermoid", "adeno", "anaplastic" ], [ [ "20", "24" ], [ "20", "200" ], [ "6", "2" ] ] ] }, { "name": "degree-of-diffe", "index": "3", "type": "nominal", "distinct": "3", "missing": "155", "distr": [ [ "well", "fairly", "poorly" ], [ [ "5", "52" ], [ "3", "24" ], [ "55", "45" ] ] ] }, { "name": "bone", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "33", "61" ], [ "51", "194" ] ] ] }, { "name": "bone-marrow", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "3", "4" ], [ "81", "251" ] ] ] }, { "name": "lung", "index": "6", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "16", "59" ], [ "68", "196" ] ] ] }, { "name": "pleura", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "24", "51" ], [ "60", "204" ] ] ] }, { "name": "peritoneum", "index": "8", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "14", "81" ], [ "70", "174" ] ] ] }, { "name": "liver", "index": "9", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "29", "80" ], [ "55", "175" ] ] ] }, { "name": "brain", "index": "10", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "13", "8" ], [ "71", "247" ] ] ] }, { "name": "skin", "index": "11", "type": "nominal", "distinct": "2", "missing": "1", "distr": [ [ "yes", "no" ], [ [ "10", "10" ], [ "73", "245" ] ] ] }, { "name": "neck", "index": "12", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "6", "38" ], [ "78", "217" ] ] ] }, { "name": "supraclavicular", "index": "13", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "24", "37" ], [ "60", "218" ] ] ] }, { "name": "axillar", "index": "14", "type": "nominal", "distinct": "2", "missing": "1", "distr": [ [ "yes", "no" ], [ [ "5", "28" ], [ "78", "227" ] ] ] }, { "name": "mediastinum", "index": "15", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "52", "40" ], [ "32", "215" ] ] ] }, { "name": "abdominal", "index": "16", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "yes", "no" ], [ [ "21", "94" ], [ "63", "161" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 7, "total_downloads": 9, "reach": 7, "reuse": 15, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 15 }