{ "data_id": "186", "name": "braziltourism", "exact_name": "braziltourism", "version": 1, "version_label": "1", "description": "**Author**: \n**Source**: Unknown - \n**Please cite**: \n\nanalcatdata A collection of data sets used in the book \"Analyzing Categorical Data,\"\n by Jeffrey S. Simonoff, Springer-Verlag, New York, 2003. The submission\n consists of a zip file containing two versions of each of 84 data sets, \n plus this README file. Each data set is given in comma-delimited ASCII\n (.csv) form, and Microsoft Excel (.xls) form.\n \n NOTICE: These data sets may be used freely for scientific, educational and\/or\n noncommercial purposes, provided suitable acknowledgment is given (by citing\n the above-named reference).\n \n Further details concerning the book, including information on statistical software\n (including sample S-PLUS\/R and SAS code), are available at the web site\n \n http:\/\/www.stern.nyu.edu\/~jsimonof\/AnalCatData\n\n\n Information about the dataset\n CLASSTYPE: nominal\n CLASSINDEX: last\n\n\n Note: Quotes, Single-Quotes and Backslashes were removed, Blanks replaced\n with Underscores", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": null, "contributor": null, "date": "2014-04-23 13:15:19", "update_comment": null, "last_update": "2014-04-23 13:15:19", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/3623\/dataset_190_braziltourism.arff", "default_target_attribute": "Trips", "row_id_attribute": null, "ignore_attribute": null, "runs": 1187, "suggest": { "input": [ "braziltourism", "analcatdata A collection of data sets used in the book \"Analyzing Categorical Data,\" by Jeffrey S. Simonoff, Springer-Verlag, New York, 2003. The submission consists of a zip file containing two versions of each of 84 data sets, plus this README file. Each data set is given in comma-delimited ASCII (.csv) form, and Microsoft Excel (.xls) form. NOTICE: These data sets may be used freely for scientific, educational and\/or noncommercial purposes, provided suitable acknowledgment is given (by citing " ], "weight": 5 }, "qualities": { "NumberOfInstances": 412, "NumberOfFeatures": 9, "NumberOfClasses": 7, "NumberOfMissingValues": 96, "NumberOfInstancesWithMissingValues": 49, "NumberOfNumericFeatures": 4, "NumberOfSymbolicFeatures": 5, "RandomTreeDepth2AUC": 0.5787870024875118, "J48.00001.ErrRate": 0.23786407766990292, "MaxStdDevOfNumericAtts": 768.3533035545145, "MinorityClassPercentage": 0.24271844660194172, "PercentageOfNumericFeatures": 44.44444444444444, "Quartile3MeansOfNumericAtts": 805.5389965699358, "CfsSubsetEval_DecisionStumpAUC": 0.4939889493738608, "RandomTreeDepth2ErrRate": 0.3106796116504854, "J48.00001.Kappa": -0.009450472523626028, "MeanAttributeEntropy": 1.3623378732357254, "MinorityClassSize": 1, "PercentageOfSymbolicFeatures": 55.55555555555556, "Quartile3MutualInformation": 0.152310460965645, "CfsSubsetEval_DecisionStumpErrRate": 0.23786407766990292, "CfsSubsetEval_DecisionStumpKappa": -0.00638085742771669, "RandomTreeDepth2Kappa": 0.1096103194435066, "J48.0001.AUC": 0.49387152483222335, "MeanKurtosisOfNumericAtts": 5.3216035800178325, "NaiveBayesAUC": 0.6653409358008442, "Quartile1AttributeEntropy": 0.7554329776007629, "Quartile3SkewnessOfNumericAtts": 2.748213626908119, "CfsSubsetEval_NaiveBayesAUC": 0.4939889493738608, "RandomTreeDepth3AUC": 0.5787870024875118, "J48.0001.ErrRate": 0.23786407766990292, "MeanMeansOfNumericAtts": 297.92990192920877, "NaiveBayesErrRate": 0.25, "Quartile1KurtosisOfNumericAtts": 0.30208384755402196, "Quartile3StdDevOfNumericAtts": 608.4038763190106, "CfsSubsetEval_NaiveBayesErrRate": 0.23786407766990292, "RandomTreeDepth3ErrRate": 0.3106796116504854, "J48.0001.Kappa": -0.009450472523626028, "MeanMutualInformation": 0.0799785589404025, "NaiveBayesKappa": 0.1872989122108166, "Quartile1MeansOfNumericAtts": 13.54691774867512, "REPTreeDepth1AUC": 0.5493586311004337, "CfsSubsetEval_NaiveBayesKappa": -0.00638085742771669, "RandomTreeDepth3Kappa": 0.1096103194435066, "J48.001.AUC": 0.49387152483222335, "MeanNoiseToSignalRatio": 16.03378869642921, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": 0.0220989881077225, "REPTreeDepth1ErrRate": 0.22572815533980584, "REPTreeDepth1Kappa": 0.040564903846153605, "CfsSubsetEval_kNN1NAUC": 0.4939889493738608, "StdvNominalAttDistinctValues": 2.280350850198276, "J48.001.ErrRate": 0.23786407766990292, "MeanNominalAttDistinctValues": 4.8, "Quartile1SkewnessOfNumericAtts": -0.5996384034760389, "REPTreeDepth2AUC": 0.5493586311004337, "CfsSubsetEval_kNN1NErrRate": 0.23786407766990292, "kNN1NAUC": 0.5760132142381226, "J48.001.Kappa": -0.009450472523626028, "MeanSkewnessOfNumericAtts": 1.114696467308079, "Quartile1StdDevOfNumericAtts": 3.6904257741965822, "REPTreeDepth2ErrRate": 0.22572815533980584, "CfsSubsetEval_kNN1NKappa": -0.00638085742771669, "kNN1NErrRate": 0.3325242718446602, "MajorityClassPercentage": 77.18446601941747, "MeanStdDevOfNumericAtts": 227.4785941226492, "Quartile2AttributeEntropy": 1.410904985959859, "REPTreeDepth2Kappa": 0.040564903846153605, "ClassEntropy": 1.1120878105833272, "kNN1NKappa": 0.11143995088393184, "MajorityClassSize": 318, "MinAttributeEntropy": 0.6684725699243226, "Quartile2KurtosisOfNumericAtts": 4.3380979199683285, "REPTreeDepth3AUC": 0.5493586311004337, "DecisionStumpAUC": 0.4987785111769919, "MaxAttributeEntropy": 1.9590689510988615, "MinKurtosisOfNumericAtts": -0.28405843705687284, "Quartile2MeansOfNumericAtts": 74.7037914690153, "REPTreeDepth3ErrRate": 0.22572815533980584, "DecisionStumpErrRate": 0.2354368932038835, "MaxKurtosisOfNumericAtts": 12.894276917191545, "MinMeansOfNumericAtts": 6.637577273983696, "Quartile2MutualInformation": 0.06552622774784, "REPTreeDepth3Kappa": 0.040564903846153605, "DecisionStumpKappa": 0.03014124156676203, "MaxMeansOfNumericAtts": 1035.6744475048206, "MinMutualInformation": 0.02174137745695, "Quartile2SkewnessOfNumericAtts": 1.1955141784921572, "RandomTreeDepth1AUC": 0.5787870024875118, "Dimensionality": 0.021844660194174758, "MaxMutualInformation": 0.16712040280898, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 11.11111111111111, "Quartile2StdDevOfNumericAtts": 70.34148027474038, "RandomTreeDepth1ErrRate": 0.3106796116504854, "EquivalentNumberOfAtts": 13.904824309375467, "MaxNominalAttDistinctValues": 7, "MinSkewnessOfNumericAtts": -1.0028541032944818, "PercentageOfInstancesWithMissingValues": 11.893203883495145, "Quartile3AttributeEntropy": 1.9206756561465546, "RandomTreeDepth1Kappa": 0.1096103194435066, "J48.00001.AUC": 0.49387152483222335, "MaxSkewnessOfNumericAtts": 3.0706116155424836, "MinStdDevOfNumericAtts": 0.8781123866015731, "PercentageOfMissingValues": 2.5889967637540456, "Quartile3KurtosisOfNumericAtts": 11.324628972531146, "AutoCorrelation": 0.9854014598540146 }, "tags": [ { "tag": "study_1", "uploader": "2" }, { "tag": "study_41", "uploader": "1" } ], "features": [ { "name": "Trips", "index": "8", "type": "nominal", "distinct": "7", "missing": "0", "target": "1", "distr": [ [ "0", "1", "2", "3", "4", "5", "7" ], [ [ "318", "0", "0", "0", "0", "0", "0" ], [ "0", "64", "0", "0", "0", "0", "0" ], [ "0", "0", "16", "0", "0", "0", "0" ], [ "0", "0", "0", "7", "0", "0", "0" ], [ "0", "0", "0", "0", "3", "0", "0" ], [ "0", "0", "0", "0", "0", "3", "0" ], [ "0", "0", "0", "0", "0", "0", "1" ] ] ] }, { "name": "Age", "index": "0", "type": "numeric", "distinct": "53", "missing": "1", "min": "13", "max": "69", "mean": "34", "stdev": "12" }, { "name": "Sex", "index": "1", "type": "nominal", "distinct": "3", "missing": "1", "distr": [ [ "0", "1", "4" ], [ [ "162", "41", "8", "6", "2", "3", "1" ], [ "154", "23", "8", "1", "1", "0", "0" ], [ "1", "0", "0", "0", "0", "0", "0" ] ] ] }, { "name": "Income", "index": "2", "type": "numeric", "distinct": "101", "missing": "44", "min": "7", "max": "6250", "mean": "1036", "stdev": "768" }, { "name": "Travel_cost", "index": "3", "type": "numeric", "distinct": "45", "missing": "3", "min": "21", "max": "1006", "mean": "115", "stdev": "129" }, { "name": "Access_road", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "255", "55", "16", "7", "3", "3", "1" ], [ "63", "9", "0", "0", "0", "0", "0" ] ] ] }, { "name": "Active", "index": "5", "type": "nominal", "distinct": "7", "missing": "2", "distr": [ [ "0", "1", "2", "3", "4", "5", "6" ], [ [ "164", "20", "2", "1", "1", "1", "1" ], [ "73", "13", "2", "2", "1", "0", "0" ], [ "61", "22", "2", "0", "0", "1", "0" ], [ "17", "7", "3", "0", "0", "0", "0" ], [ "0", "2", "4", "2", "1", "0", "0" ], [ "1", "0", "2", "2", "0", "0", "0" ], [ "1", "0", "0", "0", "0", "1", "0" ] ] ] }, { "name": "Passive", "index": "6", "type": "nominal", "distinct": "5", "missing": "1", "distr": [ [ "0", "1", "2", "3", "4" ], [ [ "155", "23", "0", "4", "2", "1", "1" ], [ "90", "23", "1", "0", "0", "2", "0" ], [ "55", "11", "10", "1", "0", "0", "0" ], [ "16", "6", "5", "1", "1", "0", "0" ], [ "1", "1", "0", "1", "0", "0", "0" ] ] ] }, { "name": "Logged_income", "index": "7", "type": "numeric", "distinct": "101", "missing": "44", "min": "2", "max": "9", "mean": "7", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 1, "nr_of_downloads": 10, "total_downloads": 13, "reach": 11, "reuse": 1, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 1 }