{ "data_id": "42087", "name": "beer_reviews", "exact_name": "beer_reviews", "version": 5, "version_label": "0.1", "description": "This dataset consists of beer reviews from Beeradvocate. The data span a period of more than 10 years, including all ~1.5 million reviews up to November 2011. Each review includes ratings in terms of five \"aspects\": appearance, aroma, palate, taste, and overall impression. Reviews include product and user information, followed by each of these five ratings, and a plaintext review. We also have reviews from ratebeer.", "format": "arff", "uploader": "Guillaume Lemaitre", "uploader_id": 5332, "visibility": "public", "creator": "\"socialmediadata\"", "contributor": null, "date": "2019-08-14 18:16:31", "update_comment": null, "last_update": "2019-08-14 18:16:31", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/21553084\/dataset", "default_target_attribute": "beer_style", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "beer_reviews", "This dataset consists of beer reviews from Beeradvocate. The data span a period of more than 10 years, including all ~1.5 million reviews up to November 2011. Each review includes ratings in terms of five \"aspects\": appearance, aroma, palate, taste, and overall impression. Reviews include product and user information, followed by each of these five ratings, and a plaintext review. We also have reviews from ratebeer. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1586614, "NumberOfFeatures": 13, "NumberOfClasses": 104, "NumberOfMissingValues": 68148, "NumberOfInstancesWithMissingValues": 68136, "NumberOfNumericFeatures": 9, "NumberOfSymbolicFeatures": 0, "MeanMeansOfNumericAtts": 136012683.20861137, "Quartile1SkewnessOfNumericAtts": -0.9379261805121906, "AutoCorrelation": 1, "MeanMutualInformation": null, "Quartile1StdDevOfNumericAtts": 0.6899175460861239, "ClassEntropy": null, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "Dimensionality": 8.193549281677838e-6, "MeanNominalAttDistinctValues": null, "Quartile2KurtosisOfNumericAtts": 1.3416693061500276, "EquivalentNumberOfAtts": null, "MeanSkewnessOfNumericAtts": -0.11402485555807243, "Quartile2MeansOfNumericAtts": 3.841641697350634, "MajorityClassPercentage": 7.411128352579771, "MeanStdDevOfNumericAtts": 8507964.083362993, "Quartile2MutualInformation": null, "MajorityClassSize": 117586, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": -0.8385305259473593, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -0.8339342225063833, "PercentageOfBinaryFeatures": 0, "Quartile2StdDevOfNumericAtts": 0.7319696098966487, "MaxKurtosisOfNumericAtts": 6.961811545288782, "MinMeansOfNumericAtts": 3.7356360778365207, "PercentageOfInstancesWithMissingValues": 4.294428260433855, "Quartile3AttributeEntropy": null, "MaxMeansOfNumericAtts": 1224089280.0122147, "MinMutualInformation": null, "PercentageOfMissingValues": 0.3303988144661428, "Quartile3KurtosisOfNumericAtts": 2.5736103342990426, "MaxMutualInformation": null, "MinNominalAttDistinctValues": null, "PercentageOfNumericFeatures": 69.23076923076923, "Quartile3MeansOfNumericAtts": 12421.446740364685, "MaxNominalAttDistinctValues": null, "MinSkewnessOfNumericAtts": -1.0239687125007078, "PercentageOfSymbolicFeatures": 0, "Quartile3MutualInformation": null, "MaxSkewnessOfNumericAtts": 2.0837475678168804, "MinStdDevOfNumericAtts": 0.6160927688920823, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 1.1164015398055205, "MaxStdDevOfNumericAtts": 76544274.53923745, "MinorityClassPercentage": 0.015189579822187375, "Quartile1KurtosisOfNumericAtts": 0.4157492272909389, "Quartile3StdDevOfNumericAtts": 13698.219992067268, "MeanAttributeEntropy": null, "MinorityClassSize": 241, "Quartile1MeansOfNumericAtts": 3.7682809114250637, "StdvNominalAttDistinctValues": null, "MeanKurtosisOfNumericAtts": 1.82030022193319, "NumberOfBinaryFeatures": 0, "Quartile1MutualInformation": null }, "tags": [], "features": [ { "name": "beer_style", "index": "7", "type": "string", "distinct": "104", "missing": "0", "target": "1" }, { "name": "brewery_id", "index": "0", "type": "numeric", "distinct": "5840", "missing": "0", "min": "1", "max": "28003", "mean": "3130", "stdev": "5578" }, { "name": "brewery_name", "index": "1", "type": "string", "distinct": "5742", "missing": "15" }, { "name": "review_time", "index": "2", "type": "numeric", "distinct": "1577960", "missing": "0", "min": "840672001", "max": "1326285348", "mean": "1224089280", "stdev": "76544275" }, { "name": "review_overall", "index": "3", "type": "numeric", "distinct": "10", "missing": "0", "min": "0", "max": "5", "mean": "4", "stdev": "1" }, { "name": "review_aroma", "index": "4", "type": "numeric", "distinct": "9", "missing": "0", "min": "1", "max": "5", "mean": "4", "stdev": "1" }, { "name": "review_appearance", "index": "5", "type": "numeric", "distinct": "10", "missing": "0", "min": "0", "max": "5", "mean": "4", "stdev": "1" }, { "name": "review_profilename", "index": "6", "type": "string", "distinct": "33387", "missing": "348" }, { "name": "review_palate", "index": "8", "type": "numeric", "distinct": "9", "missing": "0", "min": "1", "max": "5", "mean": "4", "stdev": "1" }, { "name": "review_taste", "index": "9", "type": "numeric", "distinct": "9", "missing": "0", "min": "1", "max": "5", "mean": "4", "stdev": "1" }, { "name": "beer_name", "index": "10", "type": "string", "distinct": "56857", "missing": "0" }, { "name": "beer_abv", "index": "11", "type": "numeric", "distinct": "530", "missing": "67785", "min": "0", "max": "58", "mean": "7", "stdev": "2" }, { "name": "beer_beerid", "index": "12", "type": "numeric", "distinct": "66055", "missing": "0", "min": "3", "max": "77317", "mean": "21713", "stdev": "21818" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 8, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 8 }