{ "data_id": "3", "name": "letter", "exact_name": "letter", "version": 1, "version_label": "1", "description": "**Author**: David J. Slate \r\n**Source**: [UCI](https:\/\/archive.ics.uci.edu\/ml\/datasets\/Letter+Recognition) - 01-01-1991 \r\n**Please cite**: P. W. Frey and D. J. Slate. \"Letter Recognition Using Holland-style Adaptive Classifiers\". Machine Learning 6(2), 1991 \r\n\r\n1. TITLE: \r\n Letter Image Recognition Data \r\n \r\n The objective is to identify each of a large number of black-and-white\r\n rectangular pixel displays as one of the 26 capital letters in the English\r\n alphabet. The character images were based on 20 different fonts and each\r\n letter within these 20 fonts was randomly distorted to produce a file of\r\n 20,000 unique stimuli. Each stimulus was converted into 16 primitive\r\n numerical attributes (statistical moments and edge counts) which were then\r\n scaled to fit into a range of integer values from 0 through 15. We\r\n typically train on the first 16000 items and then use the resulting model\r\n to predict the letter category for the remaining 4000. See the article\r\n cited above for more details.", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": null, "contributor": null, "date": "2014-04-06 23:19:41", "update_comment": null, "last_update": "2014-04-06 23:19:41", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/6\/dataset_6_letter.arff", "default_target_attribute": "class", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "letter", "1. TITLE: Letter Image Recognition Data The objective is to identify each of a large number of black-and-white rectangular pixel displays as one of the 26 capital letters in the English alphabet. The character images were based on 20 different fonts and each letter within these 20 fonts was randomly distorted to produce a file of 20,000 unique stimuli. Each stimulus was converted into 16 primitive numerical attributes (statistical moments and edge counts) which were then scaled to fit into a ran " ], "weight": 5 }, "qualities": { "NumberOfInstances": 20000, "NumberOfFeatures": 17, "NumberOfClasses": 26, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 16, "NumberOfSymbolicFeatures": 1, "AutoCorrelation": 0.04090204510225511, "CfsSubsetEval_DecisionStumpAUC": 0.9425298055650914, "CfsSubsetEval_DecisionStumpErrRate": 0.15215, "CfsSubsetEval_DecisionStumpKappa": 0.841756863867533, "CfsSubsetEval_NaiveBayesAUC": 0.9425298055650914, "CfsSubsetEval_NaiveBayesErrRate": 0.15215, "CfsSubsetEval_NaiveBayesKappa": 0.841756863867533, "CfsSubsetEval_kNN1NAUC": 0.9425298055650914, "CfsSubsetEval_kNN1NErrRate": 0.15215, "CfsSubsetEval_kNN1NKappa": 0.841756863867533, "ClassEntropy": 4.69981072657316, "DecisionStumpAUC": 0.6574545268026781, "DecisionStumpErrRate": 0.9293, "DecisionStumpKappa": 0.03276976655404448, "Dimensionality": 0.00085, "EquivalentNumberOfAtts": null, "J48.00001.AUC": 0.9379676053125593, "J48.00001.ErrRate": 0.15865, "J48.00001.Kappa": 0.8349979241615618, "J48.0001.AUC": 0.9379676053125593, "J48.0001.ErrRate": 0.15865, "J48.0001.Kappa": 0.8349979241615618, "J48.001.AUC": 0.9379676053125593, "J48.001.ErrRate": 0.15865, "J48.001.Kappa": 0.8349979241615618, "MajorityClassPercentage": 4.0649999999999995, "MajorityClassSize": 813, "MaxAttributeEntropy": null, "MaxKurtosisOfNumericAtts": 2.075245046157538, "MaxMeansOfNumericAtts": 8.338849999999995, "MaxMutualInformation": null, "MaxNominalAttDistinctValues": 26, "MaxSkewnessOfNumericAtts": 1.1599750154235924, "MaxStdDevOfNumericAtts": 3.304555303560269, "MeanAttributeEntropy": null, "MeanKurtosisOfNumericAtts": 0.6977379005298701, "MeanMeansOfNumericAtts": 5.925465624999998, "MeanMutualInformation": null, "MeanNoiseToSignalRatio": null, "MeanNominalAttDistinctValues": 26, "MeanSkewnessOfNumericAtts": 0.29029703410184804, "MeanStdDevOfNumericAtts": 2.273771145446362, "MinAttributeEntropy": null, "MinKurtosisOfNumericAtts": -0.4211788221168451, "MinMeansOfNumericAtts": 3.046099999999995, "MinMutualInformation": null, "MinNominalAttDistinctValues": 26, "MinSkewnessOfNumericAtts": -0.31007906987268463, "MinStdDevOfNumericAtts": 1.5467224363199539, "MinorityClassPercentage": 3.6700000000000004, "MinorityClassSize": 734, "NaiveBayesAUC": 0.9559207236903551, "NaiveBayesErrRate": 0.36025, "NaiveBayesKappa": 0.6253250509940796, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "PercentageOfMissingValues": 0, "PercentageOfNumericFeatures": 94.11764705882352, "PercentageOfSymbolicFeatures": 5.88235294117647, "Quartile1AttributeEntropy": null, "Quartile1KurtosisOfNumericAtts": 0.3091324958538607, "Quartile1MeansOfNumericAtts": 4.174812499999999, "Quartile1MutualInformation": null, "Quartile1SkewnessOfNumericAtts": -0.13733042812365298, "Quartile1StdDevOfNumericAtts": 2.017438812826727, "Quartile2AttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 0.8853044390128566, "Quartile2MeansOfNumericAtts": 5.913225000000001, "Quartile2MutualInformation": null, "Quartile2SkewnessOfNumericAtts": 0.2543345879398813, "Quartile2StdDevOfNumericAtts": 2.2933721022270195, "Quartile3AttributeEntropy": null, "Quartile3KurtosisOfNumericAtts": 1.1728389823381402, "Quartile3MeansOfNumericAtts": 7.7260124999999995, "Quartile3MutualInformation": null, "Quartile3SkewnessOfNumericAtts": 0.653378002627639, "Quartile3StdDevOfNumericAtts": 2.5474231354919117, "REPTreeDepth1AUC": 0.9544303249787935, "REPTreeDepth1ErrRate": 0.20315, "REPTreeDepth1Kappa": 0.7887152321892192, "REPTreeDepth2AUC": 0.9544303249787935, "REPTreeDepth2ErrRate": 0.20315, "REPTreeDepth2Kappa": 0.7887152321892192, "REPTreeDepth3AUC": 0.9544303249787935, "REPTreeDepth3ErrRate": 0.20315, "REPTreeDepth3Kappa": 0.7887152321892192, "RandomTreeDepth1AUC": 0.9080139521161272, "RandomTreeDepth1ErrRate": 0.1769, "RandomTreeDepth1Kappa": 0.816017080292, "RandomTreeDepth2AUC": 0.9080139521161272, "RandomTreeDepth2ErrRate": 0.1769, "RandomTreeDepth2Kappa": 0.816017080292, "RandomTreeDepth3AUC": 0.9080139521161272, "RandomTreeDepth3ErrRate": 0.1769, "RandomTreeDepth3Kappa": 0.816017080292, "StdvNominalAttDistinctValues": 0, "kNN1NAUC": 0.9731018928391187, "kNN1NErrRate": 0.05785, "kNN1NKappa": 0.939833878217649 }, "tags": [ { "tag": "study_14", "uploader": "1" }, { "tag": "study_1", "uploader": "0" }, { "tag": "study_195", "uploader": "0" }, { "tag": "study_173", "uploader": "0" }, { "tag": "study_346", "uploader": "0" }, { "tag": "study_334", "uploader": "0" } ], "features": [ { "name": "class", "index": "16", "type": "nominal", "distinct": "26", "missing": "0", "target": "1", "distr": [ [ "A", "B", "C", "D", "E", "F", "G", "H", "I", "J", "K", "L", "M", "N", "O", "P", "Q", "R", "S", "T", "U", "V", "W", "X", "Y", "Z" ], [ [ "789", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "766", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "736", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "805", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "768", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "775", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "773", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "734", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "755", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "747", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "739", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "761", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "792", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "783", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "753", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "803", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "783", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "758", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "748", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "796", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "813", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "764", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "752", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "787", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "786", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "0", "734" ] ] ] }, { "name": "y2bar", "index": "8", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "5", "stdev": "2" }, { "name": "yegvx", "index": "15", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "8", "stdev": "2" }, { "name": "y-ege", "index": "14", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "4", "stdev": "3" }, { "name": "xegvy", "index": "13", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "8", "stdev": "2" }, { "name": "x-ege", "index": "12", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "3", "stdev": "2" }, { "name": "xy2br", "index": "11", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "8", "stdev": "2" }, { "name": "x2ybr", "index": "10", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "6", "stdev": "3" }, { "name": "xybar", "index": "9", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "8", "stdev": "2" }, { "name": "x-box", "index": "0", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "4", "stdev": "2" }, { "name": "x2bar", "index": "7", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "5", "stdev": "3" }, { "name": "y-bar", "index": "6", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "8", "stdev": "2" }, { "name": "x-bar", "index": "5", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "7", "stdev": "2" }, { "name": "onpix", "index": "4", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "4", "stdev": "2" }, { "name": "high", "index": "3", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "5", "stdev": "2" }, { "name": "width", "index": "2", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "5", "stdev": "2" }, { "name": "y-box", "index": "1", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "7", "stdev": "3" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }