{ "data_id": "98", "name": "LED-display-domain-7digit", "exact_name": "LED-display-domain-7digit", "version": 1, "version_label": "1", "description": "1. Title of Database: LED display domain\n\n2. Sources:\n (a) Breiman,L., Friedman,J.H., Olshen,R.A., & Stone,C.J. (1984). \n Classification and Regression Trees. Wadsworth International\n Group: Belmont, California. (see pages 43-49).\n (b) Donor: David Aha \n (c) Date: 11\/10\/1988\n\n3. Past Usage: (many)\n 1. CART book (above):\n -- Optimal Bayes classification rate: 74%\n -- CART decision tree algorithm: 71% (resubstitution estimate)\n -- Nearest Neighbor Algorithm: 71%\n -- 200 training and 5000 test instances\n \n 2. Quinlan,J.R. (1987). Simplifying Decision Trees. In International\n Journal of Man-Machine Studies (to appear).\n -- C4 decision tree algorithm: 72.6% (using pessimistic pruning)\n -- 2000 training and 500 test instances\n 3. Tan,M. & Eshelman,L. (1988). Using Weighted Networks to Represent\n Classification Knowledge in Noisy Domains. In Proceedings of the\n 5th International Conference on Machine Learning, 121-134, Ann\n Arbor, Michigan: Morgan Kaufmann. \n -- IWN system: 73.3% (using the And-OR classification algorithm)\n -- 400 training and 500 test cases\n\n4. Relevant Information Paragraph:\n This simple domain contains 7 Boolean attributes and 10 concepts,\n the set of decimal digits. Recall that LED displays contain 7\n light-emitting diodes -- hence the reason for 7 attributes. The\n problem would be easy if not for the introduction of noise. In\n this case, each attribute value has the 10% probability of having\n its value inverted. \n\n It's valuable to know the optimal Bayes rate for these databases.\n In this case, the misclassification rate is 26% (74% classification\n accuracy).\n \n5. Number of Instances: 500. But in the original URL you can find a C script and run it choosing the number of instances to be generated.\n\n6. Number of Attributes: 7 (all Boolean-valued)\n\n7. Attribute Information:\n -- All attribute values are either 0 or 1, according to whether\n the corresponding light is on or not for the decimal digit.\n -- Each attribute (excluding the class attribute, which is an\n integer ranging between 0 and 9 inclusive) has a 10% percent\n chance of being inverted.\n\n8. Missing Attribute Values: None\n\n9. Class Distribution: 10% (Theoretical)\n -- Each concept (digit) has the same theoretical probability\n distribution. The program randomly selects the attribute.", "format": "ARFF", "uploader": "Rafael Gomes Mantovani", "uploader_id": 64, "visibility": "public", "creator": null, "contributor": null, "date": "2016-07-29 20:36:10", "update_comment": null, "last_update": "2016-07-29 20:36:10", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/4535757\/phpSj3fWL", "default_target_attribute": "Class", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "LED-display-domain-7digit", "1. Title of Database: LED display domain 2. Sources: (a) Breiman,L., Friedman,J.H., Olshen,R.A., & Stone,C.J. (1984). Classification and Regression Trees. Wadsworth International Group: Belmont, California. (see pages 43-49). (b) Donor: David Aha (c) Date: 11\/10\/1988 3. Past Usage: (many) 1. CART book (above): -- Optimal Bayes classification rate: 74% -- CART decision tree algorithm: 71% (resubstitution estimate) -- Nearest Neighbor Algorithm: 71% -- 200 training and 5000 test instances 2. Q " ], "weight": 5 }, "qualities": { "NumberOfInstances": 500, "NumberOfFeatures": 8, "NumberOfClasses": 10, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 1, "AutoCorrelation": 0.7214428857715431, "CfsSubsetEval_DecisionStumpAUC": 0.8868692509275039, "CfsSubsetEval_DecisionStumpErrRate": 0.312, "CfsSubsetEval_DecisionStumpKappa": 0.6530218240375804, "CfsSubsetEval_NaiveBayesAUC": 0.8868692509275039, "CfsSubsetEval_NaiveBayesErrRate": 0.312, "CfsSubsetEval_NaiveBayesKappa": 0.6530218240375804, "CfsSubsetEval_kNN1NAUC": 0.8868692509275039, "CfsSubsetEval_kNN1NErrRate": 0.312, "CfsSubsetEval_kNN1NKappa": 0.6530218240375804, "ClassEntropy": 3.312307702487186, "DecisionStumpAUC": 0.7091836507594189, "DecisionStumpErrRate": 0.798, "DecisionStumpKappa": 0.10169125195871834, "Dimensionality": 0.016, "EquivalentNumberOfAtts": null, "J48.00001.AUC": 0.8868692509275039, "J48.00001.ErrRate": 0.312, "J48.00001.Kappa": 0.6530218240375804, "J48.0001.AUC": 0.8868692509275039, "J48.0001.ErrRate": 0.312, "J48.0001.Kappa": 0.6530218240375804, "J48.001.AUC": 0.8868692509275039, "J48.001.ErrRate": 0.312, "J48.001.Kappa": 0.6530218240375804, "MajorityClassPercentage": 11.4, "MajorityClassSize": 57, "MaxAttributeEntropy": null, "MaxKurtosisOfNumericAtts": 0.7363180226323118, "MaxMeansOfNumericAtts": 0.818, "MaxMutualInformation": null, "MaxNominalAttDistinctValues": 10, "MaxSkewnessOfNumericAtts": 0.4265826667894626, "MaxStdDevOfNumericAtts": 0.492325877381108, "MeanAttributeEntropy": null, "MeanKurtosisOfNumericAtts": -1.1173581845410985, "MeanMeansOfNumericAtts": 0.6565714285714286, "MeanMutualInformation": null, "MeanNoiseToSignalRatio": null, "MeanNominalAttDistinctValues": 10, "MeanSkewnessOfNumericAtts": -0.7264117116188794, "MeanStdDevOfNumericAtts": 0.45729419529310666, "MinAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.872759540452944, "MinMeansOfNumericAtts": 0.3960000000000001, "MinMutualInformation": null, "MinNominalAttDistinctValues": 10, "MinSkewnessOfNumericAtts": -1.6532963313105244, "MinStdDevOfNumericAtts": 0.386230952536685, "MinorityClassPercentage": 7.3999999999999995, "MinorityClassSize": 37, "NaiveBayesAUC": 0.9426624116134431, "NaiveBayesErrRate": 0.296, "NaiveBayesKappa": 0.670663213080901, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "PercentageOfMissingValues": 0, "PercentageOfNumericFeatures": 87.5, "PercentageOfSymbolicFeatures": 12.5, "Quartile1AttributeEntropy": null, "Quartile1KurtosisOfNumericAtts": -1.8253446979076169, "Quartile1MeansOfNumericAtts": 0.5900000000000001, "Quartile1MutualInformation": null, "Quartile1SkewnessOfNumericAtts": -1.0623385393261326, "Quartile1StdDevOfNumericAtts": 0.44230676067756874, "Quartile2AttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": -1.4799416454808219, "Quartile2MeansOfNumericAtts": 0.67, "Quartile2MutualInformation": null, "Quartile2SkewnessOfNumericAtts": -0.7252545765089368, "Quartile2StdDevOfNumericAtts": 0.4706836370348403, "Quartile3AttributeEntropy": null, "Quartile3KurtosisOfNumericAtts": -0.8749526989054361, "Quartile3MeansOfNumericAtts": 0.734, "Quartile3MutualInformation": null, "Quartile3SkewnessOfNumericAtts": -0.36707981414182267, "Quartile3StdDevOfNumericAtts": 0.4895542121699178, "REPTreeDepth1AUC": 0.8875253668134538, "REPTreeDepth1ErrRate": 0.308, "REPTreeDepth1Kappa": 0.6574931165012698, "REPTreeDepth2AUC": 0.8875253668134538, "REPTreeDepth2ErrRate": 0.308, "REPTreeDepth2Kappa": 0.6574931165012698, "REPTreeDepth3AUC": 0.8875253668134538, "REPTreeDepth3ErrRate": 0.308, "REPTreeDepth3Kappa": 0.6574931165012698, "RandomTreeDepth1AUC": 0.8737675816131757, "RandomTreeDepth1ErrRate": 0.326, "RandomTreeDepth1Kappa": 0.637629608551052, "RandomTreeDepth2AUC": 0.8737675816131757, "RandomTreeDepth2ErrRate": 0.326, "RandomTreeDepth2Kappa": 0.637629608551052, "RandomTreeDepth3AUC": 0.8737675816131757, "RandomTreeDepth3ErrRate": 0.326, "RandomTreeDepth3Kappa": 0.637629608551052, "StdvNominalAttDistinctValues": 0, "kNN1NAUC": 0.9200048199492538, "kNN1NErrRate": 0.296, "kNN1NKappa": 0.6707496674126707 }, "tags": [ { "tag": "study_14", "uploader": "1" }, { "tag": "study_1", "uploader": "0" }, { "tag": "study_407", "uploader": "0" }, { "tag": "study_662", "uploader": "0" }, { "tag": "study_102", "uploader": "0" }, { "tag": "study_366", "uploader": "0" }, { "tag": "study_277", "uploader": "0" }, { "tag": "study_446", "uploader": "0" }, { "tag": "study_110", "uploader": "0" }, { "tag": "study_263", "uploader": "0" }, { "tag": "study_429", "uploader": "0" }, { "tag": "study_237", "uploader": "0" }, { "tag": "study_538", "uploader": "0" }, { "tag": "study_201", "uploader": "0" }, { "tag": "study_263", "uploader": "0" }, { "tag": "study_344", "uploader": "0" }, { "tag": "study_521", "uploader": "0" }, { "tag": "study_114", "uploader": "0" }, { "tag": "study_121", "uploader": "0" }, { "tag": "study_201", "uploader": "0" } ], "features": [ { "name": "Class", "index": "7", "type": "nominal", "distinct": "10", "missing": "0", "target": "1", "distr": [ [ "1", "2", "3", "4", "5", "6", "7", "8", "9", "10" ], [ [ "45", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "37", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "51", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "57", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "52", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "52", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "47", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "57", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "53", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "49" ] ] ] }, { "name": "V1", "index": "0", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "V2", "index": "1", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "V3", "index": "2", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "V4", "index": "3", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "V5", "index": "4", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "V6", "index": "5", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "V7", "index": "6", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 11, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 11 }