{ "data_id": "8", "name": "mfeat-karhunen", "exact_name": "mfeat-karhunen", "version": 1, "version_label": "1", "description": "**Author**: \n**Source**: Unknown - \n**Please cite**: \n\nThe multi-feature digit dataset\n -------------------------------\n \n Oowned and donated by:\n ----------------------\n \n Robert P.W. Duin\n Department of Applied Physics \n Delft University of Technology \n P.O. Box 5046, 2600 GA Delft\n The Netherlands\n \n email: duin@ph.tn.tudelft.nl\n http : \/\/www.ph.tn.tudelft.nl\/~duin\n tel +31 15 2786143\n \n Usage\n -----\n A slightly different version of the database is used in\n \n M. van Breukelen, R.P.W. Duin, D.M.J. Tax, and J.E. den Hartog, Handwritten\n digit recognition by combined classifiers, Kybernetika, vol. 34, no. 4,\n 1998, 381-386.\n \n M. van Breukelen and R.P.W. Duin, Neural Network Initialization by Combined\n Classifiers, in: A.K. Jain, S. Venkatesh, B.C. Lovell (eds.), ICPR'98,\n Proc. 14th Int. Conference on Pattern Recognition (Brisbane, Aug. 16-20),\n \n The database as it is is used in:\n \n A.K. Jain, R.P.W. Duin, J. Mao, Statisitcal Pattern Recognition: A Review,\n in preparation\n \n Description\n -----------\n \n This dataset consists of features of handwritten numerals (`0'--`9')\n extracted from a collection of Dutch utility maps. 200 patterns per\n class (for a total of 2,000 patterns) have been digitized in binary\n images. These digits are represented in terms of the following six\n feature sets (files): \n \n 1. mfeat-fou: 76 Fourier coefficients of the character shapes; \n 2. mfeat-fac: 216 profile correlations; \n 3. mfeat-kar: 64 Karhunen-Love coefficients; \n 4. mfeat-pix: 240 pixel averages in 2 x 3 windows; \n 5. mfeat-zer: 47 Zernike moments; \n 6. mfeat-mor: 6 morphological features. \n \n In each file the 2000 patterns are stored in ASCI on 2000 lines. The\n first 200 patterns are of class `0', followed by sets of 200 patterns\n for each of the classes `1' - `9'. Corresponding patterns in different\n feature sets (files) correspond to the same original character.\n \n The source image dataset is lost. Using the pixel-dataset (mfeat-pix)\n sampled versions of the original images may be obtained (15 x 16 pixels).\n \n Total number of instances:\n --------------------------\n 2000 (200 instances per class)\n \n Total number of attributes:\n ---------------------------\n 649 (distributed over 6 datasets,see above)\n \n no missing attributes\n \n Total number of classes:\n ------------------------\n 10\n \n Format:\n ------\n 6 files, see above.\n Each file contains 2000 lines, one for each instance.\n Attributes are SPACE separated and can be loaded by Matlab as\n > load filename\n No missing attributes. Some are integer, others are real.\n \n\n Information about the dataset\n CLASSTYPE: nominal\n CLASSINDEX: last", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": null, "contributor": null, "date": "2014-04-06 23:20:30", "update_comment": null, "last_update": "2014-04-06 23:20:30", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/16\/dataset_16_mfeat-karhunen.arff", "default_target_attribute": "class", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "mfeat-karhunen", "The multi-feature digit dataset ------------------------------- Oowned and donated by: ---------------------- Robert P.W. Duin Department of Applied Physics Delft University of Technology P.O. Box 5046, 2600 GA Delft The Netherlands email: duin@ph.tn.tudelft.nl http : \/\/www.ph.tn.tudelft.nl\/~duin tel +31 15 2786143 Usage ----- A slightly different version of the database is used in M. van Breukelen, R.P.W. Duin, D.M.J. Tax, and J.E. den Hartog, Handwritten digit recognition by combined classifie " ], "weight": 5 }, "qualities": { "NumberOfInstances": 2000, "NumberOfFeatures": 65, "NumberOfClasses": 10, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 64, "NumberOfSymbolicFeatures": 1, "AutoCorrelation": 0.9954977488744372, "CfsSubsetEval_DecisionStumpAUC": 0.8933529166666667, "CfsSubsetEval_DecisionStumpErrRate": 0.2105, "CfsSubsetEval_DecisionStumpKappa": 0.7661111111111111, "CfsSubsetEval_NaiveBayesAUC": 0.8933529166666667, "CfsSubsetEval_NaiveBayesErrRate": 0.2105, "CfsSubsetEval_NaiveBayesKappa": 0.7661111111111111, "CfsSubsetEval_kNN1NAUC": 0.8933529166666667, "CfsSubsetEval_kNN1NErrRate": 0.2105, "CfsSubsetEval_kNN1NKappa": 0.7661111111111111, "ClassEntropy": 3.321928094887362, "DecisionStumpAUC": 0.6936666666666667, "DecisionStumpErrRate": 0.8045, "DecisionStumpKappa": 0.10611111111111111, "Dimensionality": 0.0325, "EquivalentNumberOfAtts": null, "J48.00001.AUC": 0.8896487500000001, "J48.00001.ErrRate": 0.21, "J48.00001.Kappa": 0.7666666666666667, "J48.0001.AUC": 0.8896487500000001, "J48.0001.ErrRate": 0.21, "J48.0001.Kappa": 0.7666666666666667, "J48.001.AUC": 0.8896487500000001, "J48.001.ErrRate": 0.21, "J48.001.Kappa": 0.7666666666666667, "MajorityClassPercentage": 10, "MajorityClassSize": 200, "MaxAttributeEntropy": null, "MaxKurtosisOfNumericAtts": 0.580942601366925, "MaxMeansOfNumericAtts": 2.891171124290001, "MaxMutualInformation": null, "MaxNominalAttDistinctValues": 10, "MaxSkewnessOfNumericAtts": 0.4187220480956684, "MaxStdDevOfNumericAtts": 7.691305182325387, "MeanAttributeEntropy": null, "MeanKurtosisOfNumericAtts": -0.045654845752496065, "MeanMeansOfNumericAtts": 0.053084739246640686, "MeanMutualInformation": null, "MeanNoiseToSignalRatio": null, "MeanNominalAttDistinctValues": 10, "MeanSkewnessOfNumericAtts": -0.004285662607736754, "MeanStdDevOfNumericAtts": 2.152662828702679, "MinAttributeEntropy": null, "MinKurtosisOfNumericAtts": -0.944709265915264, "MinMeansOfNumericAtts": -1.8197072740500002, "MinMutualInformation": null, "MinNominalAttDistinctValues": 10, "MinSkewnessOfNumericAtts": -0.3391130927319128, "MinStdDevOfNumericAtts": 0.8923441138647591, "MinorityClassPercentage": 10, "MinorityClassSize": 200, "NaiveBayesAUC": 0.9956313888888889, "NaiveBayesErrRate": 0.068, "NaiveBayesKappa": 0.9244444444444445, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "PercentageOfMissingValues": 0, "PercentageOfNumericFeatures": 98.46153846153847, "PercentageOfSymbolicFeatures": 1.5384615384615385, "Quartile1AttributeEntropy": null, "Quartile1KurtosisOfNumericAtts": -0.14952953711034322, "Quartile1MeansOfNumericAtts": -0.29841679518749986, "Quartile1MutualInformation": null, "Quartile1SkewnessOfNumericAtts": -0.10420201025097077, "Quartile1StdDevOfNumericAtts": 1.1438482801014436, "Quartile2AttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": -0.017345885787890536, "Quartile2MeansOfNumericAtts": 0.004483087817499813, "Quartile2MutualInformation": null, "Quartile2SkewnessOfNumericAtts": -0.020815908469464905, "Quartile2StdDevOfNumericAtts": 1.6476505065816718, "Quartile3AttributeEntropy": null, "Quartile3KurtosisOfNumericAtts": 0.07165494057478039, "Quartile3MeansOfNumericAtts": 0.33246113886500006, "Quartile3MutualInformation": null, "Quartile3SkewnessOfNumericAtts": 0.0591765364965291, "Quartile3StdDevOfNumericAtts": 2.6614803695239697, "REPTreeDepth1AUC": 0.9227765277777779, "REPTreeDepth1ErrRate": 0.2055, "REPTreeDepth1Kappa": 0.7716666666666666, "REPTreeDepth2AUC": 0.9227765277777779, "REPTreeDepth2ErrRate": 0.2055, "REPTreeDepth2Kappa": 0.7716666666666666, "REPTreeDepth3AUC": 0.9227765277777779, "REPTreeDepth3ErrRate": 0.2055, "REPTreeDepth3Kappa": 0.7716666666666666, "RandomTreeDepth1AUC": 0.83, "RandomTreeDepth1ErrRate": 0.306, "RandomTreeDepth1Kappa": 0.6599999999999999, "RandomTreeDepth2AUC": 0.83, "RandomTreeDepth2ErrRate": 0.306, "RandomTreeDepth2Kappa": 0.6599999999999999, "RandomTreeDepth3AUC": 0.83, "RandomTreeDepth3ErrRate": 0.306, "RandomTreeDepth3Kappa": 0.6599999999999999, "StdvNominalAttDistinctValues": 0, "kNN1NAUC": 0.972274861111111, "kNN1NErrRate": 0.05, "kNN1NKappa": 0.9444444444444444 }, "tags": [ { "tag": "study_14", "uploader": "1" }, { "tag": "study_1", "uploader": "0" }, { "tag": "study_170", "uploader": "0" }, { "tag": "study_661", "uploader": "0" }, { "tag": "study_249", "uploader": "0" }, { "tag": "study_697", "uploader": "0" }, { "tag": "study_509", "uploader": "0" }, { "tag": "study_407", "uploader": "0" }, { "tag": "study_781", "uploader": "0" }, { "tag": "study_117", "uploader": "0" }, { "tag": "study_122", "uploader": "0" }, { "tag": "study_213", "uploader": "0" }, { "tag": "study_118", "uploader": "0" }, { "tag": "study_251", "uploader": "0" }, { "tag": "study_391", "uploader": "0" } ], "features": [ { "name": "class", "index": "64", "type": "nominal", "distinct": "10", "missing": "0", "target": "1", "distr": [ [ "1", "2", "3", "4", "5", "6", "7", "8", "9", "10" ], [ [ "200", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "200", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "200", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "200", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "200", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "200", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "200", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "200", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "200", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "200" ] ] ] }, { "name": "att48", "index": "47", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att34", "index": "33", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-7", "max": "5", "mean": "0", "stdev": "2" }, { "name": "att47", "index": "46", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att46", "index": "45", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att45", "index": "44", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "5", "mean": "0", "stdev": "1" }, { "name": "att44", "index": "43", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "5", "mean": "0", "stdev": "1" }, { "name": "att43", "index": "42", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "5", "mean": "0", "stdev": "2" }, { "name": "att42", "index": "41", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "5", "mean": "0", "stdev": "1" }, { "name": "att41", "index": "40", "type": "numeric", "distinct": "1993", "missing": "0", "min": "-5", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att40", "index": "39", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "5", "mean": "0", "stdev": "1" }, { "name": "att39", "index": "38", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-6", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att38", "index": "37", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "5", "mean": "0", "stdev": "2" }, { "name": "att37", "index": "36", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "5", "mean": "0", "stdev": "2" }, { "name": "att36", "index": "35", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-6", "max": "6", "mean": "0", "stdev": "2" }, { "name": "att35", "index": "34", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "5", "mean": "0", "stdev": "2" }, { "name": "att33", "index": "32", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-6", "max": "5", "mean": "0", "stdev": "2" }, { "name": "att49", "index": "48", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "5", "mean": "0", "stdev": "1" }, { "name": "att50", "index": "49", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att51", "index": "50", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att52", "index": "51", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att53", "index": "52", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att54", "index": "53", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-3", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att55", "index": "54", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att56", "index": "55", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att57", "index": "56", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-3", "max": "4", "mean": "0", "stdev": "1" }, { "name": "att58", "index": "57", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att59", "index": "58", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-3", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att60", "index": "59", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-4", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att61", "index": "60", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-3", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att62", "index": "61", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-3", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att63", "index": "62", "type": "numeric", "distinct": "1993", "missing": "0", "min": "-3", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att64", "index": "63", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-3", "max": "3", "mean": "0", "stdev": "1" }, { "name": "att17", "index": "16", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-8", "max": "8", "mean": "0", "stdev": "2" }, { "name": "att2", "index": "1", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-16", "max": "15", "mean": "-1", "stdev": "6" }, { "name": "att3", "index": "2", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-14", "max": "15", "mean": "1", "stdev": "6" }, { "name": "att4", "index": "3", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-14", "max": "17", "mean": "2", "stdev": "6" }, { "name": "att5", "index": "4", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-8", "max": "15", "mean": "3", "stdev": "4" }, { "name": "att6", "index": "5", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-9", "max": "14", "mean": "1", "stdev": "3" }, { "name": "att7", "index": "6", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-13", "max": "12", "mean": "-1", "stdev": "4" }, { "name": "att8", "index": "7", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-11", "max": "9", "mean": "-1", "stdev": "3" }, { "name": "att9", "index": "8", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-11", "max": "17", "mean": "0", "stdev": "4" }, { "name": "att10", "index": "9", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-13", "max": "8", "mean": "-2", "stdev": "4" }, { "name": "att11", "index": "10", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-9", "max": "13", "mean": "0", "stdev": "3" }, { "name": "att12", "index": "11", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-10", "max": "11", "mean": "2", "stdev": "3" }, { "name": "att13", "index": "12", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-8", "max": "10", "mean": "1", "stdev": "3" }, { "name": "att14", "index": "13", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-10", "max": "10", "mean": "0", "stdev": "3" }, { "name": "att15", "index": "14", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-7", "max": "9", "mean": "-1", "stdev": "3" }, { "name": "att16", "index": "15", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-8", "max": "10", "mean": "1", "stdev": "3" }, { "name": "att1", "index": "0", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-16", "max": "16", "mean": "-1", "stdev": "8" }, { "name": "att18", "index": "17", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-7", "max": "9", "mean": "1", "stdev": "2" }, { "name": "att19", "index": "18", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-12", "max": "8", "mean": "-1", "stdev": "3" }, { "name": "att20", "index": "19", "type": "numeric", "distinct": "1993", "missing": "0", "min": "-9", "max": "7", "mean": "1", "stdev": "2" }, { "name": "att21", "index": "20", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-9", "max": "6", "mean": "0", "stdev": "3" }, { "name": "att22", "index": "21", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-8", "max": "8", "mean": "0", "stdev": "2" }, { "name": "att23", "index": "22", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-9", "max": "9", "mean": "1", "stdev": "3" }, { "name": "att24", "index": "23", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-7", "max": "6", "mean": "0", "stdev": "2" }, { "name": "att25", "index": "24", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-7", "max": "8", "mean": "0", "stdev": "2" }, { "name": "att26", "index": "25", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-8", "max": "5", "mean": "-1", "stdev": "2" }, { "name": "att27", "index": "26", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "7", "mean": "1", "stdev": "2" }, { "name": "att28", "index": "27", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-7", "max": "7", "mean": "0", "stdev": "2" }, { "name": "att29", "index": "28", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "5", "mean": "0", "stdev": "2" }, { "name": "att30", "index": "29", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-7", "max": "5", "mean": "0", "stdev": "2" }, { "name": "att31", "index": "30", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-6", "max": "6", "mean": "-1", "stdev": "2" }, { "name": "att32", "index": "31", "type": "numeric", "distinct": "1994", "missing": "0", "min": "-5", "max": "6", "mean": "0", "stdev": "2" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }