{ "data_id": "21", "name": "sick", "exact_name": "sick", "version": 1, "version_label": "1", "description": "**Author**: \n**Source**: Unknown - \n**Please cite**: \n\n;\n ; Thyroid disease records supplied by the Garavan Institute and J. Ross\n ; Quinlan, New South Wales Institute, Syndney, Australia.\n ;\n ; 1987.\n ;\n \n sick, negative.\t\t\t| classes\n \n age:\t\t\t\tcontinuous.\n sex:\t\t\t\tM, F.\n on thyroxine:\t\t\tf, t.\n query on thyroxine:\t\tf, t.\n on antithyroid medication:\tf, t.\n sick:\t\t\t\tf, t.\n pregnant:\t\t\tf, t.\n thyroid surgery:\t\tf, t.\n I131 treatment:\t\t\tf, t.\n query hypothyroid:\t\tf, t.\n query hyperthyroid:\t\tf, t.\n lithium:\t\t\tf, t.\n goitre:\t\t\t\tf, t.\n tumor:\t\t\t\tf, t.\n hypopituitary:\t\t\tf, t.\n psych:\t\t\t\tf, t.\n TSH measured:\t\t\tf, t.\n TSH:\t\t\t\tcontinuous.\n T3 measured:\t\t\tf, t.\n T3:\t\t\t\tcontinuous.\n TT4 measured:\t\t\tf, t.\n TT4:\t\t\t\tcontinuous.\n T4U measured:\t\t\tf, t.\n T4U:\t\t\t\tcontinuous.\n FTI measured:\t\t\tf, t.\n FTI:\t\t\t\tcontinuous.\n TBG measured:\t\t\tf, t.\n TBG:\t\t\t\tcontinuous.\n referral source:\t\tWEST, STMW, SVHC, SVI, SVHD, other.\n \n\n Num Instances: 3772\n Num Attributes: 30\n Num Continuous: 7 (Int 1 \/ Real 6)\n Num Discrete: 23\n Missing values: 6064 \/ 5.4%\n\n name type enum ints real missing distinct (1)\n 1 'age' Int 0% 100% 0% 1 \/ 0% 93 \/ 2% 0% \n 2 'sex' Enum 96% 0% 0% 150 \/ 4% 2 \/ 0% 0% \n 3 'on thyroxine' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 4 'query on thyroxine' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 5 'on antithyroid medicati Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 6 'sick' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 7 'pregnant' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 8 'thyroid surgery' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 9 'I131 treatment' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 10 'query hypothyroid' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 11 'query hyperthyroid' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 12 'lithium' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 13 'goitre' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 14 'tumor' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 15 'hypopituitary' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 16 'psych' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 17 'TSH measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 18 'TSH' Real 0% 11% 79% 369 \/ 10% 287 \/ 8% 2% \n 19 'T3 measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 20 'T3' Real 0% 9% 71% 769 \/ 20% 69 \/ 2% 0% \n 21 'TT4 measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 22 'TT4' Real 0% 94% 0% 231 \/ 6% 241 \/ 6% 1% \n 23 'T4U measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 24 'T4U' Real 0% 2% 87% 387 \/ 10% 146 \/ 4% 1% \n 25 'FTI measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 26 'FTI' Real 0% 90% 0% 385 \/ 10% 234 \/ 6% 2% \n 27 'TBG measured' Enum 100% 0% 0% 0 \/ 0% 1 \/ 0% 0% \n 28 'TBG' Real 0% 0% 0% 3772 \/100% 0 \/ 0% 0% \n 29 'referral source' Enum 100% 0% 0% 0 \/ 0% 5 \/ 0% 0% \n 30 'Class' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0%", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": null, "contributor": null, "date": "2014-04-06 23:22:19", "update_comment": null, "last_update": "2014-04-06 23:22:19", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/38\/dataset_38_sick.arff", "default_target_attribute": "Class", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "sick", "; ; Thyroid disease records supplied by the Garavan Institute and J. Ross ; Quinlan, New South Wales Institute, Syndney, Australia. ; ; 1987. ; sick, negative. | classes age: continuous. sex: M, F. on thyroxine: f, t. query on thyroxine: f, t. on antithyroid medication: f, t. sick: f, t. pregnant: f, t. thyroid surgery: f, t. I131 treatment: f, t. query hypothyroid: f, t. query hyperthyroid: f, t. lithium: f, t. goitre: f, t. tumor: f, t. hypopituitary: f, t. psych: f, t. TSH measured: f, t. TSH " ], "weight": 5 }, "qualities": { "NumberOfInstances": 3772, "NumberOfFeatures": 30, "NumberOfClasses": 2, "NumberOfMissingValues": 6064, "NumberOfInstancesWithMissingValues": 3772, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 23, "AutoCorrelation": 0.8865022540440202, "CfsSubsetEval_DecisionStumpAUC": 0.9322127557089432, "CfsSubsetEval_DecisionStumpErrRate": 0.0344644750795334, "CfsSubsetEval_DecisionStumpKappa": 0.7420165388043194, "CfsSubsetEval_NaiveBayesAUC": 0.9340166093907973, "CfsSubsetEval_NaiveBayesErrRate": 0.0408271474019088, "CfsSubsetEval_NaiveBayesKappa": 0.6067274088697694, "CfsSubsetEval_kNN1NAUC": 0.8676933534318454, "CfsSubsetEval_kNN1NErrRate": 0.03870625662778367, "CfsSubsetEval_kNN1NKappa": 0.65064369732333, "ClassEntropy": 0.33235055553211046, "DecisionStumpAUC": 0.9322127557089432, "DecisionStumpErrRate": 0.0344644750795334, "DecisionStumpKappa": 0.7420165388043194, "Dimensionality": 0.007953340402969246, "EquivalentNumberOfAtts": 64.92919423455584, "J48.00001.AUC": 0.9284149438060761, "J48.00001.ErrRate": 0.01855779427359491, "J48.00001.Kappa": 0.8379448629552658, "J48.0001.AUC": 0.9284149438060761, "J48.0001.ErrRate": 0.01855779427359491, "J48.0001.Kappa": 0.8379448629552658, "J48.001.AUC": 0.9288299951954286, "J48.001.ErrRate": 0.018292682926829267, "J48.001.Kappa": 0.8431281311930718, "MajorityClassPercentage": 93.87592788971368, "MajorityClassSize": 3541, "MaxAttributeEntropy": 1.520689912507409, "MaxKurtosisOfNumericAtts": 238.1814623780636, "MaxMeansOfNumericAtts": 110.46964865662825, "MaxMutualInformation": 0.06006915971583, "MaxNominalAttDistinctValues": 5, "MaxSkewnessOfNumericAtts": 13.882652755041702, "MaxStdDevOfNumericAtts": 35.604247607641, "MeanAttributeEntropy": 0.33755530471128503, "MeanKurtosisOfNumericAtts": 51.41313506551009, "MeanMeansOfNumericAtts": 46.43668969641138, "MeanMutualInformation": 0.005118661327160454, "MeanNoiseToSignalRatio": 64.94601266549154, "MeanNominalAttDistinctValues": 2.0869565217391304, "MeanSkewnessOfNumericAtts": 3.5691918824691085, "MeanStdDevOfNumericAtts": 19.05387758896556, "MinAttributeEntropy": -0, "MinKurtosisOfNumericAtts": 4.073471498748956, "MinMeansOfNumericAtts": 0.9949997045790251, "MinMutualInformation": 0, "MinNominalAttDistinctValues": 1, "MinSkewnessOfNumericAtts": 1.232674238507278, "MinStdDevOfNumericAtts": 0.19545727511328811, "MinorityClassPercentage": 6.1240721102863205, "MinorityClassSize": 231, "NaiveBayesAUC": 0.921866947220681, "NaiveBayesErrRate": 0.07423117709437964, "NaiveBayesKappa": 0.5196307538926299, "NumberOfBinaryFeatures": 21, "PercentageOfBinaryFeatures": 70, "PercentageOfInstancesWithMissingValues": 100, "PercentageOfMissingValues": 5.358784022622834, "PercentageOfNumericFeatures": 23.333333333333332, "PercentageOfSymbolicFeatures": 76.66666666666667, "Quartile1AttributeEntropy": 0.0987401719719687, "Quartile1KurtosisOfNumericAtts": 5.982197043232063, "Quartile1MeansOfNumericAtts": 1.7588748012696314, "Quartile1MutualInformation": 0.0005017739084375, "Quartile1SkewnessOfNumericAtts": 1.2589465934783108, "Quartile1StdDevOfNumericAtts": 0.669439962143292, "Quartile2AttributeEntropy": 0.25937485231702934, "Quartile2KurtosisOfNumericAtts": 8.87130380657577, "Quartile2MeansOfNumericAtts": 28.41132258295655, "Quartile2MutualInformation": 0.00129044182719, "Quartile2SkewnessOfNumericAtts": 1.5381528946217138, "Quartile2StdDevOfNumericAtts": 22.3032143933016, "Quartile3AttributeEntropy": 0.4759318019149815, "Quartile3KurtosisOfNumericAtts": 90.94248810329343, "Quartile3MeansOfNumericAtts": 108.85692077754308, "Quartile3MutualInformation": 0.0033491752406775003, "Quartile3SkewnessOfNumericAtts": 4.937524038925616, "Quartile3StdDevOfNumericAtts": 33.71833515687218, "REPTreeDepth1AUC": 0.8123368676884632, "REPTreeDepth1ErrRate": 0.04984093319194061, "REPTreeDepth1Kappa": 0.49019771359063496, "REPTreeDepth2AUC": 0.9297395628940391, "REPTreeDepth2ErrRate": 0.0299575821845175, "REPTreeDepth2Kappa": 0.7576017452110199, "REPTreeDepth3AUC": 0.934156589903554, "REPTreeDepth3ErrRate": 0.0204135737009544, "REPTreeDepth3Kappa": 0.8206462672410385, "RandomTreeDepth1AUC": 0.599974815733076, "RandomTreeDepth1ErrRate": 0.0612407211028632, "RandomTreeDepth1Kappa": 0, "RandomTreeDepth2AUC": 0.7606296555745864, "RandomTreeDepth2ErrRate": 0.0612407211028632, "RandomTreeDepth2Kappa": 0, "RandomTreeDepth3AUC": 0.8360320842670461, "RandomTreeDepth3ErrRate": 0.05885471898197243, "RandomTreeDepth3Kappa": 0.09725938495173561, "StdvNominalAttDistinctValues": 0.668311541278118, "kNN1NAUC": 0.7895585540318668, "kNN1NErrRate": 0.04109225874867444, "kNN1NKappa": 0.6153785428776684 }, "tags": [ { "tag": "study_14", "uploader": "1" }, { "tag": "study_1", "uploader": "0" }, { "tag": "study_286", "uploader": "0" }, { "tag": "study_106", "uploader": "0" }, { "tag": "study_293", "uploader": "0" }, { "tag": "study_380", "uploader": "0" }, { "tag": "study_101", "uploader": "0" }, { "tag": "study_380", "uploader": "0" }, { "tag": "study_429", "uploader": "0" }, { "tag": "study_615", "uploader": "0" }, { "tag": "study_79", "uploader": "0" }, { "tag": "study_201", "uploader": "0" }, { "tag": "study_284", "uploader": "0" }, { "tag": "study_757", "uploader": "0" }, { "tag": "study_275", "uploader": "0" } ], "features": [ { "name": "Class", "index": "29", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "negative", "sick" ], [ [ "3541", "0" ], [ "0", "231" ] ] ] }, { "name": "psych", "index": "15", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3364", "224" ], [ "177", "7" ] ] ] }, { "name": "referral_source", "index": "28", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "SVHC", "other", "SVI", "STMW", "SVHD" ], [ [ "377", "9" ], [ "2168", "33" ], [ "848", "186" ], [ "112", "0" ], [ "36", "3" ] ] ] }, { "name": "TBG", "index": "27", "type": "numeric", "distinct": "0", "missing": "3772", "min": "2147483647", "max": "0", "mean": "0", "stdev": "0" }, { "name": "TBG_measured", "index": "26", "type": "nominal", "distinct": "1", "missing": "0", "distr": [ [ "f" ], [ [ "3541", "231" ] ] ] }, { "name": "FTI", "index": "25", "type": "numeric", "distinct": "234", "missing": "385", "min": "2", "max": "395", "mean": "110", "stdev": "33" }, { "name": "FTI_measured", "index": "24", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3164", "223" ], [ "377", "8" ] ] ] }, { "name": "T4U", "index": "23", "type": "numeric", "distinct": "146", "missing": "387", "min": "0", "max": "2", "mean": "1", "stdev": "0" }, { "name": "T4U_measured", "index": "22", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3162", "223" ], [ "379", "8" ] ] ] }, { "name": "TT4", "index": "21", "type": "numeric", "distinct": "241", "missing": "231", "min": "2", "max": "430", "mean": "108", "stdev": "36" }, { "name": "TT4_measured", "index": "20", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3310", "231" ], [ "231", "0" ] ] ] }, { "name": "T3", "index": "19", "type": "numeric", "distinct": "69", "missing": "769", "min": "0", "max": "11", "mean": "2", "stdev": "1" }, { "name": "T3_measured", "index": "18", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "2775", "228" ], [ "766", "3" ] ] ] }, { "name": "TSH", "index": "17", "type": "numeric", "distinct": "287", "missing": "369", "min": "0", "max": "530", "mean": "5", "stdev": "25" }, { "name": "TSH_measured", "index": "16", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3174", "229" ], [ "367", "2" ] ] ] }, { "name": "age", "index": "0", "type": "numeric", "distinct": "93", "missing": "1", "min": "1", "max": "455", "mean": "52", "stdev": "20" }, { "name": "hypopituitary", "index": "14", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3541", "230" ], [ "0", "1" ] ] ] }, { "name": "tumor", "index": "13", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3447", "229" ], [ "94", "2" ] ] ] }, { "name": "goitre", "index": "12", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3509", "229" ], [ "32", "2" ] ] ] }, { "name": "lithium", "index": "11", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3524", "230" ], [ "17", "1" ] ] ] }, { "name": "query_hyperthyroid", "index": "10", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3312", "223" ], [ "229", "8" ] ] ] }, { "name": "query_hypothyroid", "index": "9", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3335", "203" ], [ "206", "28" ] ] ] }, { "name": "I131_treatment", "index": "8", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3483", "230" ], [ "58", "1" ] ] ] }, { "name": "thyroid_surgery", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3488", "231" ], [ "53", "0" ] ] ] }, { "name": "pregnant", "index": "6", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3488", "231" ], [ "53", "0" ] ] ] }, { "name": "sick", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3419", "206" ], [ "122", "25" ] ] ] }, { "name": "on_antithyroid_medication", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3498", "231" ], [ "43", "0" ] ] ] }, { "name": "query_on_thyroxine", "index": "3", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3495", "227" ], [ "46", "4" ] ] ] }, { "name": "on_thyroxine", "index": "2", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3089", "219" ], [ "452", "12" ] ] ] }, { "name": "sex", "index": "1", "type": "nominal", "distinct": "2", "missing": "150", "distr": [ [ "F", "M" ], [ [ "2344", "136" ], [ "1053", "89" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }