{ "data_id": "31", "name": "eucalyptus", "exact_name": "eucalyptus", "version": 1, "version_label": "1", "description": "**Author**: Bruce Bulloch \n**Source**: [WEKA Dataset Collection](http:\/\/www.cs.waikato.ac.nz\/ml\/weka\/datasets.html) \n**Please cite**: \n\n**Eucalyptus Soil Conservation** \nThe objective was to determine which seedlots in a species are best for soil conservation in seasonally dry hill country. Determination is found by measurement of height, diameter by height, survival, and other contributing factors. \n \nIt is important to note that eucalypt trial methods changed over time; earlier trials included mostly 15 - 30cm tall seedling grown in peat plots and the later trials have included mostly three replications of eight trees grown. This change may contribute to less significant results.\n\nExperimental data recording procedures which require noting include:\n - instances with no data recorded due to experimental recording procedures\n require that the absence of a species from one replicate at a site was\n treated as a missing value, but if absent from two or more replicates at a\n site the species was excluded from the site's analyses.\n - missing data for survival, vigour, insect resistance, stem form, crown form\n and utility especially for the data recorded at the Morea Station; this \n could indicate the death of species in these areas or a lack in collection\n of data. \n\n Attribute Information: \n 1. Abbrev - site abbreviation - enumerated\n 2. Rep - site rep - integer\n 3. Locality - site locality in the North Island - enumerated\n 4. Map_Ref - map location in the North Island - enumerated\n 5. Latitude - latitude approximation - enumerated\n 6. Altitude - altitude approximation - integer\n 7. Rainfall - rainfall (mm pa) - integer\n 8. Frosts - frosts (deg. c) - integer\n 9. Year - year of planting - integer\n 10. Sp - species code - enumerated\n 11. PMCno - seedlot number - integer\n 12. DBH - best diameter base height (cm) - real\n 13. Ht - height (m) - real\n 14. Surv - survival - integer\n 15. Vig - vigour - real\n 16. Ins_res - insect resistance - real\n 17. Stem_Fm - stem form - real\n 18. Crown_Fm - crown form - real\n 19. Brnch_Fm - branch form - real\n Class:\n 20. Utility - utility rating - enumerated\n\n Class Distribution:\n none - 180\n low - 107\n average - 130\n good - 214\n best - 105\n\n Contact: Bruce Bulloch, 128 Cook Street, Palmerston North, New Zealand", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": null, "contributor": null, "date": "2014-04-23 13:15:28", "update_comment": null, "last_update": "2014-04-23 13:15:28", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/3625\/dataset_194_eucalyptus.arff", "default_target_attribute": "Utility", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "eucalyptus", "The objective was to determine which seedlots in a species are best for soil conservation in seasonally dry hill country. Determination is found by measurement of height, diameter by height, survival, and other contributing factors. It is important to note that eucalypt trial methods changed over time; earlier trials included mostly 15 - 30cm tall seedling grown in peat plots and the later trials have included mostly three replications of eight trees grown. This change may contribute to less sig " ], "weight": 5 }, "qualities": { "NumberOfInstances": 736, "NumberOfFeatures": 20, "NumberOfClasses": 5, "NumberOfMissingValues": 448, "NumberOfInstancesWithMissingValues": 95, "NumberOfNumericFeatures": 14, "NumberOfSymbolicFeatures": 6, "AutoCorrelation": 0.39319727891156464, "CfsSubsetEval_DecisionStumpAUC": 0.8239493966657213, "CfsSubsetEval_DecisionStumpErrRate": 0.41847826086956524, "CfsSubsetEval_DecisionStumpKappa": 0.4637307109078737, "CfsSubsetEval_NaiveBayesAUC": 0.8239493966657213, "CfsSubsetEval_NaiveBayesErrRate": 0.41847826086956524, "CfsSubsetEval_NaiveBayesKappa": 0.4637307109078737, "CfsSubsetEval_kNN1NAUC": 0.8239493966657213, "CfsSubsetEval_kNN1NErrRate": 0.41847826086956524, "CfsSubsetEval_kNN1NKappa": 0.4637307109078737, "ClassEntropy": 2.262083620428274, "DecisionStumpAUC": 0.7519401667350958, "DecisionStumpErrRate": 0.5054347826086957, "DecisionStumpKappa": 0.30247986100142155, "Dimensionality": 0.02717391304347826, "EquivalentNumberOfAtts": 5.9334684401020565, "J48.00001.AUC": 0.8184137151683228, "J48.00001.ErrRate": 0.3967391304347826, "J48.00001.Kappa": 0.49336985707179887, "J48.0001.AUC": 0.8184137151683228, "J48.0001.ErrRate": 0.3967391304347826, "J48.0001.Kappa": 0.49336985707179887, "J48.001.AUC": 0.8184137151683228, "J48.001.ErrRate": 0.3967391304347826, "J48.001.Kappa": 0.49336985707179887, "MajorityClassPercentage": 29.076086956521742, "MajorityClassSize": 214, "MaxAttributeEntropy": 4.2373637557635595, "MaxKurtosisOfNumericAtts": 734.9416211795777, "MaxMeansOfNumericAtts": 2054.7393689986247, "MaxMutualInformation": 0.42753276429854, "MaxNominalAttDistinctValues": 27, "MaxSkewnessOfNumericAtts": 27.109270846229688, "MaxStdDevOfNumericAtts": 1551.7798185802085, "MeanAttributeEntropy": 3.4626363060529055, "MeanKurtosisOfNumericAtts": 62.86596625813314, "MeanMeansOfNumericAtts": 390.0868288072735, "MeanMutualInformation": 0.381241367214446, "MeanNoiseToSignalRatio": 8.082530396301912, "MeanNominalAttDistinctValues": 13.666666666666666, "MeanSkewnessOfNumericAtts": 2.551453016115177, "MeanStdDevOfNumericAtts": 172.61081562461396, "MinAttributeEntropy": 2.5810641739409617, "MinKurtosisOfNumericAtts": -1.887802596870339, "MinMeansOfNumericAtts": -2.5842391304347836, "MinMutualInformation": 0.24650313929826, "MinNominalAttDistinctValues": 5, "MinSkewnessOfNumericAtts": -0.6970908724266737, "MinStdDevOfNumericAtts": 0.49318784476285216, "MinorityClassPercentage": 14.266304347826086, "MinorityClassSize": 105, "NaiveBayesAUC": 0.8520788174118736, "NaiveBayesErrRate": 0.45108695652173914, "NaiveBayesKappa": 0.42741183362624485, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 12.907608695652172, "PercentageOfMissingValues": 3.0434782608695654, "PercentageOfNumericFeatures": 70, "PercentageOfSymbolicFeatures": 30, "Quartile1AttributeEntropy": 2.908861461974274, "Quartile1KurtosisOfNumericAtts": -0.4961422376730956, "Quartile1MeansOfNumericAtts": 2.882908545727137, "Quartile1MutualInformation": 0.323312362530555, "Quartile1SkewnessOfNumericAtts": -0.3960800165047112, "Quartile1StdDevOfNumericAtts": 0.778502789181291, "Quartile2AttributeEntropy": 3.4759821137655975, "Quartile2KurtosisOfNumericAtts": 0.4289115082721384, "Quartile2MeansOfNumericAtts": 6.249602617058818, "Quartile2MutualInformation": 0.40765214345173, "Quartile2SkewnessOfNumericAtts": 0.11119478923130877, "Quartile2StdDevOfNumericAtts": 1.3465996573398586, "Quartile3AttributeEntropy": 4.009738246275191, "Quartile3KurtosisOfNumericAtts": 1.3641239688052669, "Quartile3MeansOfNumericAtts": 403.0027173913041, "Quartile3MutualInformation": 0.425964983779695, "Quartile3SkewnessOfNumericAtts": 0.9548948008878528, "Quartile3StdDevOfNumericAtts": 80.61760056258042, "REPTreeDepth1AUC": 0.7171370640805235, "REPTreeDepth1ErrRate": 0.5557065217391305, "REPTreeDepth1Kappa": 0.2672017371533179, "REPTreeDepth2AUC": 0.7171370640805235, "REPTreeDepth2ErrRate": 0.5557065217391305, "REPTreeDepth2Kappa": 0.2672017371533179, "REPTreeDepth3AUC": 0.7171370640805235, "REPTreeDepth3ErrRate": 0.5557065217391305, "REPTreeDepth3Kappa": 0.2672017371533179, "RandomTreeDepth1AUC": 0.7219508813313532, "RandomTreeDepth1ErrRate": 0.47690217391304346, "RandomTreeDepth1Kappa": 0.3915134670419616, "RandomTreeDepth2AUC": 0.7219508813313532, "RandomTreeDepth2ErrRate": 0.47690217391304346, "RandomTreeDepth2Kappa": 0.3915134670419616, "RandomTreeDepth3AUC": 0.7219508813313532, "RandomTreeDepth3ErrRate": 0.47690217391304346, "RandomTreeDepth3Kappa": 0.3915134670419616, "StdvNominalAttDistinctValues": 7.659416862050705, "kNN1NAUC": 0.7018152602695222, "kNN1NErrRate": 0.46603260869565216, "kNN1NKappa": 0.40228622299671357 }, "tags": [ { "tag": "study_14", "uploader": "1" }, { "tag": "study_1", "uploader": "0" }, { "tag": "study_105", "uploader": "0" }, { "tag": "study_429", "uploader": "0" }, { "tag": "study_429", "uploader": "0" }, { "tag": "study_391", "uploader": "0" }, { "tag": "study_105", "uploader": "0" }, { "tag": "study_391", "uploader": "0" }, { "tag": "study_407", "uploader": "0" }, { "tag": "study_463", "uploader": "0" }, { "tag": "study_722", "uploader": "0" } ], "features": [ { "name": "Utility", "index": "19", "type": "nominal", "distinct": "5", "missing": "0", "target": "1", "distr": [ [ "none", "low", "average", "good", "best" ], [ [ "180", "0", "0", "0", "0" ], [ "0", "107", "0", "0", "0" ], [ "0", "0", "130", "0", "0" ], [ "0", "0", "0", "214", "0" ], [ "0", "0", "0", "0", "105" ] ] ] }, { "name": "PMCno", "index": "10", "type": "numeric", "distinct": "85", "missing": "7", "min": "1", "max": "3275", "mean": "2055", "stdev": "618" }, { "name": "Brnch_Fm", "index": "18", "type": "numeric", "distinct": "28", "missing": "69", "min": "0", "max": "5", "mean": "3", "stdev": "1" }, { "name": "Crown_Fm", "index": "17", "type": "numeric", "distinct": "29", "missing": "69", "min": "0", "max": "5", "mean": "3", "stdev": "1" }, { "name": "Stem_Fm", "index": "16", "type": "numeric", "distinct": "26", "missing": "69", "min": "0", "max": "5", "mean": "3", "stdev": "1" }, { "name": "Ins_res", "index": "15", "type": "numeric", "distinct": "28", "missing": "69", "min": "0", "max": "5", "mean": "3", "stdev": "1" }, { "name": "Vig", "index": "14", "type": "numeric", "distinct": "33", "missing": "69", "min": "1", "max": "5", "mean": "3", "stdev": "1" }, { "name": "Surv", "index": "13", "type": "numeric", "distinct": "47", "missing": "94", "min": "2", "max": "100", "mean": "60", "stdev": "31" }, { "name": "Ht", "index": "12", "type": "numeric", "distinct": "531", "missing": "1", "min": "1", "max": "22", "mean": "9", "stdev": "4" }, { "name": "DBH", "index": "11", "type": "numeric", "distinct": "603", "missing": "1", "min": "1", "max": "42085", "mean": "73", "stdev": "1552" }, { "name": "Abbrev", "index": "0", "type": "nominal", "distinct": "16", "missing": "0", "distr": [ [ "Cra", "Cly", "Nga", "Wai", "K81", "Wak", "K82", "WSp", "K83", "Lon", "Puk", "Paw", "K81a", "Mor", "Wen", "WSh" ], [ [ "0", "4", "7", "13", "6" ], [ "0", "5", "1", "11", "7" ], [ "4", "1", "3", "13", "1" ], [ "14", "14", "5", "14", "23" ], [ "7", "17", "9", "16", "16" ], [ "29", "12", "10", "14", "8" ], [ "10", "14", "11", "4", "6" ], [ "4", "1", "17", "31", "6" ], [ "10", "12", "14", "10", "3" ], [ "4", "8", "8", "30", "3" ], [ "22", "10", "24", "23", "5" ], [ "3", "4", "6", "27", "15" ], [ "4", "5", "13", "5", "6" ], [ "63", "0", "0", "0", "0" ], [ "6", "0", "0", "0", "0" ], [ "0", "0", "2", "3", "0" ] ] ] }, { "name": "Sp", "index": "9", "type": "nominal", "distinct": "27", "missing": "0", "distr": [ [ "co", "fr", "ma", "nd", "ni", "ob", "ov", "pu", "rd", "si", "mn", "ag", "bxs", "br", "el", "fa", "jo", "ka", "re", "sm", "ro", "nc", "am", "cr", "pa", "ra", "te" ], [ [ "4", "4", "7", "10", "2" ], [ "5", "5", "9", "24", "9" ], [ "0", "2", "1", "0", "0" ], [ "20", "2", "14", "36", "14" ], [ "0", "3", "5", "20", "3" ], [ "6", "2", "6", "19", "17" ], [ "11", "12", "16", "15", "8" ], [ "16", "0", "6", "9", "8" ], [ "15", "14", "6", "2", "0" ], [ "1", "1", "1", "5", "1" ], [ "1", "1", "0", "1", "0" ], [ "7", "2", "0", "0", "0" ], [ "3", "3", "7", "4", "0" ], [ "6", "14", "5", "1", "2" ], [ "4", "5", "2", "1", "0" ], [ "6", "5", "13", "20", "8" ], [ "4", "4", "1", "0", "0" ], [ "11", "8", "0", "0", "0" ], [ "7", "4", "17", "29", "25" ], [ "8", "6", "0", "0", "0" ], [ "1", "1", "0", "0", "0" ], [ "2", "3", "1", "0", "0" ], [ "19", "0", "7", "16", "6" ], [ "0", "5", "5", "1", "0" ], [ "3", "1", "1", "1", "2" ], [ "7", "0", "0", "0", "0" ], [ "13", "0", "0", "0", "0" ] ] ] }, { "name": "Year", "index": "8", "type": "numeric", "distinct": "5", "missing": "0", "min": "1980", "max": "1986", "mean": "1982", "stdev": "2" }, { "name": "Frosts", "index": "7", "type": "numeric", "distinct": "2", "missing": "0", "min": "-3", "max": "0", "mean": "-3", "stdev": "0" }, { "name": "Rainfall", "index": "6", "type": "numeric", "distinct": "10", "missing": "0", "min": "850", "max": "1750", "mean": "1096", "stdev": "145" }, { "name": "Altitude", "index": "5", "type": "numeric", "distinct": "9", "missing": "0", "min": "70", "max": "300", "mean": "172", "stdev": "59" }, { "name": "Latitude", "index": "4", "type": "nominal", "distinct": "12", "missing": "0", "distr": [ [ "39__38", "39__00", "40__11", "39__50", "40__57", "41__12", "40__36", "41__08", "41__16", "40__00", "39__43", "82__32" ], [ [ "0", "4", "7", "13", "6" ], [ "0", "5", "1", "11", "7" ], [ "4", "1", "3", "13", "1" ], [ "14", "14", "5", "14", "23" ], [ "31", "48", "47", "35", "31" ], [ "29", "12", "10", "14", "8" ], [ "4", "1", "19", "34", "6" ], [ "4", "8", "8", "30", "3" ], [ "22", "10", "24", "23", "5" ], [ "3", "4", "6", "27", "15" ], [ "63", "0", "0", "0", "0" ], [ "6", "0", "0", "0", "0" ] ] ] }, { "name": "Map_Ref", "index": "3", "type": "nominal", "distinct": "14", "missing": "0", "distr": [ [ "N135_382\/137", "N116_848\/985", "N145_874\/586", "N142_377\/957", "N158_344\/626", "N162_081\/300", "N158_343\/625", "N151_912\/221", "N162_097\/424", "N166_063\/197", "N146_273\/737", "N141_295\/063", "N98_539\/567", "N151_922\/226" ], [ [ "0", "4", "7", "13", "6" ], [ "0", "5", "1", "11", "7" ], [ "4", "1", "3", "13", "1" ], [ "14", "14", "5", "14", "23" ], [ "21", "34", "36", "31", "25" ], [ "29", "12", "10", "14", "8" ], [ "10", "14", "11", "4", "6" ], [ "4", "1", "17", "31", "6" ], [ "4", "8", "8", "30", "3" ], [ "22", "10", "24", "23", "5" ], [ "3", "4", "6", "27", "15" ], [ "63", "0", "0", "0", "0" ], [ "6", "0", "0", "0", "0" ], [ "0", "0", "2", "3", "0" ] ] ] }, { "name": "Locality", "index": "2", "type": "nominal", "distinct": "8", "missing": "0", "distr": [ [ "Central_Hawkes_Bay", "Northern_Hawkes_Bay", "Southern_Hawkes_Bay", "Central_Hawkes_Bay_(coastal)", "Central_Wairarapa", "South_Wairarapa", "Southern_Hawkes_Bay_(coastal)", "Central_Poverty_Bay" ], [ [ "63", "4", "7", "13", "6" ], [ "0", "5", "1", "11", "7" ], [ "8", "2", "22", "47", "7" ], [ "14", "14", "5", "14", "23" ], [ "31", "48", "47", "35", "31" ], [ "55", "30", "42", "67", "16" ], [ "3", "4", "6", "27", "15" ], [ "6", "0", "0", "0", "0" ] ] ] }, { "name": "Rep", "index": "1", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "22", "mean": "2", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }