{ "data_id": "24", "name": "splice", "exact_name": "splice", "version": 1, "version_label": "1", "description": "**Author**: Genbank \nDonor: G. Towell, M. Noordewier, and J. Shavlik \n**Source**: [Genbank 64.1](genbank.bio.net) - 1\/1\/92 \n**Please cite**: \n\nPrimate splice-junction gene sequences (DNA) with associated imperfect domain theory. All examples taken from Genbank 64.1. Categories \"ei\" and \"ie\" include every \"split-gene\" for primates in Genbank 64.1. Non-splice examples taken from sequences known not to include a splicing site.\n \nProblem Description: \nSplice junctions are points on a DNA sequence at which 'superfluous' DNA is removed during the process of protein creation in higher organisms. The problem posed in this dataset is to recognize, given a sequence of DNA, the boundaries between exons (the parts of the DNA sequence retained after splicing) and introns (the parts of the DNA sequence that are spliced out). This problem consists of two subtasks: recognizing exon\/intron boundaries (referred to as EI sites), and recognizing intron\/exon boundaries (IE sites). (In the biological community, IE borders are referred to as ''acceptors'' while EI borders are referred to as ''donors''.)\n \nThis dataset has been developed to help evaluate a \"hybrid\" learning algorithm (KBANN) that uses examples to inductively refine preexisting knowledge.\n \nAttributes: \n>\n 1 One of {n ei ie}, indicating the class.\n 2 The instance name.\n 3-62 The remaining 60 fields are the sequence, starting at \n position -30 and ending at position +30. Each of\n these fields is almost always filled by one of \n {a, g, t, c}. 
Other characters indicate ambiguity among\n the standard characters according to the following table:\n character: meaning\n D: A or G or T\n N: A or G or C or T\n S: C or G\n R: A or G\n\nNotes: \n* Instance_name is an identifier and should be ignored for modelling", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": null, "contributor": null, "date": "2014-04-06 23:22:49", "update_comment": "Instance_name is an identifier and should be ignored for modelling", "last_update": "2014-09-19 17:06:29", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/46\/dataset_46_splice.arff", "default_target_attribute": "Class", "row_id_attribute": null, "ignore_attribute": "Instance_name", "runs": 0, "suggest": { "input": [ "splice", "Donor: G. Towell, M. Noordewier, and J. Shavlik Primate splice-junction gene sequences (DNA) with associated imperfect domain theory. All examples taken from Genbank 64.1. Categories \"ei\" and \"ie\" include every \"split-gene\" for primates in Genbank 64.1. Non-splice examples taken from sequences known not to include a splicing site. Problem Description: Splice junctions are points on a DNA sequence at which 'superfluous' DNA is removed during the process of protein creation in higher organisms. 
Th " ], "weight": 5 }, "qualities": { "NumberOfInstances": 3190, "NumberOfFeatures": 61, "NumberOfClasses": 3, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 0, "NumberOfSymbolicFeatures": 61, "AutoCorrelation": 0.9993728441517717, "CfsSubsetEval_DecisionStumpAUC": 0.9645392222677037, "CfsSubsetEval_DecisionStumpErrRate": 0.06363636363636363, "CfsSubsetEval_DecisionStumpKappa": 0.8978122508210037, "CfsSubsetEval_NaiveBayesAUC": 0.9645392222677037, "CfsSubsetEval_NaiveBayesErrRate": 0.06363636363636363, "CfsSubsetEval_NaiveBayesKappa": 0.8978122508210037, "CfsSubsetEval_kNN1NAUC": 0.9645392222677037, "CfsSubsetEval_kNN1NErrRate": 0.06363636363636363, "CfsSubsetEval_kNN1NKappa": 0.8978122508210037, "ClassEntropy": 1.4801700696136337, "DecisionStumpAUC": 0.7717484305673256, "DecisionStumpErrRate": 0.3761755485893417, "DecisionStumpKappa": 0.4122311203046818, "Dimensionality": 0.019122257053291535, "EquivalentNumberOfAtts": 26.313211437704414, "J48.00001.AUC": 0.9590500108986266, "J48.00001.ErrRate": 0.06551724137931035, "J48.00001.Kappa": 0.8944375252739722, "J48.0001.AUC": 0.9590500108986266, "J48.0001.ErrRate": 0.06551724137931035, "J48.0001.Kappa": 0.8944375252739722, "J48.001.AUC": 0.9590500108986266, "J48.001.ErrRate": 0.06551724137931035, "J48.001.Kappa": 0.8944375252739722, "MajorityClassPercentage": 51.88087774294671, "MajorityClassSize": 1655, "MaxAttributeEntropy": 2.0085632801967233, "MaxKurtosisOfNumericAtts": null, "MaxMeansOfNumericAtts": null, "MaxMutualInformation": 0.38964063813375, "MaxNominalAttDistinctValues": 6, "MaxSkewnessOfNumericAtts": null, "MaxStdDevOfNumericAtts": null, "MeanAttributeEntropy": 1.9780144516767606, "MeanKurtosisOfNumericAtts": null, "MeanMeansOfNumericAtts": null, "MeanMutualInformation": 0.056251973390548826, "MeanNoiseToSignalRatio": 34.16346774083301, "MeanNominalAttDistinctValues": 4.754098360655737, "MeanSkewnessOfNumericAtts": null, "MeanStdDevOfNumericAtts": null, 
"MinAttributeEntropy": 1.6679869019048021, "MinKurtosisOfNumericAtts": null, "MinMeansOfNumericAtts": null, "MinMutualInformation": 0.00239174071595, "MinNominalAttDistinctValues": 3, "MinSkewnessOfNumericAtts": null, "MinStdDevOfNumericAtts": null, "MinorityClassPercentage": 24.043887147335425, "MinorityClassSize": 767, "NaiveBayesAUC": 0.9928619979725506, "NaiveBayesErrRate": 0.047021943573667714, "NaiveBayesKappa": 0.9235168869438932, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "PercentageOfMissingValues": 0, "PercentageOfNumericFeatures": 0, "PercentageOfSymbolicFeatures": 100, "Quartile1AttributeEntropy": 1.986921112054029, "Quartile1KurtosisOfNumericAtts": null, "Quartile1MeansOfNumericAtts": null, "Quartile1MutualInformation": 0.008114095339065, "Quartile1SkewnessOfNumericAtts": null, "Quartile1StdDevOfNumericAtts": null, "Quartile2AttributeEntropy": 1.9958149659372768, "Quartile2KurtosisOfNumericAtts": null, "Quartile2MeansOfNumericAtts": null, "Quartile2MutualInformation": 0.012445557396825, "Quartile2SkewnessOfNumericAtts": null, "Quartile2StdDevOfNumericAtts": null, "Quartile3AttributeEntropy": 1.9985747676028534, "Quartile3KurtosisOfNumericAtts": null, "Quartile3MeansOfNumericAtts": null, "Quartile3MutualInformation": 0.06388006173431, "Quartile3SkewnessOfNumericAtts": null, "Quartile3StdDevOfNumericAtts": null, "REPTreeDepth1AUC": 0.9624981083963462, "REPTreeDepth1ErrRate": 0.09435736677115987, "REPTreeDepth1Kappa": 0.8488820745392759, "REPTreeDepth2AUC": 0.9624981083963462, "REPTreeDepth2ErrRate": 0.09435736677115987, "REPTreeDepth2Kappa": 0.8488820745392759, "REPTreeDepth3AUC": 0.9624981083963462, "REPTreeDepth3ErrRate": 0.09435736677115987, "REPTreeDepth3Kappa": 0.8488820745392759, "RandomTreeDepth1AUC": 0.7723490181560075, "RandomTreeDepth1ErrRate": 0.31191222570532917, "RandomTreeDepth1Kappa": 0.5030951953788269, "RandomTreeDepth2AUC": 0.7723490181560075, "RandomTreeDepth2ErrRate": 
0.31191222570532917, "RandomTreeDepth2Kappa": 0.5030951953788269, "RandomTreeDepth3AUC": 0.7723490181560075, "RandomTreeDepth3ErrRate": 0.31191222570532917, "RandomTreeDepth3Kappa": 0.5030951953788269, "StdvNominalAttDistinctValues": 0.537144850262882, "kNN1NAUC": 0.8617257940278134, "kNN1NErrRate": 0.2689655172413793, "kNN1NKappa": 0.5976262917909895 }, "tags": [ { "tag": "study_14", "uploader": "1" }, { "tag": "study_1", "uploader": "0" }, { "tag": "study_395", "uploader": "0" }, { "tag": "study_709", "uploader": "0" }, { "tag": "study_721", "uploader": "0" }, { "tag": "study_101", "uploader": "0" }, { "tag": "study_114", "uploader": "0" }, { "tag": "study_722", "uploader": "0" }, { "tag": "study_509", "uploader": "0" }, { "tag": "study_722", "uploader": "0" }, { "tag": "study_114", "uploader": "0" }, { "tag": "study_395", "uploader": "0" }, { "tag": "study_380", "uploader": "0" }, { "tag": "study_114", "uploader": "0" }, { "tag": "study_117", "uploader": "0" }, { "tag": "study_249", "uploader": "0" }, { "tag": "study_560", "uploader": "0" } ], "features": [ { "name": "Class", "index": "61", "type": "nominal", "distinct": "3", "missing": "0", "target": "1", "distr": [ [ "EI", "IE", "N" ], [ [ "767", "0", "0" ], [ "0", "768", "0" ], [ "0", "0", "1655" ] ] ] }, { "name": "attribute_32", "index": "32", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "T", "N", "C", "G", "A" ], [ [ "759", "249", "420" ], [ "1", "0", "0" ], [ "4", "164", "411" ], [ "1", "175", "400" ], [ "2", "180", "424" ] ] ] }, { "name": "attribute_31", "index": "31", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "N", "C", "T", "A" ], [ [ "765", "365", "462" ], [ "1", "0", "0" ], [ "1", "110", "403" ], [ "0", "75", "413" ], [ "0", "218", "377" ] ] ] }, { "name": "attribute_33", "index": "33", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "A", "N", "T" ], [ [ "17", "204", "416" ], [ "356", "178", "417" ], [ "378", "172", "432" ], [ 
"2", "0", "1" ], [ "14", "214", "389" ] ] ] }, { "name": "attribute_34", "index": "34", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "T", "A", "C", "G", "N" ], [ [ "46", "169", "392" ], [ "553", "173", "395" ], [ "69", "219", "422" ], [ "98", "207", "446" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_35", "index": "35", "type": "nominal", "distinct": "6", "missing": "0", "distr": [ [ "G", "T", "A", "C", "N", "R" ], [ [ "657", "150", "394" ], [ "37", "203", "425" ], [ "35", "180", "399" ], [ "37", "234", "437" ], [ "1", "0", "0" ], [ "0", "1", "0" ] ] ] }, { "name": "attribute_36", "index": "36", "type": "nominal", "distinct": "6", "missing": "0", "distr": [ [ "T", "C", "A", "G", "N", "S" ], [ [ "347", "181", "403" ], [ "126", "239", "445" ], [ "121", "154", "407" ], [ "172", "193", "400" ], [ "1", "0", "0" ], [ "0", "1", "0" ] ] ] }, { "name": "attribute_37", "index": "37", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "T", "C", "A", "G", "N" ], [ [ "122", "140", "409" ], [ "161", "197", "378" ], [ "183", "203", "427" ], [ "300", "228", "440" ], [ "1", "0", "1" ] ] ] }, { "name": "attribute_38", "index": "38", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "T", "A", "N" ], [ [ "256", "203", "407" ], [ "202", "212", "408" ], [ "170", "169", "409" ], [ "137", "184", "429" ], [ "2", "0", "2" ] ] ] }, { "name": "attribute_39", "index": "39", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "T", "A", "N" ], [ [ "256", "201", "422" ], [ "220", "216", "404" ], [ "164", "172", "421" ], [ "126", "179", "408" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_40", "index": "40", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "A", "G", "C", "T", "N" ], [ [ "116", "190", "394" ], [ "272", "217", "436" ], [ "196", "198", "425" ], [ "182", "163", "400" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_41", "index": "41", "type": "nominal", "distinct": "5", "missing": 
"0", "distr": [ [ "A", "C", "G", "T", "N" ], [ [ "118", "195", "406" ], [ "201", "183", "410" ], [ "286", "227", "401" ], [ "161", "163", "438" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_42", "index": "42", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "C", "A", "T", "N" ], [ [ "260", "211", "445" ], [ "215", "199", "402" ], [ "132", "177", "393" ], [ "159", "181", "415" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_43", "index": "43", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "A", "C", "T", "N" ], [ [ "232", "219", "459" ], [ "126", "194", "400" ], [ "226", "227", "392" ], [ "182", "128", "403" ], [ "1", "0", "1" ] ] ] }, { "name": "attribute_44", "index": "44", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "C", "T", "A", "N" ], [ [ "225", "177", "436" ], [ "213", "211", "417" ], [ "169", "213", "398" ], [ "159", "167", "404" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_45", "index": "45", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "T", "A", "G", "N" ], [ [ "214", "238", "433" ], [ "194", "125", "406" ], [ "158", "215", "384" ], [ "200", "190", "432" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_46", "index": "46", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "T", "A", "N" ], [ [ "216", "247", "381" ], [ "233", "191", "447" ], [ "177", "138", "391" ], [ "140", "192", "436" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_47", "index": "47", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "T", "C", "G", "A", "N" ], [ [ "200", "156", "414" ], [ "172", "200", "397" ], [ "266", "238", "411" ], [ "128", "174", "433" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_48", "index": "48", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "T", "G", "C", "A", "N" ], [ [ "169", "141", "406" ], [ "256", "247", "409" ], [ "184", "215", "401" ], [ "157", "165", "439" ], [ "1", "0", "0" ] ] ] }, { 
"name": "attribute_49", "index": "49", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "T", "A", "N" ], [ [ "223", "226", "400" ], [ "252", "215", "478" ], [ "170", "131", "368" ], [ "120", "196", "409" ], [ "2", "0", "0" ] ] ] }, { "name": "attribute_50", "index": "50", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "C", "A", "T", "N" ], [ [ "245", "194", "397" ], [ "202", "188", "417" ], [ "141", "199", "438" ], [ "176", "187", "403" ], [ "3", "0", "0" ] ] ] }, { "name": "attribute_51", "index": "51", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "A", "G", "C", "T", "N" ], [ [ "148", "187", "360" ], [ "222", "236", "444" ], [ "210", "213", "458" ], [ "186", "132", "393" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_52", "index": "52", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "T", "A", "C", "N" ], [ [ "247", "205", "422" ], [ "163", "163", "383" ], [ "160", "217", "441" ], [ "196", "183", "409" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_53", "index": "53", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "T", "A", "N" ], [ [ "192", "214", "426" ], [ "247", "204", "423" ], [ "176", "167", "407" ], [ "151", "183", "399" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_54", "index": "54", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "T", "A", "N" ], [ [ "185", "236", "397" ], [ "269", "234", "431" ], [ "180", "140", "422" ], [ "132", "158", "405" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_55", "index": "55", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "A", "C", "G", "T", "N" ], [ [ "137", "227", "438" ], [ "226", "214", "395" ], [ "242", "187", "430" ], [ "161", "140", "392" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_56", "index": "56", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "C", "T", "A", "N" ], [ [ "242", "198", "398" ], [ "179", "233", "419" 
], [ "175", "159", "429" ], [ "170", "178", "408" ], [ "1", "0", "1" ] ] ] }, { "name": "attribute_57", "index": "57", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "T", "C", "G", "A", "N" ], [ [ "184", "166", "398" ], [ "205", "169", "416" ], [ "231", "229", "448" ], [ "146", "204", "393" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_58", "index": "58", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "A", "G", "T", "N" ], [ [ "218", "205", "447" ], [ "134", "200", "386" ], [ "235", "222", "409" ], [ "179", "141", "413" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_59", "index": "59", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "T", "G", "C", "A", "N" ], [ [ "162", "187", "406" ], [ "217", "168", "404" ], [ "218", "200", "442" ], [ "169", "213", "403" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_60", "index": "60", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "C", "T", "A", "N" ], [ [ "256", "282", "415" ], [ "166", "183", "436" ], [ "197", "144", "389" ], [ "147", "159", "415" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_16", "index": "16", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "G", "C", "T", "A" ], [ [ "156", "96", "432" ], [ "241", "289", "419" ], [ "174", "300", "383" ], [ "196", "83", "421" ] ] ] }, { "name": "attribute_1", "index": "1", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "A", "G", "T", "D" ], [ [ "201", "236", "398" ], [ "169", "154", "420" ], [ "233", "183", "460" ], [ "164", "194", "377" ], [ "0", "1", "0" ] ] ] }, { "name": "attribute_2", "index": "2", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "A", "T", "D" ], [ [ "233", "236", "389" ], [ "195", "173", "426" ], [ "178", "162", "439" ], [ "161", "197", "400" ], [ "0", "0", "1" ] ] ] }, { "name": "attribute_3", "index": "3", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "A", "G", "T", "C" ], [ [ 
"174", "158", "380" ], [ "222", "184", "435" ], [ "165", "193", "403" ], [ "206", "233", "437" ] ] ] }, { "name": "attribute_4", "index": "4", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "G", "C", "A", "T" ], [ [ "210", "155", "437" ], [ "217", "265", "402" ], [ "177", "152", "424" ], [ "163", "196", "392" ] ] ] }, { "name": "attribute_5", "index": "5", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "C", "T", "A", "G" ], [ [ "205", "273", "387" ], [ "191", "220", "394" ], [ "195", "162", "444" ], [ "176", "113", "430" ] ] ] }, { "name": "attribute_6", "index": "6", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "T", "C", "G", "A" ], [ [ "150", "221", "389" ], [ "200", "255", "443" ], [ "273", "139", "416" ], [ "144", "153", "407" ] ] ] }, { "name": "attribute_7", "index": "7", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "G", "A", "C", "T" ], [ [ "207", "145", "428" ], [ "194", "171", "418" ], [ "213", "225", "420" ], [ "153", "227", "389" ] ] ] }, { "name": "attribute_8", "index": "8", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "C", "A", "G", "T" ], [ [ "226", "238", "414" ], [ "169", "199", "422" ], [ "192", "128", "411" ], [ "180", "203", "408" ] ] ] }, { "name": "attribute_9", "index": "9", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "A", "C", "G", "T" ], [ [ "159", "171", "419" ], [ "227", "258", "424" ], [ "241", "90", "418" ], [ "140", "249", "394" ] ] ] }, { "name": "attribute_10", "index": "10", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "T", "G", "C", "A" ], [ [ "177", "271", "401" ], [ "223", "110", "433" ], [ "148", "253", "407" ], [ "219", "134", "414" ] ] ] }, { "name": "attribute_11", "index": "11", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "C", "G", "A", "T" ], [ [ "206", "218", "399" ], [ "228", "155", "395" ], [ "150", "141", "426" ], [ "183", "254", "435" ] ] ] }, { "name": 
"attribute_12", "index": "12", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "A", "G", "C", "T" ], [ [ "152", "125", "391" ], [ "240", "140", "427" ], [ "217", "253", "460" ], [ "158", "250", "377" ] ] ] }, { "name": "attribute_13", "index": "13", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "C", "A", "G", "T" ], [ [ "183", "281", "414" ], [ "175", "111", "452" ], [ "227", "123", "402" ], [ "182", "253", "387" ] ] ] }, { "name": "attribute_14", "index": "14", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "A", "G", "T", "C", "N" ], [ [ "211", "117", "469" ], [ "197", "117", "398" ], [ "156", "242", "384" ], [ "203", "292", "403" ], [ "0", "0", "1" ] ] ] }, { "name": "attribute_15", "index": "15", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "G", "C", "T", "A" ], [ [ "199", "115", "454" ], [ "252", "301", "406" ], [ "141", "251", "406" ], [ "175", "101", "389" ] ] ] }, { "name": "Instance_name", "index": "0", "type": "nominal", "distinct": "3178", "missing": "0", "ignore": "1", "distr": [] }, { "name": "attribute_17", "index": "17", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "A", "G", "T", "C" ], [ [ "168", "75", "427" ], [ "212", "103", "386" ], [ "148", "323", "440" ], [ "239", "267", "402" ] ] ] }, { "name": "attribute_18", "index": "18", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "G", "T", "A", "C" ], [ [ "209", "100", "437" ], [ "154", "337", "415" ], [ "187", "63", "399" ], [ "217", "268", "404" ] ] ] }, { "name": "attribute_19", "index": "19", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "A", "C", "T", "N" ], [ [ "186", "88", "438" ], [ "214", "54", "389" ], [ "209", "286", "426" ], [ "158", "340", "401" ], [ "0", "0", "1" ] ] ] }, { "name": "attribute_20", "index": "20", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "A", "T", "N" ], [ [ "222", "280", "387" ], [ "182", "84", "405" ], [ 
"196", "50", "447" ], [ "166", "354", "415" ], [ "1", "0", "1" ] ] ] }, { "name": "attribute_21", "index": "21", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "T", "A", "N" ], [ [ "223", "281", "434" ], [ "223", "70", "404" ], [ "156", "349", "408" ], [ "164", "68", "408" ], [ "1", "0", "1" ] ] ] }, { "name": "attribute_22", "index": "22", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "A", "C", "T", "G", "N" ], [ [ "208", "78", "416" ], [ "225", "273", "425" ], [ "141", "334", "373" ], [ "192", "83", "441" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_23", "index": "23", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "C", "A", "T", "N" ], [ [ "187", "88", "427" ], [ "219", "324", "425" ], [ "201", "41", "420" ], [ "159", "315", "383" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_24", "index": "24", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "G", "A", "T", "N" ], [ [ "189", "346", "417" ], [ "247", "55", "404" ], [ "166", "65", "407" ], [ "164", "302", "427" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_25", "index": "25", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "T", "A", "C", "N" ], [ [ "197", "44", "463" ], [ "184", "330", "373" ], [ "212", "37", "403" ], [ "173", "357", "416" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_26", "index": "26", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "A", "G", "C", "T", "N" ], [ [ "193", "55", "419" ], [ "186", "54", "420" ], [ "186", "309", "397" ], [ "201", "350", "419" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_27", "index": "27", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "C", "T", "A", "N" ], [ [ "243", "193", "419" ], [ "220", "237", "426" ], [ "136", "153", "393" ], [ "167", "185", "417" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_28", "index": "28", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "C", "A", 
"G", "T", "N" ], [ [ "290", "606", "413" ], [ "249", "18", "429" ], [ "130", "4", "442" ], [ "97", "140", "371" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_29", "index": "29", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "A", "G", "C", "T", "N" ], [ [ "448", "765", "400" ], [ "113", "1", "409" ], [ "106", "1", "429" ], [ "99", "1", "417" ], [ "1", "0", "0" ] ] ] }, { "name": "attribute_30", "index": "30", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "G", "C", "A", "T", "N" ], [ [ "625", "766", "431" ], [ "23", "1", "418" ], [ "61", "1", "412" ], [ "57", "0", "394" ], [ "1", "0", "0" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }