{ "data_id": "42159", "name": "colleges", "exact_name": "colleges", "version": 11, "version_label": "0.1", "description": "Regroups information for about 7800 different US colleges. Including geographical information, stats about the population attending and post graduation career earnings.", "format": "arff", "uploader": "Thomas Schmitt", "uploader_id": 3422, "visibility": "public", "creator": "\"NA\"", "contributor": null, "date": "2019-10-04 12:02:18", "update_comment": null, "last_update": "2019-10-04 12:02:18", "licence": "NA", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/21754533\/dataset", "default_target_attribute": "percent_pell_grant", "row_id_attribute": "UNITID", "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "colleges", "Regroups information for about 7800 different US colleges. Including geographical information, stats about the population attending and post graduation career earnings. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 7063, "NumberOfFeatures": 50, "NumberOfClasses": 0, "NumberOfMissingValues": 125494, "NumberOfInstancesWithMissingValues": 7063, "NumberOfNumericFeatures": 33, "NumberOfSymbolicFeatures": 6, "ClassEntropy": null, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "Dimensionality": 0.007079144839303412, "MeanNominalAttDistinctValues": 1019.8333333333334, "Quartile2KurtosisOfNumericAtts": 1.446540734192971, "EquivalentNumberOfAtts": null, "MeanSkewnessOfNumericAtts": 1.653570087163097, "Quartile2MeansOfNumericAtts": 279.3476395081724, "MajorityClassPercentage": null, "MeanStdDevOfNumericAtts": 3345.131176249055, "Quartile2MutualInformation": null, "MajorityClassSize": null, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": 0.9139097082115994, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.3282358630683941, "PercentageOfBinaryFeatures": 0, "Quartile2StdDevOfNumericAtts": 42.7793967152446, "MaxKurtosisOfNumericAtts": 358.99040621416003, "MinMeansOfNumericAtts": -90.26391797351585, "PercentageOfInstancesWithMissingValues": 100, "Quartile3AttributeEntropy": null, "MaxMeansOfNumericAtts": 36444.77191665094, "MinMutualInformation": null, "PercentageOfMissingValues": 35.5356080985417, "Quartile3KurtosisOfNumericAtts": 6.213142733135105, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 3, "PercentageOfNumericFeatures": 66, "Quartile3MeansOfNumericAtts": 14571.281846748829, "MaxNominalAttDistinctValues": 6039, "MinSkewnessOfNumericAtts": -0.9881644118945149, "PercentageOfSymbolicFeatures": 12, "Quartile3MutualInformation": null, "MaxSkewnessOfNumericAtts": 12.989876646749993, "MinStdDevOfNumericAtts": 0.07177556257880363, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 1.696700706818044, "MaxStdDevOfNumericAtts": 13426.395583555071, "MinorityClassPercentage": null, "Quartile1KurtosisOfNumericAtts": 0.5424441820990629, "Quartile3StdDevOfNumericAtts": 8295.298850516294, "MeanAttributeEntropy": null, "MinorityClassSize": null, "Quartile1MeansOfNumericAtts": 0.5259969074607409, "StdvNominalAttDistinctValues": 2458.9747795914186, "MeanKurtosisOfNumericAtts": 21.5028611189546, "NumberOfBinaryFeatures": 0, "Quartile1MutualInformation": null, "MeanMeansOfNumericAtts": 7182.8381524991755, "Quartile1SkewnessOfNumericAtts": 0.46658009966467123, "AutoCorrelation": 0.7872184225431891, "MeanMutualInformation": null, "Quartile1StdDevOfNumericAtts": 0.2770741963374991 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "percent_pell_grant", "index": "30", "type": "numeric", "distinct": "4502", "missing": "0", "target": "1", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "UNITID", "index": "0", "type": "numeric", "distinct": "7063", "missing": "0", "identifier": "1", "min": "100654", "max": "483212", "mean": "283687", "stdev": "132384" }, { "name": "school_name", "index": "1", "type": "string", "distinct": "6961", "missing": "0" }, { "name": "city", "index": "2", "type": "string", "distinct": "2461", "missing": "0" }, { "name": "state", "index": "3", "type": "nominal", "distinct": "59", "missing": "0", "distr": [] }, { "name": "zip", "index": "4", "type": "nominal", "distinct": "6039", "missing": "0", "distr": [] }, { "name": "school_webpage", "index": "5", "type": "string", "distinct": "5710", "missing": "56" }, { "name": "latitude", "index": "6", "type": "numeric", "distinct": "6508", "missing": "342", "min": "-14", "max": "71", "mean": "37", "stdev": "6" }, { "name": "longitude", "index": "7", "type": "numeric", "distinct": "6598", "missing": "342", "min": "-171", "max": "171", "mean": "-90", "stdev": "18" }, { "name": "admission_rate", "index": "8", "type": "numeric", "distinct": "1739", "missing": "4847", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "sat_verbal_midrange", "index": "9", "type": "numeric", "distinct": "164", "missing": "5763", "min": "290", "max": "760", "mean": "522", "stdev": "68" }, { "name": "sat_math_midrange", "index": "10", "type": "numeric", "distinct": "163", "missing": "5749", "min": "310", "max": "785", "mean": "531", "stdev": "72" }, { "name": "sat_writing_midrange", "index": "11", "type": "numeric", "distinct": "131", "missing": "6270", "min": "350", "max": "755", "mean": "521", "stdev": "78" }, { "name": "act_combined_midrange", "index": "12", "type": "numeric", "distinct": "22", "missing": "5722", "min": "2", "max": "34", "mean": "23", "stdev": "3" }, { "name": "act_english_midrange", "index": "13", "type": "numeric", "distinct": "24", "missing": "5899", "min": "2", "max": "34", "mean": "23", "stdev": "4" }, { "name": "act_math_midrange", "index": "14", "type": "numeric", "distinct": "24", "missing": "5898", "min": "2", "max": "35", "mean": "23", "stdev": "3" }, { "name": "act_writing_midrange", "index": "15", "type": "numeric", "distinct": "8", "missing": "6763", "min": "5", "max": "12", "mean": "8", "stdev": "1" }, { "name": "sat_total_average", "index": "16", "type": "numeric", "distinct": "477", "missing": "5644", "min": "666", "max": "1534", "mean": "1057", "stdev": "132" }, { "name": "undergrad_size", "index": "17", "type": "numeric", "distinct": "3020", "missing": "1", "min": "0", "max": "166816", "mean": "2341", "stdev": "5452" }, { "name": "percent_white", "index": "18", "type": "numeric", "distinct": "4453", "missing": "1", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "percent_black", "index": "19", "type": "numeric", "distinct": "3277", "missing": "1", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "percent_hispanic", "index": "20", "type": "numeric", "distinct": "2802", "missing": "1", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "percent_asian", "index": "21", "type": "numeric", "distinct": "1239", "missing": "1", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "percent_part_time", "index": "22", "type": "numeric", "distinct": "3466", "missing": "6", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "average_cost_academic_year", "index": "23", "type": "numeric", "distinct": "3802", "missing": "2928", "min": "4157", "max": "74473", "mean": "24353", "stdev": "12174" }, { "name": "average_cost_program_year", "index": "24", "type": "numeric", "distinct": "2349", "missing": "4522", "min": "3057", "max": "89422", "mean": "18495", "stdev": "6355" }, { "name": "tuition_(instate)", "index": "25", "type": "numeric", "distinct": "2981", "missing": "2926", "min": "80", "max": "64900", "mean": "13948", "stdev": "10859" }, { "name": "tuition_(out_of_state)", "index": "26", "type": "numeric", "distinct": "3039", "missing": "2926", "min": "80", "max": "64900", "mean": "16442", "stdev": "9893" }, { "name": "spend_per_student", "index": "27", "type": "numeric", "distinct": "5294", "missing": "11", "min": "0", "max": "307089", "mean": "6522", "stdev": "7825" }, { "name": "faculty_salary", "index": "28", "type": "numeric", "distinct": "3297", "missing": "2672", "min": "269", "max": "23611", "mean": "5928", "stdev": "2194" }, { "name": "percent_part_time_faculty", "index": "29", "type": "numeric", "distinct": "2332", "missing": "3161", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "completion_rate", "index": "31", "type": "numeric", "distinct": "1912", "missing": "4617", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "average_age_of_entry", "index": "32", "type": "numeric", "distinct": "0", "missing": "7063", "min": "2147483647", "max": "0", "mean": "0", "stdev": "0" }, { "name": "percent_married", "index": "33", "type": "numeric", "distinct": "0", "missing": "7063", "min": "2147483647", "max": "0", "mean": "0", "stdev": "0" }, { "name": "percent_veteran", "index": "34", "type": "numeric", "distinct": "0", "missing": "7063", "min": "2147483647", "max": "0", "mean": "0", "stdev": "0" }, { "name": "predominant_degree", "index": "35", "type": "nominal", "distinct": "3", "missing": "75", "distr": [] }, { "name": "highest_degree", "index": "36", "type": "nominal", "distinct": "5", "missing": "0", "distr": [] }, { "name": "ownership", "index": "37", "type": "nominal", "distinct": "3", "missing": "0", "distr": [] }, { "name": "region", "index": "38", "type": "nominal", "distinct": "10", "missing": "0", "distr": [] }, { "name": "gender", "index": "39", "type": "string", "distinct": "3", "missing": "0" }, { "name": "carnegie_basic_classification", "index": "40", "type": "string", "distinct": "33", "missing": "2986" }, { "name": "carnegie_undergraduate", "index": "41", "type": "string", "distinct": "13", "missing": "3506" }, { "name": "carnegie_size", "index": "42", "type": "string", "distinct": "17", "missing": "3505" }, { "name": "religious_affiliation", "index": "43", "type": "string", "distinct": "55", "missing": "6260" }, { "name": "percent_female", "index": "44", "type": "string", "distinct": "102", "missing": "1510" }, { "name": "agege24", "index": "45", "type": "string", "distinct": "100", "missing": "1510" }, { "name": "faminc", "index": "46", "type": "string", "distinct": "4778", "missing": "1510" }, { "name": "mean_earnings_6_years", "index": "47", "type": "numeric", "distinct": "494", "missing": "1451", "min": "9300", "max": "106900", "mean": "29280", "stdev": "10138" }, { "name": "median_earnings_6_years", "index": "48", "type": "numeric", "distinct": "489", "missing": "1451", "min": "7000", "max": "117400", "mean": "26519", "stdev": "9705" }, { "name": "mean_earnings_10_years", "index": "49", "type": "numeric", "distinct": "607", "missing": "1736", "min": "12300", "max": "162000", "mean": "36445", "stdev": "13426" }, { "name": "median_earnings_10_years", "index": "50", "type": "numeric", "distinct": "568", "missing": "1736", "min": "8400", "max": "121500", "mean": "32555", "stdev": "11947" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }