{ "data_id": "40701", "name": "churn", "exact_name": "churn", "version": 1, "version_label": null, "description": "**Author**: Unknown \r\n**Source**: [PMLB](https:\/\/github.com\/EpistasisLab\/penn-ml-benchmarks\/tree\/master\/datasets\/classification), [BigML](https:\/\/bigml.com\/user\/francisco\/gallery\/dataset\/5163ad540c0b5e5b22000383), Supposedly from UCI but I can't find it there. \r\n**Please cite**: \r\n\r\nA dataset relating characteristics of telephony account features and usage and whether or not the customer churned. Originally used in [Discovering Knowledge in Data: An Introduction to Data Mining](http:\/\/secs.ac.in\/wp-content\/CSE_PORTAL\/DataMining_Daniel.pdf).", "format": "ARFF", "uploader": "Pieter Gijsbers", "uploader_id": 869, "visibility": "public", "creator": null, "contributor": null, "date": "2017-04-06 12:37:40", "update_comment": null, "last_update": "2017-04-06 12:37:40", "licence": "public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/4965302\/churn.arff", "default_target_attribute": "class", "row_id_attribute": null, "ignore_attribute": null, "runs": 7512, "suggest": { "input": [ "churn", "A dataset relating characteristics of telephony account features and usage and whether or not the customer churned. Originally used in [Discovering Knowledge in Data: An Introduction to Data Mining](http:\/\/secs.ac.in\/wp-content\/CSE_PORTAL\/DataMining_Daniel.pdf). \n" ], "weight": 5 }, "qualities": { "NumberOfInstances": 5000, "NumberOfFeatures": 21, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 16, "NumberOfSymbolicFeatures": 5, "MinSkewnessOfNumericAtts": -0.21028611467847197, "PercentageOfSymbolicFeatures": 23.809523809523807, "Quartile3MutualInformation": 0.0467752151671025, "MaxNominalAttDistinctValues": 10, "MinStdDevOfNumericAtts": 0.7455137072660346, "Quartile1AttributeEntropy": 0.5471325281256134, "Quartile3SkewnessOfNumericAtts": 0.019315373507701978, "MaxSkewnessOfNumericAtts": 1.3606924794023325, "MinorityClassPercentage": 14.14, "Quartile1KurtosisOfNumericAtts": -0.021262334366557556, "Quartile3StdDevOfNumericAtts": 47.81948183011039, "MaxStdDevOfNumericAtts": 1443.5200033252052, "MinorityClassSize": 707, "Quartile1MeansOfNumericAtts": 9.328744, "StdvNominalAttDistinctValues": 3.492849839314596, "MeanAttributeEntropy": 1.2659352523597343, "NumberOfBinaryFeatures": 3, "Quartile1MutualInformation": 0.00251891414912, "MeanKurtosisOfNumericAtts": 0.18476979395658538, "Quartile1SkewnessOfNumericAtts": -0.04852515449147719, "MeanMeansOfNumericAtts": 224.32242362499997, "Quartile1StdDevOfNumericAtts": 3.1452576112172346, "AutoCorrelation": 0.7583516703340668, "MeanMutualInformation": 0.024132744080242498, "MeanNoiseToSignalRatio": 51.457161446308824, "Quartile2AttributeEntropy": 1.1672980918836702, "ClassEntropy": 0.5878935751446988, "MeanNominalAttDistinctValues": 3.8, "Quartile2KurtosisOfNumericAtts": 0.08236840614015817, "Dimensionality": 0.0042, "MeanSkewnessOfNumericAtts": 0.1395287334036911, "Quartile2MeansOfNumericAtts": 65.284434, "EquivalentNumberOfAtts": 24.360825821958965, "MeanStdDevOfNumericAtts": 109.24068657540887, "Quartile2MutualInformation": 0.023104102924505, "MajorityClassPercentage": 85.86, "MinAttributeEntropy": 0.45164043671574877, "Quartile2SkewnessOfNumericAtts": -0.011004011473661496, "MajorityClassSize": 4293,
"MinKurtosisOfNumericAtts": -1.1999999999999262, "PercentageOfBinaryFeatures": 14.285714285714285, "Quartile2StdDevOfNumericAtts": 17.314988016366375, "MaxAttributeEntropy": 2.2775043889558475, "MinMeansOfNumericAtts": 2.7711959999999998, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 2.083375137069919, "MaxKurtosisOfNumericAtts": 3.2681836469481524, "MinMutualInformation": 8.063806707e-5, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 0.19398732998733603, "MaxMeansOfNumericAtts": 2499.5, "MinNominalAttDistinctValues": 2, "PercentageOfNumericFeatures": 76.19047619047619, "Quartile3MeansOfNumericAtts": 160.28132499999998, "MaxMutualInformation": 0.05024213240489 }, "tags": [ { "tag": "Computer Systems", "uploader": "38960" }, { "tag": "Machine Learning", "uploader": "38960" }, { "tag": "OpenML-CC18", "uploader": "1" }, { "tag": "study_135", "uploader": "5824" }, { "tag": "study_144", "uploader": "5824" }, { "tag": "study_98", "uploader": "1935" }, { "tag": "study_99", "uploader": "1" }, { "tag": "study_293", "uploader": "0" }, { "tag": "study_270", "uploader": "0" }, { "tag": "study_271", "uploader": "0" }, { "tag": "study_253", "uploader": "0" }, { "tag": "study_258", "uploader": "0" }, { "tag": "study_285", "uploader": "0" }, { "tag": "study_275", "uploader": "0" } ], "features": [ { "name": "class", "index": "20", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "0", "1" ], [ [ "4293", "0" ], [ "0", "707" ] ] ] }, { "name": "state", "index": "0", "type": "numeric", "distinct": "51", "missing": "0", "min": "0", "max": "50", "mean": "26", "stdev": "15" }, { "name": "account_length", "index": "1", "type": "numeric", "distinct": "218", "missing": "0", "min": "1", "max": "243", "mean": "100", "stdev": "40" }, { "name": "area_code", "index": "2", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "408", "415", "510" ], [ [ "1082", "177" ], [ "2149", "346" ], [ "1062", "184" ] ] ] 
}, { "name": "phone_number", "index": "3", "type": "numeric", "distinct": "5000", "missing": "0", "min": "0", "max": "4999", "mean": "2500", "stdev": "1444" }, { "name": "international_plan", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "4019", "508" ], [ "274", "199" ] ] ] }, { "name": "voice_mail_plan", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "3072", "605" ], [ "1221", "102" ] ] ] }, { "name": "number_vmail_messages", "index": "6", "type": "numeric", "distinct": "48", "missing": "0", "min": "0", "max": "52", "mean": "8", "stdev": "14" }, { "name": "total_day_minutes", "index": "7", "type": "numeric", "distinct": "1961", "missing": "0", "min": "0", "max": "352", "mean": "180", "stdev": "54" }, { "name": "total_day_calls", "index": "8", "type": "numeric", "distinct": "123", "missing": "0", "min": "0", "max": "165", "mean": "100", "stdev": "20" }, { "name": "total_day_charge", "index": "9", "type": "numeric", "distinct": "1961", "missing": "0", "min": "0", "max": "60", "mean": "31", "stdev": "9" }, { "name": "total_eve_minutes", "index": "10", "type": "numeric", "distinct": "1879", "missing": "0", "min": "0", "max": "364", "mean": "201", "stdev": "51" }, { "name": "total_eve_calls", "index": "11", "type": "numeric", "distinct": "126", "missing": "0", "min": "0", "max": "170", "mean": "100", "stdev": "20" }, { "name": "total_eve_charge", "index": "12", "type": "numeric", "distinct": "1659", "missing": "0", "min": "0", "max": "31", "mean": "17", "stdev": "4" }, { "name": "total_night_minutes", "index": "13", "type": "numeric", "distinct": "1853", "missing": "0", "min": "0", "max": "395", "mean": "200", "stdev": "51" }, { "name": "total_night_calls", "index": "14", "type": "numeric", "distinct": "131", "missing": "0", "min": "0", "max": "175", "mean": "100", "stdev": "20" }, { "name": "total_night_charge", "index": "15", "type": "numeric", "distinct": "1028", 
"missing": "0", "min": "0", "max": "18", "mean": "9", "stdev": "2" }, { "name": "total_intl_minutes", "index": "16", "type": "numeric", "distinct": "170", "missing": "0", "min": "0", "max": "20", "mean": "10", "stdev": "3" }, { "name": "total_intl_calls", "index": "17", "type": "numeric", "distinct": "21", "missing": "0", "min": "0", "max": "20", "mean": "4", "stdev": "2" }, { "name": "total_intl_charge", "index": "18", "type": "numeric", "distinct": "170", "missing": "0", "min": "0", "max": "5", "mean": "3", "stdev": "1" }, { "name": "number_customer_service_calls", "index": "19", "type": "nominal", "distinct": "10", "missing": "0", "distr": [ [ "0", "1", "2", "3", "4", "5", "6", "7", "8", "9" ], [ [ "902", "121" ], [ "1596", "190" ], [ "1005", "122" ], [ "592", "73" ], [ "141", "111" ], [ "38", "58" ], [ "12", "22" ], [ "6", "7" ], [ "1", "1" ], [ "0", "2" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 2, "nr_of_downloads": 9, "total_downloads": 11, "reach": 11, "reuse": 25, "impact_of_reuse": 0, "reach_of_reuse": 2, "impact": 26 }