{ "data_id": "41492", "name": "youtube", "exact_name": "youtube", "version": 2, "version_label": null, "description": "The YouTube personality dataset consists of a collection of behavioral features, speech transcriptions, and personality impression scores for a set of 404 YouTube vloggers that explicitly show themselves in front of a webcam talking about a variety of topics including personal issues, politics, movies, books, etc. There is no content-related restriction and the language used in the videos is natural and diverse.", "format": "ARFF", "uploader": "Quay Au", "uploader_id": 2373, "visibility": "public", "creator": null, "contributor": null, "date": "2019-03-14 18:09:39", "update_comment": null, "last_update": "2019-03-14 18:09:39", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/21230449\/file17307ec260c.arff", "default_target_attribute": "gender,Extr,Agr,Cons,Emot,Open", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "youtube", "The YouTube personality dataset consists of a collection of behavioral features, speech transcriptions, and personality impression scores for a set of 404 YouTube vloggers that explicitly show themselves in front of a webcam talking about a variety of topics including personal issues, politics, movies, books, etc. There is no content-related restriction and the language used in the videos is natural and diverse. \n" ],
"weight": 5 }, "qualities": { "NumberOfInstances": 404, "NumberOfFeatures": 31, "NumberOfClasses": null, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 30, "NumberOfSymbolicFeatures": 1, "ClassEntropy": null, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "Dimensionality": 0.07673267326732673, "MeanNominalAttDistinctValues": 2, "Quartile2KurtosisOfNumericAtts": 1.7978812735718464, "EquivalentNumberOfAtts": null, "MeanSkewnessOfNumericAtts": 0.7926273293167501, "Quartile2MeansOfNumericAtts": 0.9582337871287129, "MajorityClassPercentage": null, "MeanStdDevOfNumericAtts": 3.6286409089447544, "Quartile2MutualInformation": null, "MajorityClassSize": null, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": 0.26886516412532135, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -0.5829196188576371, "PercentageOfBinaryFeatures": 3.225806451612903, "Quartile2StdDevOfNumericAtts": 0.3362298289836828, "MaxKurtosisOfNumericAtts": 192.25974928740982, "MinMeansOfNumericAtts": -4.988304579455445e-5, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "MaxMeansOfNumericAtts": 215.8980693069307, "MinMutualInformation": null, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 8.52918656398051, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfNumericFeatures": 96.7741935483871, "Quartile3MeansOfNumericAtts": 4.668814827911363, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -7.933092285703942, "PercentageOfSymbolicFeatures": 3.225806451612903, "Quartile3MutualInformation": null, "MaxSkewnessOfNumericAtts": 13.57459836417631, "MinStdDevOfNumericAtts": 0.0002309294334034254, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 1.255634138955584, "MaxStdDevOfNumericAtts": 54.96163475573192, "MinorityClassPercentage": null, "Quartile1KurtosisOfNumericAtts": 0.5566431340811746, 
"Quartile3StdDevOfNumericAtts": 1.0794156901850172, "MeanAttributeEntropy": null, "MinorityClassSize": null, "Quartile1MeansOfNumericAtts": 0.2771350915841584, "StdvNominalAttDistinctValues": 0, "MeanKurtosisOfNumericAtts": 20.370670997045877, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "MeanMeansOfNumericAtts": 18.67755703512634, "Quartile1SkewnessOfNumericAtts": -0.5031485154528135, "AutoCorrelation": null, "MeanMutualInformation": null, "Quartile1StdDevOfNumericAtts": 0.09042824799458375 }, "tags": [ { "uploader": "2373", "tag": "2019_multioutput_paper" }, { "uploader": "38960", "tag": "Education" }, { "uploader": "38960", "tag": "Health" } ], "features": [ { "name": "gender", "index": "25", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "Female", "Male" ], [ [ "210", "0" ], [ "0", "194" ] ] ] }, { "name": "Extr", "index": "26", "type": "numeric", "distinct": "60", "missing": "0", "target": "1", "min": "2", "max": "7", "mean": "5", "stdev": "1" }, { "name": "Agr", "index": "27", "type": "numeric", "distinct": "59", "missing": "0", "target": "1", "min": "2", "max": "7", "mean": "5", "stdev": "1" }, { "name": "Cons", "index": "28", "type": "numeric", "distinct": "55", "missing": "0", "target": "1", "min": "2", "max": "6", "mean": "4", "stdev": "1" }, { "name": "Emot", "index": "29", "type": "numeric", "distinct": "57", "missing": "0", "target": "1", "min": "2", "max": "7", "mean": "5", "stdev": "1" }, { "name": "Open", "index": "30", "type": "numeric", "distinct": "51", "missing": "0", "target": "1", "min": "2", "max": "6", "mean": "5", "stdev": "1" }, { "name": "mean.pitch", "index": "0", "type": "numeric", "distinct": "395", "missing": "0", "min": "122", "max": "500", "mean": "216", "stdev": "55" }, { "name": "sd.pitch", "index": "1", "type": "numeric", "distinct": "398", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "mean.conf.pitch", "index": "2", "type": "numeric", 
"distinct": "399", "missing": "0", "min": "0", "max": "2", "mean": "1", "stdev": "0" }, { "name": "sd.conf.pitch", "index": "3", "type": "numeric", "distinct": "400", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "mean.spec.entropy", "index": "4", "type": "numeric", "distinct": "393", "missing": "0", "min": "0", "max": "4", "mean": "4", "stdev": "0" }, { "name": "sd.spec.entropy", "index": "5", "type": "numeric", "distinct": "401", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "mean.val.apeak", "index": "6", "type": "numeric", "distinct": "400", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "sd.val.apeak", "index": "7", "type": "numeric", "distinct": "395", "missing": "0", "min": "0", "max": "0", "mean": "0", "stdev": "0" }, { "name": "mean.loc.apeak", "index": "8", "type": "numeric", "distinct": "400", "missing": "0", "min": "0", "max": "0", "mean": "0", "stdev": "0" }, { "name": "sd.loc.apeak", "index": "9", "type": "numeric", "distinct": "402", "missing": "0", "min": "0", "max": "2", "mean": "1", "stdev": "0" }, { "name": "mean.num.apeak", "index": "10", "type": "numeric", "distinct": "399", "missing": "0", "min": "1", "max": "21", "mean": "7", "stdev": "3" }, { "name": "sd.num.apeak", "index": "11", "type": "numeric", "distinct": "399", "missing": "0", "min": "0", "max": "12", "mean": "3", "stdev": "2" }, { "name": "mean.energy", "index": "12", "type": "numeric", "distinct": "401", "missing": "0", "min": "0", "max": "0", "mean": "0", "stdev": "0" }, { "name": "sd.energy", "index": "13", "type": "numeric", "distinct": "397", "missing": "0", "min": "0", "max": "10", "mean": "1", "stdev": "1" }, { "name": "mean.d.energy", "index": "14", "type": "numeric", "distinct": "402", "missing": "0", "min": "0", "max": "0", "mean": "0", "stdev": "0" }, { "name": "sd.d.energy", "index": "15", "type": "numeric", "distinct": "403", "missing": "0", "min": "0", "max": "0", "mean": 
"0", "stdev": "0" }, { "name": "avg.voiced.seg", "index": "16", "type": "numeric", "distinct": "401", "missing": "0", "min": "0", "max": "10", "mean": "0", "stdev": "1" }, { "name": "avg.len.seg", "index": "17", "type": "numeric", "distinct": "396", "missing": "0", "min": "0", "max": "60", "mean": "3", "stdev": "4" }, { "name": "time.speaking", "index": "18", "type": "numeric", "distinct": "376", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "voice.rate", "index": "19", "type": "numeric", "distinct": "402", "missing": "0", "min": "0", "max": "0", "mean": "0", "stdev": "0" }, { "name": "num.turns", "index": "20", "type": "numeric", "distinct": "123", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "hogv.entropy", "index": "21", "type": "numeric", "distinct": "404", "missing": "0", "min": "1", "max": "8", "mean": "6", "stdev": "1" }, { "name": "hogv.median", "index": "22", "type": "numeric", "distinct": "370", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "hogv.cogR", "index": "23", "type": "numeric", "distinct": "81", "missing": "0", "min": "84", "max": "209", "mean": "131", "stdev": "17" }, { "name": "hogv.cogC", "index": "24", "type": "numeric", "distinct": "88", "missing": "0", "min": "84", "max": "238", "mean": "161", "stdev": "20" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }