{ "data_id": "43610", "name": "Risk-of-being-drawn-into-online-sex-work-(cleaned)", "exact_name": "Risk-of-being-drawn-into-online-sex-work-(cleaned)", "version": 1, "version_label": "v1.0", "description": "This dataset is the resulting cleaned version of Panos Kostakos's Risk of being drawn into online sex work dataset.\nContext\nThis database was used in the paper: \"Covert online ethnography and machine learning for detecting individuals at risk of being drawn into online sex work\". https:\/\/www.flinders.edu.au\/centre-crime-policy-research\/illicit-networks-workshop\nContent\nThe database includes data scraped from a European online adult forum. Using covert online ethnography we interviewed a small number of participants and determined their risk to either supply or demand sex services through that forum. This is a great dataset for semi-supervised learning.\nAcknowledgements\nThe dataset was initially publicized by Panos Kostakos.\nInspiration\nHow can we identify individuals at risk of being drawn into online sex work? The spread of online social media enables a greater number of people to be involved in the online sex trade; however, detecting deviant behaviors online is limited by the low availability of data. 
To overcome this challenge, we combine covert online ethnography with semi-supervised learning using data from a popular European adult forum.", "format": "arff", "uploader": "Dustin Carrion", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-24 00:40:03", "update_comment": null, "last_update": "2022-03-24 00:40:03", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102435\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Risk-of-being-drawn-into-online-sex-work-(cleaned)", "This dataset is the resulting cleaned version of Panos Kostakos's Risk of being drawn into online sex work dataset. Context This database was used in the paper: \"Covert online ethnography and machine learning for detecting individuals at risk of being drawn into online sex work\". https:\/\/www.flinders.edu.au\/centre-crime-policy-research\/illicit-networks-workshop Content The database includes data scraped from a European online adult forum. 
Using covert online ethnography we interviewed a small nu " ], "weight": 5 }, "qualities": { "NumberOfInstances": 28831, "NumberOfFeatures": 30, "NumberOfClasses": null, "NumberOfMissingValues": 54259, "NumberOfInstancesWithMissingValues": 28779, "NumberOfNumericFeatures": 26, "NumberOfSymbolicFeatures": 2, "Dimensionality": 0.0010405466338316396, "PercentageOfNumericFeatures": 86.66666666666667, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 6.666666666666667, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 2, "PercentageOfBinaryFeatures": 6.666666666666667, "PercentageOfInstancesWithMissingValues": 99.81963858346919, "AutoCorrelation": null, "PercentageOfMissingValues": 6.273224422785659 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "User_ID", "index": "0", "type": "numeric", "distinct": "28763", "missing": "0", "min": "1", "max": "48606", "mean": "24151", "stdev": "14052" }, { "name": "Female", "index": "1", "type": "nominal", "distinct": "2", "missing": "0", "distr": [] }, { "name": "Age", "index": "2", "type": "numeric", "distinct": "526", "missing": "0", "min": "18", "max": "87", "mean": "36", "stdev": "10" }, { "name": "Location", "index": "3", "type": "string", "distinct": "18", "missing": "0" }, { "name": "Verification", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [] }, { "name": "Heterosexual", "index": "5", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "Homosexual", "index": "6", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "bicurious", "index": "7", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "bisexual", "index": "8", "type": "numeric", 
"distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "Dominant", "index": "9", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "Submisive", "index": "10", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "Switch", "index": "11", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "Men", "index": "12", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "Men_and_Women", "index": "13", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "Nobody", "index": "14", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "Nobody_but_maybe", "index": "15", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "Women", "index": "16", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "Points_Rank", "index": "17", "type": "numeric", "distinct": "375", "missing": "0", "min": "-650", "max": "1626", "mean": "10", "stdev": "39" }, { "name": "Last_login", "index": "18", "type": "numeric", "distinct": "2360", "missing": "0", "min": "1", "max": "2402", "mean": "735", "stdev": "656" }, { "name": "Member_since_year", "index": "19", "type": "numeric", "distinct": "9", "missing": "0", "min": "2009", "max": "2017", "mean": "2014", "stdev": "2" }, { "name": "Member_since_month", "index": "20", "type": "numeric", "distinct": "12", "missing": "0", "min": "1", "max": "12", "mean": "7", "stdev": "3" }, { "name": "Member_since_day", "index": "21", "type": "numeric", "distinct": "31", "missing": "0", "min": "1", "max": "31", "mean": "15", "stdev": "9" }, 
{ "name": "Number_of_Comments_in_public_forum", "index": "22", "type": "numeric", "distinct": "217", "missing": "0", "min": "0", "max": "2062", "mean": "3", "stdev": "30" }, { "name": "Time_spent_chating_H:M", "index": "23", "type": "numeric", "distinct": "1199", "missing": "0", "min": "0", "max": "338192", "mean": "231", "stdev": "3979" }, { "name": "Number_of_advertisments_posted", "index": "24", "type": "numeric", "distinct": "18", "missing": "0", "min": "0", "max": "21", "mean": "0", "stdev": "1" }, { "name": "Number_of_offline_meetings_attended", "index": "25", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "23", "mean": "0", "stdev": "0" }, { "name": "Number_of_Friends", "index": "26", "type": "numeric", "distinct": "49", "missing": "0", "min": "1", "max": "143", "mean": "1", "stdev": "2" }, { "name": "Profile_pictures", "index": "27", "type": "numeric", "distinct": "63", "missing": "0", "min": "0", "max": "147", "mean": "0", "stdev": "3" }, { "name": "Friends_ID_list", "index": "28", "type": "string", "distinct": "2742", "missing": "25518" }, { "name": "Risk", "index": "29", "type": "numeric", "distinct": "2", "missing": "28741", "min": "0", "max": "1", "mean": "0", "stdev": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }