{ "data_id": "43368", "name": "Online-Retail-II-UCI", "exact_name": "Online-Retail-II-UCI", "version": 1, "version_label": "v1.0", "description": "Context\nThis Online Retail II data set contains all the transactions occurring for a UK-based and registered, non-store online retail between 01\/12\/2009 and 09\/12\/2011.The company mainly sells unique all-occasion gift-ware. Many customers of the company are wholesalers.\nContent\nAttribute Information:\nInvoiceNo: Invoice number. Nominal. A 6-digit integral number uniquely assigned to each transaction. If this code starts with the letter 'c', it indicates a cancellation.\nStockCode: Product (item) code. Nominal. A 5-digit integral number uniquely assigned to each distinct product.\nDescription: Product (item) name. Nominal.\nQuantity: The quantities of each product (item) per transaction. Numeric.\nInvoiceDate: Invice date and time. Numeric. The day and time when a transaction was generated.\nUnitPrice: Unit price. Numeric. Product price per unit in sterling ().\nCustomerID: Customer number. Nominal. A 5-digit integral number uniquely assigned to each customer.\nCountry: Country name. Nominal. The name of the country where a customer resides.\nAcknowledgements\nChen, D. Sain, S.L., and Guo, K. (2012), Data mining for the online retail industry: A case study of RFM model-based customer segmentation using data mining, Journal of Database Marketing and Customer Strategy Management, Vol. 19, No. 3, pp. 197-208. doi: [Web Link].\nChen, D., Guo, K. and Ubakanma, G. (2015), Predicting customer profitability over time based on RFM time series, International Journal of Business Forecasting and Marketing Intelligence, Vol. 2, No. 1, pp.1-18. doi: [Web Link].\nChen, D., Guo, K., and Li, Bo (2019), Predicting Customer Profitability Dynamically over Time: An Experimental Comparative Study, 24th Iberoamerican Congress on Pattern Recognition (CIARP 2019), Havana, Cuba, 28-31 Oct, 2019.\nLaha Ale, Ning Zhang, Huici Wu, Dajiang Chen, and Tao Han, Online Proactive Caching in Mobile Edge Computing Using Bidirectional Deep Recurrent Neural Network, IEEE Internet of Things Journal, Vol. 6, Issue 3, pp. 5520-5530, 2019.\nRina Singh, Jeffrey A. Graves, Douglas A. Talbert, William Eberle, Prefix and Suffix Sequential Pattern Mining, Industrial Conference on Data Mining 2018: Advances in Data Mining. Applications and Theoretical Aspects, pp. 309-324. 2018.", "format": "arff", "uploader": "Onur Yildirim", "uploader_id": 30126, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-23 12:42:41", "update_comment": null, "last_update": "2022-03-23 12:42:41", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102193\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Online-Retail-II-UCI", "Context This Online Retail II data set contains all the transactions occurring for a UK-based and registered, non-store online retail between 01\/12\/2009 and 09\/12\/2011.The company mainly sells unique all-occasion gift-ware. Many customers of the company are wholesalers. Content Attribute Information: InvoiceNo: Invoice number. Nominal. A 6-digit integral number uniquely assigned to each transaction. If this code starts with the letter 'c', it indicates a cancellation. StockCode: Product (item) c " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1067371, "NumberOfFeatures": 8, "NumberOfClasses": null, "NumberOfMissingValues": 247481, "NumberOfInstancesWithMissingValues": 243007, "NumberOfNumericFeatures": 3, "NumberOfSymbolicFeatures": 0, "Dimensionality": 7.495050924186623e-6, "PercentageOfNumericFeatures": 37.5, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 22.766872999172733, "AutoCorrelation": null, "PercentageOfMissingValues": 2.898254215263484 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "Invoice", "index": "0", "type": "string", "distinct": "53628", "missing": "0" }, { "name": "StockCode", "index": "1", "type": "string", "distinct": "5305", "missing": "0" }, { "name": "Description", "index": "2", "type": "string", "distinct": "5697", "missing": "4474" }, { "name": "Quantity", "index": "3", "type": "numeric", "distinct": "1057", "missing": "0", "min": "-80995", "max": "80995", "mean": "10", "stdev": "173" }, { "name": "InvoiceDate", "index": "4", "type": "string", "distinct": "47635", "missing": "0" }, { "name": "Price", "index": "5", "type": "numeric", "distinct": "2807", "missing": "0", "min": "-53594", "max": "38970", "mean": "5", "stdev": "124" }, { "name": "Customer_ID", "index": "6", "type": "numeric", "distinct": "5942", "missing": "243007", "min": "12346", "max": "18287", "mean": "15325", "stdev": "1697" }, { "name": "Country", "index": "7", "type": "string", "distinct": "43", "missing": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }