{ "data_id": "43647", "name": "Indian-News-Articles", "exact_name": "Indian-News-Articles", "version": 1, "version_label": "v1.0", "description": "Context\nIt's always interesting to analyse what's going on in the news but there's no good data avaialable in indian context on kaggle, so I created one.\nContent\nApart from the main content of the articles, each row contains author, link, publish date etc.\nAcknowledgements\nGrateful to the creator of python, beautifulsoup library and firstpost.com.\nInspiration\nData is not always available to us, sometimes we need to create one, this is my attempt to do that.", "format": "arff", "uploader": "Dustin Carrion", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-24 00:58:22", "update_comment": null, "last_update": "2022-03-24 00:58:22", "licence": "Database: Open Database, Contents: Original Authors", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102472\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Indian-News-Articles", "Context It's always interesting to analyse what's going on in the news but there's no good data avaialable in indian context on kaggle, so I created one. Content Apart from the main content of the articles, each row contains author, link, publish date etc. Acknowledgements Grateful to the creator of python, beautifulsoup library and firstpost.com. Inspiration Data is not always available to us, sometimes we need to create one, this is my attempt to do that. \n" ], "weight": 5 }, "qualities": { "NumberOfInstances": 1568, "NumberOfFeatures": 8, "NumberOfClasses": null, "NumberOfMissingValues": 33, "NumberOfInstancesWithMissingValues": 15, "NumberOfNumericFeatures": 0, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.00510204081632653, "PercentageOfNumericFeatures": 0, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0.9566326530612245, "AutoCorrelation": null, "PercentageOfMissingValues": 0.2630739795918367 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "source", "index": "0", "type": "string", "distinct": "2", "missing": "0" }, { "name": "category", "index": "1", "type": "string", "distinct": "4", "missing": "0" }, { "name": "link", "index": "2", "type": "string", "distinct": "1563", "missing": "0" }, { "name": "author", "index": "3", "type": "string", "distinct": "129", "missing": "6" }, { "name": "published_at", "index": "4", "type": "string", "distinct": "1518", "missing": "6" }, { "name": "header", "index": "5", "type": "string", "distinct": "1557", "missing": "0" }, { "name": "subheader", "index": "6", "type": "string", "distinct": "1538", "missing": "12" }, { "name": "content", "index": "7", "type": "string", "distinct": "1543", "missing": "9" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }