{ "data_id": "44979", "name": "diamonds", "exact_name": "diamonds", "version": 8, "version_label": null, "description": "**Description**\n\nThis classic dataset originally contained the prices and other attributes of almost 54,000 diamonds.\nHowever, 14184 of those seem to be the same diamonds, measured from a different angle.\nThis can be found out by checking for duplicated values when disregarding the variables\nx, y, z, depth and table, which are dependent on the angle.\n\n**Attribute Information**\n\n1. *price* - price in US dollars (\\$326--\\$18,823), target feature\n2. *carat* - weight of the diamond (0.2--5.01)\n3. *cut* - quality of the cut (Fair, Good, Very Good, Premium, Ideal)\n4. *color* - diamond colour, from J (worst) to D (best)\n5. *clarity* - a measurement of how clear the diamond is (I1 (worst), SI2, SI1, VS2, VS1, VVS2, VVS1, IF (best))\n6. *x* - length in mm (0--10.74)\n7. *y* - width in mm (0--58.9)\n8. *z* - depth in mm (0--31.8)\n9. *depth* - total depth percentage = z \/ mean(x, y) = 2 * z \/ (x + y) (43--79)\n10. *table* - width of top of diamond relative to widest point (43--95)", "format": "arff", "uploader": "Sebastian Fischer", "uploader_id": 30127, "visibility": "public", "creator": null, "contributor": null, "date": "2022-12-22 16:15:30", "update_comment": null, "last_update": "2022-12-22 16:15:30", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/api.openml.org\/data\/download\/22111843\/file22f1679ae7b21.arff", "default_target_attribute": "price", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "diamonds", "This classic dataset originally contained the prices and other attributes of almost 54,000 diamonds. However, 14184 of those seem to be the same diamonds, measured from a different angle. This can be found out by checking for duplicated values when disregarding the variables x, y, z, depth and table, which are dependent on the angle. 1. 
*price* - price in US dollars (\\$326--\\$18,823), target feature 2. *carat* - weight of the diamond (0.2--5.01) 3. *cut* - quality of the cut (Fair, " ], "weight": 5 }, "qualities": { "NumberOfInstances": 53940, "NumberOfFeatures": 10, "NumberOfClasses": 0, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 3, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "AutoCorrelation": -22.555590574537902, "PercentageOfMissingValues": 0, "Dimensionality": 0.0001853911753800519, "PercentageOfNumericFeatures": 70, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 30 }, "tags": [ { "tag": "Health", "uploader": "38960" }, { "tag": "Medicine", "uploader": "38960" }, { "tag": "study_353", "uploader": "0" } ], "features": [ { "name": "price", "index": "6", "type": "numeric", "distinct": "11602", "missing": "0", "target": "1", "min": "326", "max": "18823", "mean": "3933", "stdev": "3989" }, { "name": "carat", "index": "0", "type": "numeric", "distinct": "273", "missing": "0", "min": "0", "max": "5", "mean": "1", "stdev": "0" }, { "name": "cut", "index": "1", "type": "nominal", "distinct": "5", "missing": "0", "distr": [] }, { "name": "color", "index": "2", "type": "nominal", "distinct": "7", "missing": "0", "distr": [] }, { "name": "clarity", "index": "3", "type": "nominal", "distinct": "8", "missing": "0", "distr": [] }, { "name": "depth", "index": "4", "type": "numeric", "distinct": "184", "missing": "0", "min": "43", "max": "79", "mean": "62", "stdev": "1" }, { "name": "table", "index": "5", "type": "numeric", "distinct": "127", "missing": "0", "min": "43", "max": "95", "mean": "57", "stdev": "2" }, { "name": "x", "index": "7", "type": "numeric", "distinct": "554", "missing": "0", "min": "0", "max": "11", "mean": "6", "stdev": "1" 
}, { "name": "y", "index": "8", "type": "numeric", "distinct": "552", "missing": "0", "min": "0", "max": "59", "mean": "6", "stdev": "1" }, { "name": "z", "index": "9", "type": "numeric", "distinct": "375", "missing": "0", "min": "0", "max": "32", "mean": "4", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }