{ "data_id": "30751", "name": "QSAR-DATASET-FOR-DRUG-TARGET-CHEMBL4931", "exact_name": "QSAR-DATASET-FOR-DRUG-TARGET-CHEMBL4931", "version": 10, "version_label": null, "description": "This dataset contains QSAR data (from ChEMBL version 17) showing activity values (unit is pseudo-pCI50) of several compounds on drug target ChEMBL_ID: CHEMBL4931 (TID: 11165), and it has 57 rows and 2 features (not including molecule IDs and class feature: molecule_id and pXC50). The features represent Basic Molecular Descriptors which were generated from SMILES strings. Missing value imputation was applied to this dataset (By choosing the Median). Feature selection was also applied.", "format": "ARFF", "uploader": "Noureddin Sadawi", "uploader_id": 62, "visibility": "public", "creator": "\"Dr Jeremy Besnard, Dr Ivan Olier, Dr Noureddin Sadawi, Dr Larisa Soldatova, Dr Crina Grosan, Prof Ross King, Dr Richard Bickerton, Prof Andrew Hopkins and Dr Willem van Hoorn\"", "contributor": null, "date": "2016-07-15 05:47:54", "update_comment": null, "last_update": "2016-07-15 05:47:54", "licence": "Public", "status": "deactivated", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/3427973\/data_40260.arff", "kaggle_url": null, "default_target_attribute": "pXC50", "row_id_attribute": "molecule_id", "ignore_attribute": null, "runs": 1, "suggest": { "input": [ "QSAR-DATASET-FOR-DRUG-TARGET-CHEMBL4931", "This dataset contains QSAR data (from ChEMBL version 17) showing activity values (unit is pseudo-pCI50) of several compounds on drug target ChEMBL_ID: CHEMBL4931 (TID: 11165), and it has 57 rows and 2 features (not including molecule IDs and class feature: molecule_id and pXC50). The features represent Basic Molecular Descriptors which were generated from SMILES strings. Missing value imputation was applied to this dataset (By choosing the Median). Feature selection was also applied. \n"
], "weight": 5 }, "qualities": { "NumberOfInstances": 57, "NumberOfFeatures": 4, "NumberOfClasses": 0, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 3, "NumberOfSymbolicFeatures": 1, "MaxSkewnessOfNumericAtts": 1.709631265746812, "MinStdDevOfNumericAtts": 1.0084658259232873, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 1.709631265746812, "MaxStdDevOfNumericAtts": 3.8827239295090195, "MinorityClassPercentage": null, "Quartile1KurtosisOfNumericAtts": -1.357675545371073, "Quartile3StdDevOfNumericAtts": 3.8827239295090195, "MeanAttributeEntropy": null, "MinorityClassSize": null, "Quartile1MeansOfNumericAtts": 6.3162280701754385, "StdvNominalAttDistinctValues": null, "MeanKurtosisOfNumericAtts": 1.2139728665697986, "NumberOfBinaryFeatures": 0, "Quartile1MutualInformation": null, "MeanMeansOfNumericAtts": 17.553187134502924, "Quartile1SkewnessOfNumericAtts": -0.15451713425605948, "MeanMutualInformation": null, "Quartile1StdDevOfNumericAtts": 1.0084658259232873, "AutoCorrelation": -0.9270714285714285, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "ClassEntropy": null, "MeanNominalAttDistinctValues": null, "Quartile2KurtosisOfNumericAtts": -0.4193421350160831, "Dimensionality": 0.07017543859649122, "MeanSkewnessOfNumericAtts": 0.541393942398214, "Quartile2MeansOfNumericAtts": 6.717017543859649, "EquivalentNumberOfAtts": null, "MajorityClassPercentage": null, "MeanStdDevOfNumericAtts": 2.195791897374558, "Quartile2MutualInformation": null, "MajorityClassSize": null, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": 0.06906769570388953, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.357675545371073, "PercentageOfBinaryFeatures": 0, "Quartile2StdDevOfNumericAtts": 1.6961859366913679, "MaxKurtosisOfNumericAtts": 5.418936280096552, "MinMeansOfNumericAtts": 6.3162280701754385, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null,
"MaxMeansOfNumericAtts": 39.626315789473686, "MinMutualInformation": null, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 5.418936280096552, "MaxMutualInformation": null, "MinNominalAttDistinctValues": null, "PercentageOfNumericFeatures": 75, "Quartile3MeansOfNumericAtts": 39.626315789473686, "MaxNominalAttDistinctValues": null, "MinSkewnessOfNumericAtts": -0.15451713425605948, "PercentageOfSymbolicFeatures": 25, "Quartile3MutualInformation": null }, "tags": [ { "tag": "MetaQSAR", "uploader": "62" }, { "tag": "study_13", "uploader": "62" } ], "features": [ { "name": "pXC50", "index": "3", "type": "numeric", "distinct": "44", "missing": "0", "target": "1", "min": "4", "max": "9", "mean": "7", "stdev": "2" }, { "name": "molecule_id", "index": "0", "type": "nominal", "distinct": "57", "missing": "0", "identifier": "1", "distr": [] }, { "name": "AMW", "index": "1", "type": "numeric", "distinct": "54", "missing": "0", "min": "5", "max": "11", "mean": "6", "stdev": "1" }, { "name": "C.", "index": "2", "type": "numeric", "distinct": "40", "missing": "0", "min": "32", "max": "49", "mean": "40", "stdev": "4" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }