{ "data_id": "541", "name": "socmob", "exact_name": "socmob", "version": 1, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\n17x17x2x2 tables of counts in GLIM-ready format used for the analyses\nin Biblarz, Timothy J., and Adrian E. Raftery. 1993. \"The Effects of\nFamily Disruption on Social Mobility.\" American Sociological Review\n(In press). For further details of the data, see this reference.\nColumn 1 is father's occupation, coded as follows:\n17. Professional, Self-Employed\n16. Professional-Salaried\n15. Manager\n14. Salesman-Nonretail\n13. Proprietor\n12. Clerk\n11. Salesman-Retail\n10. Craftsman-Manufacturing\n9. Craftsmen-Other\n8. Craftsman-Construction\n7. Service Worker\n6. Operative-Nonmanufacturing\n5. Operative-Manufacturing\n4. Laborer-Manufacturing\n3. Laborer-Nonmanufacturing\n2. Farmer\/Farm Manager\n1. Farm Laborer\nColumn 2 is son's occupation, coded in the same way as father's.\nColumn 3 is family structure, coded 1=intact family background and\n2=nonintact family background.\nColumn 4 is race, coded 1=white and 2=black.\nColumn 5 is counts for son's first occupation.\nColumn 6 is counts for son's current occupation.\nThe counts have been weighted to take account of the survey\ndesign, which is why they are not integers.\n************************************************************\n***********************************************************\nThis file was constructed from publicly available data collected\nby David Featherman and Robert Hauser in 1973: the \"Occupational\nChange in a Generation II\" (OCG II) Survey. Permission is hereby given to\nuse the above data for non-commercial scholarly and teaching purposes.\nIf these data are used in a published article or book,\nthe authors, the original data (in the form given in\nBiblarz and Raftery (1993), cited above), and StatLib should\nall be acknowledged.\n\n\nInformation about the dataset\nCLASSTYPE: numeric\nCLASSINDEX: none specific", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": "David Featherman and Robert Hauser", "contributor": "1973", "date": "2014-09-29 00:09:05", "update_comment": "set target feature", "last_update": "2014-10-07 01:32:15", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/52653\/socmob.arff", "kaggle_url": null, "default_target_attribute": "counts_for_sons_current_occupation", "row_id_attribute": null, "ignore_attribute": null, "runs": 6, "suggest": { "input": [ "socmob", "17x17x2x2 tables of counts in GLIM-ready format used for the analyses in Biblarz, Timothy J., and Adrian E. Raftery. 1993. \"The Effects of Family Disruption on Social Mobility.\" American Sociological Review (In press). For further details of the data, see this reference. Column 1 is father's occupation, coded as follows: 17. Professional, Self-Employed 16. Professional-Salaried 15. Manager 14. Salesman-Nonretail 13. Proprietor 12. Clerk 11. Salesman-Retail 10. Craftsman-Manufacturing 9. Craftsme " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1156, "NumberOfFeatures": 6, "NumberOfClasses": 0, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 2, "NumberOfSymbolicFeatures": 4, "J48.001.ErrRate": null, "MeanNominalAttDistinctValues": 9.5, "Quartile1SkewnessOfNumericAtts": 4.434987418217297, "REPTreeDepth1Kappa": null, "CfsSubsetEval_kNN1NAUC": null, "StdvNominalAttDistinctValues": 8.660254037844387, "J48.001.Kappa": null, "MeanSkewnessOfNumericAtts": 5.814349551349142, "Quartile1StdDevOfNumericAtts": 41.00364497068887, "REPTreeDepth2AUC": null, "CfsSubsetEval_kNN1NErrRate": null, "kNN1NAUC": null, "MajorityClassPercentage": null, "MeanStdDevOfNumericAtts": 42.68095707239175, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": null, "CfsSubsetEval_kNN1NKappa": null, "kNN1NErrRate": null, "kNN1NKappa": null, "MajorityClassSize": null, "MinAttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 53.486947485713, "REPTreeDepth2Kappa": null, "ClassEntropy": null, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": 25.09717193870431, "Quartile2MeansOfNumericAtts": 17.57677335640133, "REPTreeDepth3AUC": null, "DecisionStumpAUC": null, "MaxKurtosisOfNumericAtts": 81.8767230327217, "MinMeansOfNumericAtts": 16.940743944636615, "Quartile2MutualInformation": null, "REPTreeDepth3ErrRate": null, "DecisionStumpErrRate": null, "MaxMeansOfNumericAtts": 18.212802768166043, "MinMutualInformation": null, "Quartile2SkewnessOfNumericAtts": 5.814349551349142, "REPTreeDepth3Kappa": null, "DecisionStumpKappa": null, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 33.33333333333333, "Quartile2StdDevOfNumericAtts": 42.68095707239175, "RandomTreeDepth1AUC": null, "Dimensionality": 0.005190311418685121, "MaxNominalAttDistinctValues": 17, "MinSkewnessOfNumericAtts": 4.434987418217297, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "RandomTreeDepth1ErrRate": null, "EquivalentNumberOfAtts": null, "MaxSkewnessOfNumericAtts": 7.193711684480987, "MinStdDevOfNumericAtts": 41.00364497068887, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 81.8767230327217, "AutoCorrelation": -12.573246753246762, "RandomTreeDepth1Kappa": null, "J48.00001.AUC": null, "MaxStdDevOfNumericAtts": 44.35826917409464, "MinorityClassPercentage": null, "PercentageOfNumericFeatures": 33.33333333333333, "Quartile3MeansOfNumericAtts": 18.212802768166043, "CfsSubsetEval_DecisionStumpAUC": null, "RandomTreeDepth2AUC": null, "J48.00001.ErrRate": null, "MeanAttributeEntropy": null, "MinorityClassSize": null, "PercentageOfSymbolicFeatures": 66.66666666666666, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": null, "RandomTreeDepth2ErrRate": null, "J48.00001.Kappa": null, "MeanKurtosisOfNumericAtts": 53.486947485713, "NaiveBayesAUC": null, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 7.193711684480987, "CfsSubsetEval_DecisionStumpKappa": null, "RandomTreeDepth2Kappa": null, "J48.0001.AUC": null, "MeanMeansOfNumericAtts": 17.57677335640133, "NaiveBayesErrRate": null, "Quartile1KurtosisOfNumericAtts": 25.09717193870431, "Quartile3StdDevOfNumericAtts": 44.35826917409464, "CfsSubsetEval_NaiveBayesAUC": null, "RandomTreeDepth3AUC": null, "J48.0001.ErrRate": null, "MeanMutualInformation": null, "NaiveBayesKappa": null, "Quartile1MeansOfNumericAtts": 16.940743944636615, "REPTreeDepth1AUC": null, "CfsSubsetEval_NaiveBayesErrRate": null, "RandomTreeDepth3ErrRate": null, "J48.0001.Kappa": null, "J48.001.AUC": null, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 2, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": null, "CfsSubsetEval_NaiveBayesKappa": null, "RandomTreeDepth3Kappa": null }, "tags": [ { "uploader": "38960", "tag": "Sociology" }, { "uploader": "38960", "tag": "Statistics" }, { "uploader": "5824", "tag": "study_130" } ], "features": [ { "name": "counts_for_sons_current_occupation", "index": "5", "type": "numeric", "distinct": "361", "missing": "0", "target": "1", "min": "0", "max": "414", "mean": "18", "stdev": "41" }, { "name": "fathers_occupation", "index": "0", "type": "nominal", "distinct": "17", "missing": "0", "distr": [] }, { "name": "sons_occupation", "index": "1", "type": "nominal", "distinct": "17", "missing": "0", "distr": [] }, { "name": "family_structure", "index": "2", "type": "nominal", "distinct": "2", "missing": "0", "distr": [] }, { "name": "race", "index": "3", "type": "nominal", "distinct": "2", "missing": "0", "distr": [] }, { "name": "counts_for_sons_first_occupation", "index": "4", "type": "numeric", "distinct": "358", "missing": "0", "min": "0", "max": "746", "mean": "17", "stdev": "44" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }