{ "data_id": "43834", "name": "Historical-Financials-Data-for-3000-stocks", "exact_name": "Historical-Financials-Data-for-3000-stocks", "version": 1, "version_label": "v1.0", "description": "Context\nGetting access to high-quality historical stock market data can be very expensive and\/or complicated; parsing SEC 10-Q filings direct from the SEC EDGAR is difficult due to the varying structures of filings and SEC filing data from providers such as Quandl charge hundreds or thousands of dollars in yearly fees to get access to them. Here, I provide an easy-to-use, straight from the source database of parsed financials information from SEC 10-Q filings for more than 3000 stocks.\nContent\nThe quarterly financials are provided in a single .csv file, quarterly_financials.csv\n50% of the data is NaN either because the field wasn't detected by my XBRL parsing system or the field wasn't addressed in the SEC filing.\nAcknowledgements\nAll the data is scraped from the SEC from the XBRL files.", "format": "arff", "uploader": "Elif Ceren Gok", "uploader_id": 30125, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-24 15:32:09", "update_comment": null, "last_update": "2022-03-24 15:32:09", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102659\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Historical-Financials-Data-for-3000-stocks", "Context Getting access to high-quality historical stock market data can be very expensive and\/or complicated; parsing SEC 10-Q filings direct from the SEC EDGAR is difficult due to the varying structures of filings and SEC filing data from providers such as Quandl charge hundreds or thousands of dollars in yearly fees to get access to them. 
Here, I provide an easy-to-use, straight from the source database of parsed financials information from SEC 10-Q filings for more than 3000 stocks. Content T " ], "weight": 5 }, "qualities": { "NumberOfInstances": 101787, "NumberOfFeatures": 45, "NumberOfClasses": null, "NumberOfMissingValues": 2857964, "NumberOfInstancesWithMissingValues": 101787, "NumberOfNumericFeatures": 42, "NumberOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 100, "AutoCorrelation": null, "PercentageOfMissingValues": 62.395306975459654, "Dimensionality": 0.0004420996787409001, "PercentageOfNumericFeatures": 93.33333333333333, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0 }, "tags": [ { "uploader": "38960", "tag": "Machine Learning" }, { "uploader": "38960", "tag": "Statistics" } ], "features": [ { "name": "Unnamed:_0", "index": "0", "type": "numeric", "distinct": "101787", "missing": "0", "min": "0", "max": "101786", "mean": "50893", "stdev": "29384" }, { "name": "commonstocksharesissued", "index": "1", "type": "numeric", "distinct": "45206", "missing": "8616", "min": "-595000000", "max": "2147483647", "mean": "2147483647", "stdev": "2147483647" }, { "name": "assetscurrent", "index": "2", "type": "numeric", "distinct": "51259", "missing": "24555", "min": "-2147483648", "max": "2147483647", "mean": "1654957801", "stdev": "2147483647" }, { "name": "accountspayablecurrent", "index": "3", "type": "numeric", "distinct": "33624", "missing": "35815", "min": "-2147483648", "max": "2147483647", "mean": "406329471", "stdev": "2147483647" }, { "name": "commonstockvalue", "index": "4", "type": "numeric", "distinct": "16551", "missing": "11337", "min": "-2147483648", "max": "2147483647", "mean": "150379232", "stdev": "1282208504" }, { "name": "liabilities", "index": "5", "type": "numeric", "distinct": "52661", 
"missing": "19366", "min": "-2147483648", "max": "2147483647", "mean": "2147483647", "stdev": "2147483647" }, { "name": "liabilitiesandstockholdersequity", "index": "6", "type": "numeric", "distinct": "71000", "missing": "419", "min": "-2147483648", "max": "2147483647", "mean": "2147483647", "stdev": "2147483647" }, { "name": "stockholdersequity", "index": "7", "type": "numeric", "distinct": "65938", "missing": "4885", "min": "-2147483648", "max": "2147483647", "mean": "1138630384", "stdev": "2147483647" }, { "name": "earningspersharebasic", "index": "8", "type": "numeric", "distinct": "2524", "missing": "10346", "min": "-70000", "max": "8867830", "mean": "947", "stdev": "78708" }, { "name": "netincomeloss", "index": "9", "type": "numeric", "distinct": "56668", "missing": "4734", "min": "-2147483648", "max": "2147483647", "mean": "112029126", "stdev": "1875202393" }, { "name": "profitloss", "index": "10", "type": "numeric", "distinct": "28761", "missing": "43614", "min": "-2147483648", "max": "2147483647", "mean": "121227131", "stdev": "1962394339" }, { "name": "costofgoodssold", "index": "11", "type": "numeric", "distinct": "19345", "missing": "71667", "min": "-2147483648", "max": "2147483647", "mean": "1276894775", "stdev": "2147483647" }, { "name": "filing_date", "index": "12", "type": "string", "distinct": "2635", "missing": "0" }, { "name": "costsandexpenses", "index": "13", "type": "numeric", "distinct": "21104", "missing": "71771", "min": "-2147483648", "max": "2147483647", "mean": "2046239185", "stdev": "2147483647" }, { "name": "cash", "index": "14", "type": "numeric", "distinct": "5509", "missing": "81223", "min": "-115000000", "max": "2147483647", "mean": "147040673", "stdev": "1530666078" }, { "name": "notespayable", "index": "15", "type": "numeric", "distinct": "3247", "missing": "87412", "min": "-802160000", "max": "2147483647", "mean": "487905993", "stdev": "1829115694" }, { "name": "preferredstockvalue", "index": "16", "type": "numeric", "distinct": 
"1853", "missing": "85167", "min": "-2147483648", "max": "2147483647", "mean": "245158993", "stdev": "1482157922" }, { "name": "depreciation", "index": "17", "type": "numeric", "distinct": "16499", "missing": "36740", "min": "-520000000", "max": "2147483647", "mean": "107755694", "stdev": "1759218479" }, { "name": "operatingexpenses", "index": "18", "type": "numeric", "distinct": "33013", "missing": "51869", "min": "-2147483648", "max": "2147483647", "mean": "406513167", "stdev": "2147483647" }, { "name": "revenues", "index": "19", "type": "numeric", "distinct": "34700", "missing": "35561", "min": "-2147483648", "max": "2147483647", "mean": "1214620410", "stdev": "2147483647" }, { "name": "land", "index": "20", "type": "numeric", "distinct": "5676", "missing": "79959", "min": "-197000", "max": "2147483647", "mean": "264746903", "stdev": "1019777579" }, { "name": "accountsreceivablenet", "index": "21", "type": "numeric", "distinct": "4847", "missing": "87788", "min": "-2147483648", "max": "2147483647", "mean": "341609245", "stdev": "2147483647" }, { "name": "deferredrevenue", "index": "22", "type": "numeric", "distinct": "4015", "missing": "82103", "min": "-2147483648", "max": "2147483647", "mean": "125446709", "stdev": "759634616" }, { "name": "grossprofit", "index": "23", "type": "numeric", "distinct": "34077", "missing": "52927", "min": "-2147483648", "max": "2147483647", "mean": "528353079", "stdev": "2147483647" }, { "name": "sharesissued", "index": "24", "type": "numeric", "distinct": "9226", "missing": "71886", "min": "-2147483648", "max": "2147483647", "mean": "492528649", "stdev": "2147483647" }, { "name": "accruedincometaxes", "index": "25", "type": "numeric", "distinct": "1433", "missing": "94954", "min": "-545883000", "max": "2147483647", "mean": "201989989", "stdev": "1282096518" }, { "name": "sharesoutstanding", "index": "26", "type": "numeric", "distinct": "11153", "missing": "65296", "min": "-1383496000", "max": "2147483647", "mean": "1746099561", 
"stdev": "2147483647" }, { "name": "borrowedfunds", "index": "27", "type": "numeric", "distinct": "307", "missing": "100074", "min": "-45000000", "max": "2147483647", "mean": "1404101534", "stdev": "2147483647" }, { "name": "inventorygross", "index": "28", "type": "numeric", "distinct": "3639", "missing": "93715", "min": "-512000", "max": "2147483647", "mean": "708165008", "stdev": "2147483647" }, { "name": "commercialpaper", "index": "29", "type": "numeric", "distinct": "1195", "missing": "95653", "min": "-181500000", "max": "2147483647", "mean": "1071782002", "stdev": "2147483647" }, { "name": "dividends", "index": "30", "type": "numeric", "distinct": "3894", "missing": "87459", "min": "-2147483648", "max": "2147483647", "mean": "160188228", "stdev": "1112953108" }, { "name": "commonstocknoparvalue", "index": "31", "type": "numeric", "distinct": "33", "missing": "101080", "min": "-5127", "max": "2147483647", "mean": "355627307", "stdev": "1857398591" }, { "name": "costofservices", "index": "32", "type": "numeric", "distinct": "8025", "missing": "88745", "min": "-971866000", "max": "2147483647", "mean": "671079569", "stdev": "2147483647" }, { "name": "debtcurrent", "index": "33", "type": "numeric", "distinct": "4408", "missing": "87706", "min": "-2147483648", "max": "2147483647", "mean": "662307719", "stdev": "2147483647" }, { "name": "accruedinsurancecurrent", "index": "34", "type": "numeric", "distinct": "1681", "missing": "96327", "min": "109", "max": "2147483647", "mean": "137817604", "stdev": "1165163220" }, { "name": "officerscompensation", "index": "35", "type": "numeric", "distinct": "344", "missing": "98246", "min": "-2250000", "max": "300000000", "mean": "3193602", "stdev": "20186520" }, { "name": "intangibleassetscurrent", "index": "36", "type": "numeric", "distinct": "198", "missing": "100706", "min": "-20000000", "max": "2147483647", "mean": "38912817", "stdev": "226749606" }, { "name": "salariesandwages", "index": "37", "type": "numeric", "distinct": 
"934", "missing": "99034", "min": "-8000000", "max": "2147483647", "mean": "29940676", "stdev": "151917843" }, { "name": "interestanddebtexpense", "index": "38", "type": "numeric", "distinct": "2213", "missing": "96404", "min": "-1735000000", "max": "2024000000", "mean": "58918402", "stdev": "181649181" }, { "name": "convertibledebt", "index": "39", "type": "numeric", "distinct": "1133", "missing": "95400", "min": "-627000000", "max": "2147483647", "mean": "379279599", "stdev": "2147483647" }, { "name": "assetmanagementcosts", "index": "40", "type": "numeric", "distinct": "851", "missing": "100095", "min": "-2630000", "max": "2147483647", "mean": "149051015", "stdev": "1682291539" }, { "name": "accountsreceivablegross", "index": "41", "type": "numeric", "distinct": "1480", "missing": "96279", "min": "-60000", "max": "2147483647", "mean": "185285805", "stdev": "724627931" }, { "name": "directoperatingcosts", "index": "42", "type": "numeric", "distinct": "1283", "missing": "99631", "min": "-739000000", "max": "2147483647", "mean": "241687512", "stdev": "617764450" }, { "name": "operatingcycle", "index": "43", "type": "string", "distinct": "26", "missing": "101400" }, { "name": "stock", "index": "44", "type": "string", "distinct": "3189", "missing": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 1, "nr_of_downloads": 0, "total_downloads": 0, "reach": 1, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }