Dropout: a simple way to prevent neural networks from overfitting

Name: Work Video:
Duration: 3 min 30 s
Nitish Srivastava; Geoffrey E. Hinton; Alex Krizhevsky; Ilya Sutskever; Ruslan Salakhutdinov
{'id': 'https://openalex.org/W2095705004', 'doi': None, 'title': 'Dropout: a simple way to prevent neural networks from overfitting', 'display_name': 'Dropout: a simple way to prevent neural networks from overfitting', 'publication_year': 2014, 'publication_date': '2014-01-01', 'ids': {'openalex': 'https://openalex.org/W2095705004', 'mag': '2095705004'}, 'language': 'en', 'primary_location': {'is_oa': False, 'landing_page_url': 'https://jmlr.csail.mit.edu/papers/volume15/srivastava14a/srivastava14a.pdf', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S118988714', 'display_name': 'Journal of Machine Learning Research', 'issn_l': '1532-4435', 'issn': ['1532-4435', '1533-7928'], 'is_oa': False, 'is_in_doaj': False, 'is_core': True, 'host_organization': 'https://openalex.org/P4310315718', 'host_organization_name': 'The MIT Press', 'host_organization_lineage': ['https://openalex.org/P4310315718'], 'host_organization_lineage_names': ['The MIT Press'], 'type': 'journal'}, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}, 'type': 'article', 'type_crossref': 'journal-article', 'indexed_in': [], 'open_access': {'is_oa': False, 'oa_status': 'closed', 'oa_url': None, 'any_repository_has_fulltext': False}, 'authorships': [{'author_position': 'first', 'author': {'id': 'https://openalex.org/A5103070090', 'display_name': 'Nitish Srivastava', 'orcid': 'https://orcid.org/0000-0002-3442-5352'}, 'institutions': [{'id': 'https://openalex.org/I185261750', 'display_name': 'University of Toronto', 'ror': 'https://ror.org/03dbr7087', 'country_code': 'CA', 'type': 'education', 'lineage': ['https://openalex.org/I185261750']}], 'countries': ['CA'], 'is_corresponding': False, 'raw_author_name': 'Nitish Srivastava', 'raw_affiliation_strings': ['Department of Computer Science University of Toronto  Toronto Ontario Canada'], 'affiliations': [{'raw_affiliation_string': 'Department of Computer Science University of Toronto  Toronto Ontario Canada', 'institution_ids': ['https://openalex.org/I185261750']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5108093963', 'display_name': 'Geoffrey E. Hinton', 'orcid': None}, 'institutions': [{'id': 'https://openalex.org/I185261750', 'display_name': 'University of Toronto', 'ror': 'https://ror.org/03dbr7087', 'country_code': 'CA', 'type': 'education', 'lineage': ['https://openalex.org/I185261750']}], 'countries': ['CA'], 'is_corresponding': False, 'raw_author_name': 'Geoffrey Hinton', 'raw_affiliation_strings': ['Department of Computer Science University of Toronto  Toronto Ontario Canada'], 'affiliations': [{'raw_affiliation_string': 'Department of Computer Science University of Toronto  Toronto Ontario Canada', 'institution_ids': ['https://openalex.org/I185261750']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5031152245', 'display_name': 'Alex Krizhevsky', 'orcid': None}, 'institutions': [{'id': 'https://openalex.org/I185261750', 'display_name': 'University of Toronto', 'ror': 'https://ror.org/03dbr7087', 'country_code': 'CA', 'type': 'education', 'lineage': ['https://openalex.org/I185261750']}], 'countries': ['CA'], 'is_corresponding': False, 'raw_author_name': 'Alex Krizhevsky', 'raw_affiliation_strings': ['Department of Computer Science University of Toronto  Toronto Ontario Canada'], 'affiliations': [{'raw_affiliation_string': 'Department of Computer Science University of Toronto  Toronto Ontario Canada', 'institution_ids': ['https://openalex.org/I185261750']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5006446297', 'display_name': 'Ilya Sutskever', 'orcid': None}, 'institutions': [{'id': 'https://openalex.org/I185261750', 'display_name': 'University of Toronto', 'ror': 'https://ror.org/03dbr7087', 'country_code': 'CA', 'type': 'education', 'lineage': ['https://openalex.org/I185261750']}], 'countries': ['CA'], 'is_corresponding': False, 'raw_author_name': 'Ilya Sutskever', 'raw_affiliation_strings': ['Department of Computer Science University of Toronto  Toronto Ontario Canada'], 'affiliations': [{'raw_affiliation_string': 'Department of Computer Science University of Toronto  Toronto Ontario Canada', 'institution_ids': ['https://openalex.org/I185261750']}]}, {'author_position': 'last', 'author': {'id': 'https://openalex.org/A5071983998', 'display_name': 'Ruslan Salakhutdinov', 'orcid': 'https://orcid.org/0000-0002-3752-2756'}, 'institutions': [{'id': 'https://openalex.org/I185261750', 'display_name': 'University of Toronto', 'ror': 'https://ror.org/03dbr7087', 'country_code': 'CA', 'type': 'education', 'lineage': ['https://openalex.org/I185261750']}], 'countries': ['CA'], 'is_corresponding': False, 'raw_author_name': 'Ruslan Salakhutdinov', 'raw_affiliation_strings': ['Department of Computer Science University of Toronto  Toronto Ontario Canada'], 'affiliations': [{'raw_affiliation_string': 'Department of Computer Science University of Toronto  Toronto Ontario Canada', 'institution_ids': ['https://openalex.org/I185261750']}]}], 'institution_assertions': [], 'countries_distinct_count': 1, 'institutions_distinct_count': 1, 'corresponding_author_ids': [], 'corresponding_institution_ids': [], 'apc_list': None, 'apc_paid': None, 'fwci': 1336.249, 'has_fulltext': False, 'cited_by_count': 33365, 'citation_normalized_percentile': {'value': 0.999969, 'is_in_top_1_percent': True, 'is_in_top_10_percent': True}, 'cited_by_percentile_year': {'min': 99, 'max': 100}, 'biblio': {'volume': '15', 'issue': '1', 'first_page': '1929', 'last_page': '1958'}, 'is_retracted': False, 'is_paratext': False, 'primary_topic': {'id': 'https://openalex.org/T12535', 'display_name': 'Machine Learning and Data Classification', 'score': 0.9994, 'subfield': {'id': 'https://openalex.org/subfields/1702', 'display_name': 'Artificial Intelligence'}, 'field': {'id': 'https://openalex.org/fields/17', 'display_name': 'Computer Science'}, 'domain': {'id': 'https://openalex.org/domains/3', 'display_name': 'Physical Sciences'}}, 'topics': [{'id': 'https://openalex.org/T12535', 'display_name': 'Machine Learning and Data Classification', 'score': 0.9994, 'subfield': {'id': 'https://openalex.org/subfields/1702', 'display_name': 'Artificial Intelligence'}, 'field': {'id': 'https://openalex.org/fields/17', 'display_name': 'Computer Science'}, 'domain': {'id': 'https://openalex.org/domains/3', 'display_name': 'Physical Sciences'}}, {'id': 'https://openalex.org/T12072', 'display_name': 'Machine Learning and Algorithms', 'score': 0.9984, 'subfield': {'id': 'https://openalex.org/subfields/1702', 'display_name': 'Artificial Intelligence'}, 'field': {'id': 'https://openalex.org/fields/17', 'display_name': 'Computer Science'}, 'domain': {'id': 'https://openalex.org/domains/3', 'display_name': 'Physical Sciences'}}, {'id': 'https://openalex.org/T10320', 'display_name': 'Neural Networks and Applications', 'score': 0.9969, 'subfield': {'id': 'https://openalex.org/subfields/1702', 'display_name': 'Artificial Intelligence'}, 'field': {'id': 'https://openalex.org/fields/17', 'display_name': 'Computer Science'}, 'domain': {'id': 'https://openalex.org/domains/3', 'display_name': 'Physical Sciences'}}], 'keywords': [{'id': 'https://openalex.org/keywords/overfitting', 'display_name': 'Overfitting', 'score': 0.970073}, {'id': 'https://openalex.org/keywords/dropout', 'display_name': 'Dropout (neural networks)', 'score': 0.90460396}, {'id': 'https://openalex.org/keywords/benchmark', 'display_name': 'Benchmark (surveying)', 'score': 0.5468679}, {'id': 'https://openalex.org/keywords/deep-neural-networks', 'display_name': 'Deep Neural Networks', 'score': 0.49621564}, {'id': 'https://openalex.org/keywords/regularization', 'display_name': 'Regularization', 'score': 0.4633584}], 'concepts': [{'id': 'https://openalex.org/C22019652', 'wikidata': 'https://www.wikidata.org/wiki/Q331309', 'display_name': 'Overfitting', 'level': 3, 'score': 0.970073}, {'id': 'https://openalex.org/C2776145597', 'wikidata': 'https://www.wikidata.org/wiki/Q25339462', 'display_name': 'Dropout (neural networks)', 'level': 2, 'score': 0.90460396}, {'id': 'https://openalex.org/C41008148', 'wikidata': 'https://www.wikidata.org/wiki/Q21198', 'display_name': 'Computer science', 'level': 0, 'score': 0.7200087}, {'id': 'https://openalex.org/C154945302', 'wikidata': 'https://www.wikidata.org/wiki/Q11660', 'display_name': 'Artificial intelligence', 'level': 1, 'score': 0.70027345}, {'id': 'https://openalex.org/C50644808', 'wikidata': 'https://www.wikidata.org/wiki/Q192776', 'display_name': 'Artificial neural network', 'level': 2, 'score': 0.6955675}, {'id': 'https://openalex.org/C119857082', 'wikidata': 'https://www.wikidata.org/wiki/Q2539', 'display_name': 'Machine learning', 'level': 1, 'score': 0.69543684}, {'id': 'https://openalex.org/C185798385', 'wikidata': 'https://www.wikidata.org/wiki/Q1161707', 'display_name': 'Benchmark (surveying)', 'level': 2, 'score': 0.5468679}, {'id': 'https://openalex.org/C2984842247', 'wikidata': 'https://www.wikidata.org/wiki/Q197536', 'display_name': 'Deep neural networks', 'level': 3, 'score': 0.49621564}, {'id': 'https://openalex.org/C2776135515', 'wikidata': 'https://www.wikidata.org/wiki/Q17143721', 'display_name': 'Regularization (linguistics)', 'level': 2, 'score': 0.4633584}, {'id': 'https://openalex.org/C13280743', 'wikidata': 'https://www.wikidata.org/wiki/Q131089', 'display_name': 'Geodesy', 'level': 1, 'score': 0.0}, {'id': 'https://openalex.org/C205649164', 'wikidata': 'https://www.wikidata.org/wiki/Q1071', 'display_name': 'Geography', 'level': 0, 'score': 0.0}], 'mesh': [], 'locations_count': 1, 'locations': [{'is_oa': False, 'landing_page_url': 'https://jmlr.csail.mit.edu/papers/volume15/srivastava14a/srivastava14a.pdf', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S118988714', 'display_name': 'Journal of Machine Learning Research', 'issn_l': '1532-4435', 'issn': ['1532-4435', '1533-7928'], 'is_oa': False, 'is_in_doaj': False, 'is_core': True, 'host_organization': 'https://openalex.org/P4310315718', 'host_organization_name': 'The MIT Press', 'host_organization_lineage': ['https://openalex.org/P4310315718'], 'host_organization_lineage_names': ['The MIT Press'], 'type': 'journal'}, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}], 'best_oa_location': None, 'sustainable_development_goals': [], 'grants': [], 'datasets': [], 'versions': [], 'referenced_works_count': 36, 'referenced_works': ['https://openalex.org/W137106866', 'https://openalex.org/W1492459858', 'https://openalex.org/W1524333225', 'https://openalex.org/W1567512734', 'https://openalex.org/W189596042', 'https://openalex.org/W1993882792', 'https://openalex.org/W2025768430', 'https://openalex.org/W2053229256', 'https://openalex.org/W2085040216', 'https://openalex.org/W2096873754', 'https://openalex.org/W2100495367', 'https://openalex.org/W2103359087', 'https://openalex.org/W2114296159', 'https://openalex.org/W2114733238', 'https://openalex.org/W2131241448', 'https://openalex.org/W2135046866', 'https://openalex.org/W2136922672', 'https://openalex.org/W2145094598', 'https://openalex.org/W2147800946', 'https://openalex.org/W2150717117', 'https://openalex.org/W2152722485', 'https://openalex.org/W2156163116', 'https://openalex.org/W2156297475', 'https://openalex.org/W2158542502', 'https://openalex.org/W2163605009', 'https://openalex.org/W2183112036', 'https://openalex.org/W2294059674', 'https://openalex.org/W2335728318', 'https://openalex.org/W2546302380', 'https://openalex.org/W2611675901', 'https://openalex.org/W2949821452', 'https://openalex.org/W2962820688', 'https://openalex.org/W2963574257', 'https://openalex.org/W2971788173', 'https://openalex.org/W3118608800', 'https://openalex.org/W35527955'], 'related_works': ['https://openalex.org/W3118608800', 'https://openalex.org/W2964308564', 'https://openalex.org/W2964121744', 'https://openalex.org/W2963446712', 'https://openalex.org/W2963403868', 'https://openalex.org/W2949117887', 'https://openalex.org/W2919115771', 'https://openalex.org/W2250539671', 'https://openalex.org/W2194775991', 'https://openalex.org/W2163605009', 'https://openalex.org/W2117539524', 'https://openalex.org/W2112796928', 'https://openalex.org/W2108598243', 'https://openalex.org/W2097117768', 'https://openalex.org/W2064675550', 'https://openalex.org/W1901129140', 'https://openalex.org/W1686810756', 'https://openalex.org/W1677182931', 'https://openalex.org/W1665214252', 'https://openalex.org/W1533861849'], 'abstract_inverted_index': {'Deep': [0], 'neural': [1, 46, 73, 146], 'nets': [2, 47], 'with': [3, 36, 68], 'a': [4, 18, 53, 118], 'large': [5, 45], 'number': [6, 91], 'of': [7, 42, 92, 106, 110, 145], 'parameters': [8], 'are': [9, 26], 'very': [10], 'powerful': [11], 'machine': [12], 'learning': [13, 150], 'systems.': [14], 'However,': [15], 'overfitting': [16, 37, 129], 'is': [17, 52, 62, 100], 'serious': [19], 'problem': [20], 'in': [21, 152], 'such': [22], 'networks.': [23, 95], 'Large': [24], 'networks': [25, 114, 147], 'also': [27], 'slow': [28], 'to': [29, 34, 63, 102], 'use,': [30], 'making': [31], 'it': [32, 99], 'difficult': [33], 'deal': [35], 'by': [38, 115], 'combining': [39], 'the': [40, 72, 104, 108, 143], 'predictions': [41, 109], 'many': [43, 165], 'different': [44, 93], 'at': [48], 'test': [49, 97], 'time.': [50], 'Dropout': [51], 'technique': [54], 'for': [55], 'addressing': [56], 'this': [57], 'problem.': [58], 'The': [59], 'key': [60], 'idea': [61], 'randomly': [64], 'drop': [65], 'units': [66, 79], '(along': [67], 'their': [69], 'connections)': [70], 'from': [71, 80, 88], 'network': [74, 121], 'during': [75], 'training.': [76], 'This': [77, 126], 'prevents': [78], 'co-adapting': [81], 'too': [82], 'much.': [83], 'During': [84], 'training,': [85], 'dropout': [86, 141], 'samples': [87], 'an': [89], 'exponential': [90], 'thinned': [113], 'At': [96], 'time,': [98], 'easy': [101], 'approximate': [103], 'effect': [105], 'averaging': [107], 'all': [111], 'these': [112], 'simply': [116], 'using': [117], 'single': [119], 'unthinned': [120], 'that': [122, 140], 'has': [123], 'smaller': [124], 'weights.': [125], 'significantly': [127], 'reduces': [128], 'and': [130, 158], 'gives': [131], 'major': [132], 'improvements': [133], 'over': [134], 'other': [135], 'regularization': [136], 'methods.': [137], 'We': [138], 'show': [139], 'improves': [142], 'performance': [144], 'on': [148, 164], 'supervised': [149], 'tasks': [151], 'vision,': [153], 'speech': [154], 'recognition,': [155], 'document': [156], 'classification': [157], 'computational': [159], 'biology,': [160], 'obtaining': [161], 'state-of-the-art': [162], 'results': [163], 'benchmark': [166], 'data': [167], 'sets.': [168]}, 'cited_by_api_url': 'https://api.openalex.org/works?filter=cites:W2095705004', 'counts_by_year': [{'year': 2024, 'cited_by_count': 1732}, {'year': 2023, 'cited_by_count': 2903}, {'year': 2022, 'cited_by_count': 3302}, {'year': 2021, 'cited_by_count': 5627}, {'year': 2020, 'cited_by_count': 5587}, {'year': 2019, 'cited_by_count': 5679}, {'year': 2018, 'cited_by_count': 4118}, {'year': 2017, 'cited_by_count': 2451}, {'year': 2016, 'cited_by_count': 1186}, {'year': 2015, 'cited_by_count': 375}, {'year': 2014, 'cited_by_count': 38}, {'year': 2013, 'cited_by_count': 3}], 'updated_date': '2024-12-20T17:35:30.930061', 'created_date': '2016-06-24'}
Publication Information

Basic Information

Access and Citation

AI Researcher Chatbot

Primary Location

Authors

Topics

Keywords

Related Works