Get quick answers to your questions about the article from our AI researcher chatbot
{'id': 'https://openalex.org/W3118514422', 'doi': 'https://doi.org/10.1002/gepi.22373', 'title': 'Unsupervised cluster analysis of SARS‐CoV‐2 genomes reflects its geographic progression and identifies distinct genetic subgroups of SARS‐CoV‐2 virus', 'display_name': 'Unsupervised cluster analysis of SARS‐CoV‐2 genomes reflects its geographic progression and identifies distinct genetic subgroups of SARS‐CoV‐2 virus', 'publication_year': 2021, 'publication_date': '2021-01-08', 'ids': {'openalex': 'https://openalex.org/W3118514422', 'doi': 'https://doi.org/10.1002/gepi.22373', 'mag': '3118514422', 'pmid': 'https://pubmed.ncbi.nlm.nih.gov/33415739', 'pmcid': 'https://www.ncbi.nlm.nih.gov/pmc/articles/8005425'}, 'language': 'en', 'primary_location': {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1002/gepi.22373', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S136352176', 'display_name': 'Genetic Epidemiology', 'issn_l': '0741-0395', 'issn': ['0741-0395', '1098-2272'], 'is_oa': False, 'is_in_doaj': False, 'is_core': True, 'host_organization': 'https://openalex.org/P4310320595', 'host_organization_name': 'Wiley', 'host_organization_lineage': ['https://openalex.org/P4310320595'], 'host_organization_lineage_names': ['Wiley'], 'type': 'journal'}, 'license': None, 'license_id': None, 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, 'type': 'article', 'type_crossref': 'journal-article', 'indexed_in': ['crossref', 'pubmed'], 'open_access': {'is_oa': True, 'oa_status': 'bronze', 'oa_url': 'https://doi.org/10.1002/gepi.22373', 'any_repository_has_fulltext': True}, 'authorships': [{'author_position': 'first', 'author': {'id': 'https://openalex.org/A5010215905', 'display_name': 'Georg Hahn', 'orcid': 'https://orcid.org/0000-0001-6008-2720'}, 'institutions': [{'id': 'https://openalex.org/I136199984', 'display_name': 'Harvard University', 'ror': 'https://ror.org/03vek6s52', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I136199984']}], 'countries': ['US'], 'is_corresponding': True, 'raw_author_name': 'Georg Hahn', 'raw_affiliation_strings': ['Department of Biostatistics, T.H. Chan School of Public Health, Harvard University, Boston, Massachusetts, USA'], 'affiliations': [{'raw_affiliation_string': 'Department of Biostatistics, T.H. Chan School of Public Health, Harvard University, Boston, Massachusetts, USA', 'institution_ids': ['https://openalex.org/I136199984']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5100434238', 'display_name': 'Sanghun Lee', 'orcid': 'https://orcid.org/0000-0002-0573-9555'}, 'institutions': [{'id': 'https://openalex.org/I136199984', 'display_name': 'Harvard University', 'ror': 'https://ror.org/03vek6s52', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I136199984']}, {'id': 'https://openalex.org/I89015989', 'display_name': 'Dankook University', 'ror': 'https://ror.org/058pdbn81', 'country_code': 'KR', 'type': 'education', 'lineage': ['https://openalex.org/I89015989']}], 'countries': ['KR', 'US'], 'is_corresponding': False, 'raw_author_name': 'Sanghun Lee', 'raw_affiliation_strings': ['Department of Biostatistics, T.H. Chan School of Public Health, Harvard University, Boston, Massachusetts, USA', 'Department of Medical Consilience, Graduate School, Dankook University, Yongin-si, South Korea'], 'affiliations': [{'raw_affiliation_string': 'Department of Biostatistics, T.H. Chan School of Public Health, Harvard University, Boston, Massachusetts, USA', 'institution_ids': ['https://openalex.org/I136199984']}, {'raw_affiliation_string': 'Department of Medical Consilience, Graduate School, Dankook University, Yongin-si, South Korea', 'institution_ids': ['https://openalex.org/I89015989']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5073763243', 'display_name': 'Scott T. Weiss', 'orcid': 'https://orcid.org/0000-0001-7196-303X'}, 'institutions': [{'id': 'https://openalex.org/I1283280774', 'display_name': "Brigham and Women's Hospital", 'ror': 'https://ror.org/04b6nzv94', 'country_code': 'US', 'type': 'healthcare', 'lineage': ['https://openalex.org/I1283280774', 'https://openalex.org/I48633490']}, {'id': 'https://openalex.org/I136199984', 'display_name': 'Harvard University', 'ror': 'https://ror.org/03vek6s52', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I136199984']}], 'countries': ['US'], 'is_corresponding': False, 'raw_author_name': 'Scott T. Weiss', 'raw_affiliation_strings': ["Channing Division of Network Medicine, Department of Medicine, Brigham and Women's Hospital, Harvard Medical School, Boston, Massachusetts, USA"], 'affiliations': [{'raw_affiliation_string': "Channing Division of Network Medicine, Department of Medicine, Brigham and Women's Hospital, Harvard Medical School, Boston, Massachusetts, USA", 'institution_ids': ['https://openalex.org/I1283280774', 'https://openalex.org/I136199984']}]}, {'author_position': 'last', 'author': {'id': 'https://openalex.org/A5002736890', 'display_name': 'Christoph Lange', 'orcid': 'https://orcid.org/0000-0003-2620-1030'}, 'institutions': [{'id': 'https://openalex.org/I136199984', 'display_name': 'Harvard University', 'ror': 'https://ror.org/03vek6s52', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I136199984']}], 'countries': ['US'], 'is_corresponding': False, 'raw_author_name': 'Christoph Lange', 'raw_affiliation_strings': ['Department of Biostatistics, T.H. Chan School of Public Health, Harvard University, Boston, Massachusetts, USA'], 'affiliations': [{'raw_affiliation_string': 'Department of Biostatistics, T.H. Chan School of Public Health, Harvard University, Boston, Massachusetts, USA', 'institution_ids': ['https://openalex.org/I136199984']}]}], 'countries_distinct_count': 2, 'institutions_distinct_count': 3, 'corresponding_author_ids': ['https://openalex.org/A5010215905'], 'corresponding_institution_ids': ['https://openalex.org/I136199984'], 'apc_list': {'value': 3760, 'currency': 'USD', 'value_usd': 3760, 'provenance': 'doaj'}, 'apc_paid': None, 'fwci': 0.407, 'has_fulltext': False, 'cited_by_count': 6, 'citation_normalized_percentile': {'value': 0.764003, 'is_in_top_1_percent': False, 'is_in_top_10_percent': False}, 'cited_by_percentile_year': {'min': 82, 'max': 84}, 'biblio': {'volume': '45', 'issue': '3', 'first_page': '316', 'last_page': '323'}, 'is_retracted': False, 'is_paratext': False, 'primary_topic': {'id': 'https://openalex.org/T10118', 'display_name': 'Coronavirus Disease 2019 Research', 'score': 1.0, 'subfield': {'id': 'https://openalex.org/subfields/2725', 'display_name': 'Infectious Diseases'}, 'field': {'id': 'https://openalex.org/fields/27', 'display_name': 'Medicine'}, 'domain': {'id': 'https://openalex.org/domains/4', 'display_name': 'Health Sciences'}}, 'topics': [{'id': 'https://openalex.org/T10118', 'display_name': 'Coronavirus Disease 2019 Research', 'score': 1.0, 'subfield': {'id': 'https://openalex.org/subfields/2725', 'display_name': 'Infectious Diseases'}, 'field': {'id': 'https://openalex.org/fields/27', 'display_name': 'Medicine'}, 'domain': {'id': 'https://openalex.org/domains/4', 'display_name': 'Health Sciences'}}, {'id': 'https://openalex.org/T11495', 'display_name': 'Viral Diseases in Livestock and Poultry', 'score': 0.9997, 'subfield': {'id': 'https://openalex.org/subfields/1103', 'display_name': 'Animal Science and Zoology'}, 'field': {'id': 'https://openalex.org/fields/11', 'display_name': 'Agricultural and Biological Sciences'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, {'id': 'https://openalex.org/T10976', 'display_name': 'Gastrointestinal Viral Infections and Vaccines Development', 'score': 0.9972, 'subfield': {'id': 'https://openalex.org/subfields/2725', 'display_name': 'Infectious Diseases'}, 'field': {'id': 'https://openalex.org/fields/27', 'display_name': 'Medicine'}, 'domain': {'id': 'https://openalex.org/domains/4', 'display_name': 'Health Sciences'}}], 'keywords': [{'id': 'https://openalex.org/keywords/genomic-sequencing', 'display_name': 'Genomic Sequencing', 'score': 0.470098}, {'id': 'https://openalex.org/keywords/coronavirus', 'display_name': 'Coronavirus', 'score': 0.45965853}, {'id': 'https://openalex.org/keywords/pandemic', 'display_name': 'Pandemic', 'score': 0.42016342}, {'id': 'https://openalex.org/keywords/jaccard-index', 'display_name': 'Jaccard index', 'score': 0.4149183}], 'concepts': [{'id': 'https://openalex.org/C141231307', 'wikidata': 'https://www.wikidata.org/wiki/Q7020', 'display_name': 'Genome', 'level': 3, 'score': 0.6924533}, {'id': 'https://openalex.org/C193252679', 'wikidata': 'https://www.wikidata.org/wiki/Q242125', 'display_name': 'Phylogenetic tree', 'level': 3, 'score': 0.6918687}, {'id': 'https://openalex.org/C86803240', 'wikidata': 'https://www.wikidata.org/wiki/Q420', 'display_name': 'Biology', 'level': 0, 'score': 0.57976454}, {'id': 'https://openalex.org/C54355233', 'wikidata': 'https://www.wikidata.org/wiki/Q7162', 'display_name': 'Genetics', 'level': 1, 'score': 0.49919558}, {'id': 'https://openalex.org/C2522874641', 'wikidata': 'https://www.wikidata.org/wiki/Q808', 'display_name': 'Virus', 'level': 2, 'score': 0.479165}, {'id': 'https://openalex.org/C2777648638', 'wikidata': 'https://www.wikidata.org/wiki/Q57751738', 'display_name': 'Coronavirus', 'level': 5, 'score': 0.45965853}, {'id': 'https://openalex.org/C70721500', 'wikidata': 'https://www.wikidata.org/wiki/Q177005', 'display_name': 'Computational biology', 'level': 1, 'score': 0.442489}, {'id': 'https://openalex.org/C3007834351', 'wikidata': 'https://www.wikidata.org/wiki/Q82069695', 'display_name': 'Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2)', 'level': 5, 'score': 0.43096104}, {'id': 'https://openalex.org/C89623803', 'wikidata': 'https://www.wikidata.org/wiki/Q12184', 'display_name': 'Pandemic', 'level': 5, 'score': 0.42016342}, {'id': 'https://openalex.org/C203519979', 'wikidata': 'https://www.wikidata.org/wiki/Q865360', 'display_name': 'Jaccard index', 'level': 3, 'score': 0.4149183}, {'id': 'https://openalex.org/C24432333', 'wikidata': 'https://www.wikidata.org/wiki/Q2068526', 'display_name': 'Whole genome sequencing', 'level': 4, 'score': 0.41320774}, {'id': 'https://openalex.org/C61053724', 'wikidata': 'https://www.wikidata.org/wiki/Q1154615', 'display_name': 'Sequence analysis', 'level': 3, 'score': 0.41206545}, {'id': 'https://openalex.org/C3008058167', 'wikidata': 'https://www.wikidata.org/wiki/Q84263196', 'display_name': 'Coronavirus disease 2019 (COVID-19)', 'level': 4, 'score': 0.28525743}, {'id': 'https://openalex.org/C73555534', 'wikidata': 'https://www.wikidata.org/wiki/Q622825', 'display_name': 'Cluster analysis', 'level': 2, 'score': 0.26252693}, {'id': 'https://openalex.org/C104317684', 'wikidata': 'https://www.wikidata.org/wiki/Q7187', 'display_name': 'Gene', 'level': 2, 'score': 0.1915395}, {'id': 'https://openalex.org/C41008148', 'wikidata': 'https://www.wikidata.org/wiki/Q21198', 'display_name': 'Computer science', 'level': 0, 'score': 0.14233932}, {'id': 'https://openalex.org/C71924100', 'wikidata': 'https://www.wikidata.org/wiki/Q11190', 'display_name': 'Medicine', 'level': 0, 'score': 0.09876162}, {'id': 'https://openalex.org/C2779134260', 'wikidata': 'https://www.wikidata.org/wiki/Q12136', 'display_name': 'Disease', 'level': 2, 'score': 0.0}, {'id': 'https://openalex.org/C142724271', 'wikidata': 'https://www.wikidata.org/wiki/Q7208', 'display_name': 'Pathology', 'level': 1, 'score': 0.0}, {'id': 'https://openalex.org/C524204448', 'wikidata': 'https://www.wikidata.org/wiki/Q788926', 'display_name': 'Infectious disease (medical specialty)', 'level': 3, 'score': 0.0}, {'id': 'https://openalex.org/C119857082', 'wikidata': 'https://www.wikidata.org/wiki/Q2539', 'display_name': 'Machine learning', 'level': 1, 'score': 0.0}], 'mesh': [{'descriptor_ui': 'D000086382', 'descriptor_name': 'COVID-19', 'qualifier_ui': 'Q000821', 'qualifier_name': 'virology', 'is_major_topic': True}, {'descriptor_ui': 'D016000', 'descriptor_name': 'Cluster Analysis', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': True}, {'descriptor_ui': 'D016679', 'descriptor_name': 'Genome, Viral', 'qualifier_ui': 'Q000235', 'qualifier_name': 'genetics', 'is_major_topic': True}, {'descriptor_ui': 'D062305', 'descriptor_name': 'Geographic Mapping', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': True}, {'descriptor_ui': 'D000086402', 'descriptor_name': 'SARS-CoV-2', 'qualifier_ui': 'Q000145', 'qualifier_name': 'classification', 'is_major_topic': True}, {'descriptor_ui': 'D000086402', 'descriptor_name': 'SARS-CoV-2', 'qualifier_ui': 'Q000235', 'qualifier_name': 'genetics', 'is_major_topic': True}, {'descriptor_ui': 'D000086382', 'descriptor_name': 'COVID-19', 'qualifier_ui': 'Q000453', 'qualifier_name': 'epidemiology', 'is_major_topic': False}, {'descriptor_ui': 'D000086382', 'descriptor_name': 'COVID-19', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D002681', 'descriptor_name': 'China', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D002681', 'descriptor_name': 'China', 'qualifier_ui': 'Q000453', 'qualifier_name': 'epidemiology', 'is_major_topic': False}, {'descriptor_ui': 'D030541', 'descriptor_name': 'Databases, Genetic', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D005060', 'descriptor_name': 'Europe', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D005060', 'descriptor_name': 'Europe', 'qualifier_ui': 'Q000453', 'qualifier_name': 'epidemiology', 'is_major_topic': False}, {'descriptor_ui': 'D016679', 'descriptor_name': 'Genome, Viral', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D006801', 'descriptor_name': 'Humans', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D017720', 'descriptor_name': 'Molecular Epidemiology', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D009656', 'descriptor_name': 'North America', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D009656', 'descriptor_name': 'North America', 'qualifier_ui': 'Q000453', 'qualifier_name': 'epidemiology', 'is_major_topic': False}, {'descriptor_ui': 'D058873', 'descriptor_name': 'Pandemics', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D010802', 'descriptor_name': 'Phylogeny', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D025341', 'descriptor_name': 'Principal Component Analysis', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D011379', 'descriptor_name': 'Prognosis', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D000086402', 'descriptor_name': 'SARS-CoV-2', 'qualifier_ui': 'Q000302', 'qualifier_name': 'isolation & purification', 'is_major_topic': False}, {'descriptor_ui': 'D000086402', 'descriptor_name': 'SARS-CoV-2', 'qualifier_ui': 'Q000472', 'qualifier_name': 'pathogenicity', 'is_major_topic': False}, {'descriptor_ui': 'D000086402', 'descriptor_name': 'SARS-CoV-2', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D062211', 'descriptor_name': 'Spatio-Temporal Analysis', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}], 'locations_count': 5, 'locations': [{'is_oa': True, 'landing_page_url': 'https://doi.org/10.1002/gepi.22373', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S136352176', 'display_name': 'Genetic Epidemiology', 'issn_l': '0741-0395', 'issn': ['0741-0395', '1098-2272'], 'is_oa': False, 'is_in_doaj': False, 'is_core': True, 'host_organization': 'https://openalex.org/P4310320595', 'host_organization_name': 'Wiley', 'host_organization_lineage': ['https://openalex.org/P4310320595'], 'host_organization_lineage_names': ['Wiley'], 'type': 'journal'}, 'license': None, 'license_id': None, 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, {'is_oa': True, 'landing_page_url': 'https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7337379', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S2764455111', 'display_name': 'PubMed Central', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I1299303238', 'host_organization_name': 'National Institutes of Health', 'host_organization_lineage': ['https://openalex.org/I1299303238'], 'host_organization_lineage_names': ['National Institutes of Health'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, {'is_oa': True, 'landing_page_url': 'https://www.ncbi.nlm.nih.gov/pmc/articles/PMC8005425', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S2764455111', 'display_name': 'PubMed Central', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I1299303238', 'host_organization_name': 'National Institutes of Health', 'host_organization_lineage': ['https://openalex.org/I1299303238'], 'host_organization_lineage_names': ['National Institutes of Health'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': 'acceptedVersion', 'is_accepted': True, 'is_published': False}, {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1101/2020.05.05.079061', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S4306402567', 'display_name': 'bioRxiv (Cold Spring Harbor Laboratory)', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I2750212522', 'host_organization_name': 'Cold Spring Harbor Laboratory', 'host_organization_lineage': ['https://openalex.org/I2750212522'], 'host_organization_lineage_names': ['Cold Spring Harbor Laboratory'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': 'submittedVersion', 'is_accepted': False, 'is_published': False}, {'is_oa': False, 'landing_page_url': 'https://pubmed.ncbi.nlm.nih.gov/33415739', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S4306525036', 'display_name': 'PubMed', 'issn_l': None, 'issn': None, 'is_oa': False, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I1299303238', 'host_organization_name': 'National Institutes of Health', 'host_organization_lineage': ['https://openalex.org/I1299303238'], 'host_organization_lineage_names': ['National Institutes of Health'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}], 'best_oa_location': {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1002/gepi.22373', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S136352176', 'display_name': 'Genetic Epidemiology', 'issn_l': '0741-0395', 'issn': ['0741-0395', '1098-2272'], 'is_oa': False, 'is_in_doaj': False, 'is_core': True, 'host_organization': 'https://openalex.org/P4310320595', 'host_organization_name': 'Wiley', 'host_organization_lineage': ['https://openalex.org/P4310320595'], 'host_organization_lineage_names': ['Wiley'], 'type': 'journal'}, 'license': None, 'license_id': None, 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, 'sustainable_development_goals': [{'id': 'https://metadata.un.org/sdg/3', 'display_name': 'Good health and well-being', 'score': 0.82}], 'grants': [{'funder': 'https://openalex.org/F4320337338', 'funder_display_name': 'National Heart, Lung, and Blood Institute', 'award_id': 'P01HL132825'}, {'funder': 'https://openalex.org/F4320337338', 'funder_display_name': 'National Heart, Lung, and Blood Institute', 'award_id': 'U01HL089897'}, {'funder': 'https://openalex.org/F4320337338', 'funder_display_name': 'National Heart, Lung, and Blood Institute', 'award_id': 'P01HL120839'}, {'funder': 'https://openalex.org/F4320337338', 'funder_display_name': 'National Heart, Lung, and Blood Institute', 'award_id': '2U01HG008685'}, {'funder': 'https://openalex.org/F4320337338', 'funder_display_name': 'National Heart, Lung, and Blood Institute', 'award_id': 'U01HL089856'}, {'funder': 'https://openalex.org/F4320337348', 'funder_display_name': 'National Human Genome Research Institute', 'award_id': 'R01HG008976'}], 'datasets': [], 'versions': [], 'referenced_works_count': 20, 'referenced_works': ['https://openalex.org/W1977601452', 'https://openalex.org/W2031611770', 'https://openalex.org/W2088080911', 'https://openalex.org/W2117756735', 'https://openalex.org/W2134250657', 'https://openalex.org/W2302778906', 'https://openalex.org/W2587970647', 'https://openalex.org/W2592682870', 'https://openalex.org/W2605343262', 'https://openalex.org/W2745750801', 'https://openalex.org/W2953965357', 'https://openalex.org/W3009885589', 'https://openalex.org/W3010135793', 'https://openalex.org/W3010667412', 'https://openalex.org/W3010860326', 'https://openalex.org/W3014941429', 'https://openalex.org/W3040012249', 'https://openalex.org/W3087003652', 'https://openalex.org/W3092541222', 'https://openalex.org/W4238606998'], 'related_works': ['https://openalex.org/W4254879869', 'https://openalex.org/W3127229356', 'https://openalex.org/W3022576529', 'https://openalex.org/W2913569734', 'https://openalex.org/W2628526247', 'https://openalex.org/W2596401011', 'https://openalex.org/W2391956478', 'https://openalex.org/W2294604808', 'https://openalex.org/W2087388313', 'https://openalex.org/W2000801317'], 'abstract_inverted_index': {'Over': [0], '10,000': [1], 'viral': [2], 'genome': [3, 21, 180], 'sequences': [4, 165], 'of': [5, 23, 49, 87, 97, 103, 106, 121, 161, 177, 188, 205, 248], 'the': [6, 14, 19, 24, 29, 41, 45, 54, 68, 84, 88, 94, 98, 117, 123, 142, 171, 178, 183, 189, 193, 202, 236, 246, 254], 'SARS-CoV-2virus': [7], 'have': [8], 'been': [9], 'made': [10], 'readily': [11], 'available': [12, 115], 'during': [13], 'ongoing': [15, 249], 'coronavirus': [16], 'pandemic': [17], 'since': [18], 'initial': [20], 'sequence': [22, 234], 'virus': [25, 99], 'was': [26], 'released': [27], 'on': [28, 36, 44, 93, 232], 'open': [30], 'access': [31], 'Virological': [32], 'website': [33], '(http://virological.org/)': [34], 'early': [35], 'January': [37], '11.': [38], 'We': [39, 90, 148, 227], 'utilize': [40, 135], 'published': [42], 'data': [43, 92, 181], 'single': [46], 'stranded': [47], 'RNAs': [48], '11,132': [50], 'SARS-CoV-2': [51, 63, 108, 163, 179, 237], 'patients': [52, 109], 'in': [53, 116, 199, 207, 214, 240], 'GISAID': [55, 118], 'database,': [56], 'which': [57, 75, 220], 'contains': [58], 'fully': [59], 'or': [60], 'partially': [61], 'sequenced': [62], 'samples': [64], 'from': [65, 192], 'laboratories': [66], 'around': [67], 'world.': [69], 'Among': [70], 'many': [71], 'important': [72], 'research': [73, 250], 'questions': [74], 'are': [76, 114], 'currently': [77], 'being': [78], 'investigated,': [79], 'one': [80], 'aspect': [81], 'pertains': [82], 'to': [83, 153, 201, 223, 251, 260], 'genetic': [85, 242, 255], 'characterization/classification': [86], 'virus.': [89], 'analyze': [91], 'nucleotide': [95, 164], 'sequencing': [96], 'and': [100, 130, 185, 209, 263], 'geographic': [101, 184], 'information': [102], 'a': [104, 136, 145, 154, 217], 'subset': [105], '7640': [107], 'without': [110], 'missing': [111], 'entries': [112], 'that': [113, 140, 157, 196], 'database.': [119], 'Instead': [120], 'modeling': [122], 'mutation': [124], 'rate,': [125], 'applying': [126], 'phylogenetic': [127, 218], 'tree': [128], 'approaches,': [129], 'so': [131], 'forth,': [132], 'we': [133, 221], 'here': [134], 'model-free': [137], 'clustering': [138], 'approach': [139], 'compares': [141, 158], 'viruses': [143, 238], 'at': [144, 166], 'genome-wide': [146], 'level.': [147], 'apply': [149], 'principal': [150], 'component': [151], 'analysis': [152, 175, 219], 'similarity': [155], 'matrix': [156], 'all': [159, 167], 'pairs': [160], 'these': [162], 'loci': [168], 'simultaneously,': [169], 'using': [170], 'Jaccard': [172], 'index.': [173], 'Our': [174], 'results': [176], 'illustrates': [182], 'chronological': [186], 'progression': [187], 'virus,': [190], 'starting': [191], 'first': [194], 'cases': [195, 206], 'were': [197], 'observed': [198], 'China': [200], 'current': [203], 'wave': [204], 'Europe': [208], 'North': [210], 'America.': [211], 'This': [212], 'is': [213, 245], 'line': [215], 'with': [216], 'use': [222], 'contrast': [224], 'our': [225], 'results.': [226], 'also': [228], 'observe': [229], 'that,': [230], 'based': [231], 'their': [233], 'data,': [235], 'cluster': [239], 'distinct': [241], 'subgroups.': [243], 'It': [244], 'subject': [247], 'examine': [252], 'whether': [253], 'subgroup': [256], 'could': [257], 'be': [258], 'related': [259], 'diseases': [261], 'outcome': [262], 'its': [264], 'potential': [265], 'implications': [266], 'for': [267], 'vaccine': [268], 'development.': [269]}, 'cited_by_api_url': 'https://api.openalex.org/works?filter=cites:W3118514422', 'counts_by_year': [{'year': 2023, 'cited_by_count': 1}, {'year': 2022, 'cited_by_count': 2}, {'year': 2021, 'cited_by_count': 3}], 'updated_date': '2024-09-13T15:36:45.640762', 'created_date': '2021-01-18'}