Get quick answers to your questions about the article from our AI researcher chatbot
{'id': 'https://openalex.org/W2969491951', 'doi': 'https://doi.org/10.1371/journal.pone.0221068', 'title': 'TreeCluster: Clustering biological sequences using phylogenetic trees', 'display_name': 'TreeCluster: Clustering biological sequences using phylogenetic trees', 'publication_year': 2019, 'publication_date': '2019-08-22', 'ids': {'openalex': 'https://openalex.org/W2969491951', 'doi': 'https://doi.org/10.1371/journal.pone.0221068', 'mag': '2969491951', 'pmid': 'https://pubmed.ncbi.nlm.nih.gov/31437182', 'pmcid': 'https://www.ncbi.nlm.nih.gov/pmc/articles/6705769'}, 'language': 'en', 'primary_location': {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1371/journal.pone.0221068', 'pdf_url': 'https://journals.plos.org/plosone/article/file?id=10.1371/journal.pone.0221068&type=printable', 'source': {'id': 'https://openalex.org/S202381698', 'display_name': 'PLoS ONE', 'issn_l': '1932-6203', 'issn': ['1932-6203'], 'is_oa': True, 'is_in_doaj': True, 'is_core': True, 'host_organization': 'https://openalex.org/P4310315706', 'host_organization_name': 'Public Library of Science', 'host_organization_lineage': ['https://openalex.org/P4310315706'], 'host_organization_lineage_names': ['Public Library of Science'], 'type': 'journal'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, 'type': 'article', 'type_crossref': 'journal-article', 'indexed_in': ['crossref', 'doaj', 'pubmed'], 'open_access': {'is_oa': True, 'oa_status': 'gold', 'oa_url': 'https://journals.plos.org/plosone/article/file?id=10.1371/journal.pone.0221068&type=printable', 'any_repository_has_fulltext': True}, 'authorships': [{'author_position': 'first', 'author': {'id': 'https://openalex.org/A5083364801', 'display_name': 'Metin Balaban', 'orcid': 'https://orcid.org/0000-0002-6947-5915'}, 'institutions': [{'id': 'https://openalex.org/I36258959', 'display_name': 'University of California, San Diego', 'ror': 'https://ror.org/0168r3w48', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I36258959']}], 'countries': ['US'], 'is_corresponding': False, 'raw_author_name': 'Metin Balaban', 'raw_affiliation_strings': ['Bioinformatics and Systems Biology Graduate Program, UC San Diego, La Jolla, CA 92093, United States of America'], 'affiliations': [{'raw_affiliation_string': 'Bioinformatics and Systems Biology Graduate Program, UC San Diego, La Jolla, CA 92093, United States of America', 'institution_ids': ['https://openalex.org/I36258959']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5008998282', 'display_name': 'Niema Moshiri', 'orcid': 'https://orcid.org/0000-0003-2209-8128'}, 'institutions': [{'id': 'https://openalex.org/I36258959', 'display_name': 'University of California, San Diego', 'ror': 'https://ror.org/0168r3w48', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I36258959']}], 'countries': ['US'], 'is_corresponding': False, 'raw_author_name': 'Niema Moshiri', 'raw_affiliation_strings': ['Bioinformatics and Systems Biology Graduate Program, UC San Diego, La Jolla, CA 92093, United States of America'], 'affiliations': [{'raw_affiliation_string': 'Bioinformatics and Systems Biology Graduate Program, UC San Diego, La Jolla, CA 92093, United States of America', 'institution_ids': ['https://openalex.org/I36258959']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5055114161', 'display_name': 'Uyen Mai', 'orcid': 'https://orcid.org/0000-0001-5065-2814'}, 'institutions': [{'id': 'https://openalex.org/I36258959', 'display_name': 'University of California, San Diego', 'ror': 'https://ror.org/0168r3w48', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I36258959']}], 'countries': ['US'], 'is_corresponding': False, 'raw_author_name': 'Uyen Mai', 'raw_affiliation_strings': ['Computer Science and Engineering, UC San Diego, La Jolla, CA 92093, United States of America'], 'affiliations': [{'raw_affiliation_string': 'Computer Science and Engineering, UC San Diego, La Jolla, CA 92093, United States of America', 'institution_ids': ['https://openalex.org/I36258959']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5045140563', 'display_name': 'Xingfan Jia', 'orcid': None}, 'institutions': [{'id': 'https://openalex.org/I36258959', 'display_name': 'University of California, San Diego', 'ror': 'https://ror.org/0168r3w48', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I36258959']}], 'countries': ['US'], 'is_corresponding': False, 'raw_author_name': 'Xingfan Jia', 'raw_affiliation_strings': ['Department of Mathematics, UC San Diego, La Jolla, CA 92093, United States of America'], 'affiliations': [{'raw_affiliation_string': 'Department of Mathematics, UC San Diego, La Jolla, CA 92093, United States of America', 'institution_ids': ['https://openalex.org/I36258959']}]}, {'author_position': 'last', 'author': {'id': 'https://openalex.org/A5087959579', 'display_name': 'Siavash Mirarab', 'orcid': 'https://orcid.org/0000-0001-5410-1518'}, 'institutions': [{'id': 'https://openalex.org/I36258959', 'display_name': 'University of California, San Diego', 'ror': 'https://ror.org/0168r3w48', 'country_code': 'US', 'type': 'education', 'lineage': ['https://openalex.org/I36258959']}], 'countries': ['US'], 'is_corresponding': True, 'raw_author_name': 'Siavash Mirarab', 'raw_affiliation_strings': ['Department of Electrical and Computer Engineering, UC San Diego, La Jolla, CA 92093, United States of America'], 'affiliations': [{'raw_affiliation_string': 'Department of Electrical and Computer Engineering, UC San Diego, La Jolla, CA 92093, United States of America', 'institution_ids': ['https://openalex.org/I36258959']}]}], 'countries_distinct_count': 1, 'institutions_distinct_count': 1, 'corresponding_author_ids': ['https://openalex.org/A5087959579'], 'corresponding_institution_ids': ['https://openalex.org/I36258959'], 'apc_list': {'value': 1805, 'currency': 'USD', 'value_usd': 1805, 'provenance': 'doaj'}, 'apc_paid': {'value': 1805, 'currency': 'USD', 'value_usd': 1805, 'provenance': 'doaj'}, 'fwci': 5.796, 'has_fulltext': True, 'fulltext_origin': 'pdf', 'cited_by_count': 123, 'citation_normalized_percentile': {'value': 0.999983, 'is_in_top_1_percent': True, 'is_in_top_10_percent': True}, 'cited_by_percentile_year': {'min': 98, 'max': 99}, 'biblio': {'volume': '14', 'issue': '8', 'first_page': 'e0221068', 'last_page': 'e0221068'}, 'is_retracted': False, 'is_paratext': False, 'primary_topic': {'id': 'https://openalex.org/T10015', 'display_name': 'RNA Sequencing Data Analysis', 'score': 0.9998, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, 'topics': [{'id': 'https://openalex.org/T10015', 'display_name': 'RNA Sequencing Data Analysis', 'score': 0.9998, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, {'id': 'https://openalex.org/T10012', 'display_name': 'Population Genetic Structure and Dynamics', 'score': 0.9781, 'subfield': {'id': 'https://openalex.org/subfields/1311', 'display_name': 'Genetics'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, {'id': 'https://openalex.org/T10066', 'display_name': 'Diversity and Function of Gut Microbiome', 'score': 0.9292, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}], 'keywords': [{'id': 'https://openalex.org/keywords/tree', 'display_name': 'Tree (set theory)', 'score': 0.6275351}, {'id': 'https://openalex.org/keywords/phylogenetic-tree', 'display_name': 'phylogenetic tree', 'score': 0.558889}, {'id': 'https://openalex.org/keywords/similarity', 'display_name': 'Similarity (geometry)', 'score': 0.55542654}, {'id': 'https://openalex.org/keywords/sequence-alignment', 'display_name': 'sequence alignment', 'score': 0.531727}, {'id': 'https://openalex.org/keywords/phylogenetic-analysis', 'display_name': 'Phylogenetic Analysis', 'score': 0.526982}, {'id': 'https://openalex.org/keywords/sequence', 'display_name': 'Sequence (biology)', 'score': 0.44972116}, {'id': 'https://openalex.org/keywords/computational-phylogenetics', 'display_name': 'Computational phylogenetics', 'score': 0.43941164}, {'id': 'https://openalex.org/keywords/multiple-sequence-alignment', 'display_name': 'Multiple sequence alignment', 'score': 0.4109585}], 'concepts': [{'id': 'https://openalex.org/C73555534', 'wikidata': 'https://www.wikidata.org/wiki/Q622825', 'display_name': 'Cluster analysis', 'level': 2, 'score': 0.82749355}, {'id': 'https://openalex.org/C193252679', 'wikidata': 'https://www.wikidata.org/wiki/Q242125', 'display_name': 'Phylogenetic tree', 'level': 3, 'score': 0.82324946}, {'id': 'https://openalex.org/C184898388', 'wikidata': 'https://www.wikidata.org/wiki/Q1435712', 'display_name': 'Pairwise comparison', 'level': 2, 'score': 0.7263388}, {'id': 'https://openalex.org/C113174947', 'wikidata': 'https://www.wikidata.org/wiki/Q2859736', 'display_name': 'Tree (set theory)', 'level': 2, 'score': 0.6275351}, {'id': 'https://openalex.org/C103278499', 'wikidata': 'https://www.wikidata.org/wiki/Q254465', 'display_name': 'Similarity (geometry)', 'level': 3, 'score': 0.55542654}, {'id': 'https://openalex.org/C41008148', 'wikidata': 'https://www.wikidata.org/wiki/Q21198', 'display_name': 'Computer science', 'level': 0, 'score': 0.5237367}, {'id': 'https://openalex.org/C2778112365', 'wikidata': 'https://www.wikidata.org/wiki/Q3511065', 'display_name': 'Sequence (biology)', 'level': 2, 'score': 0.44972116}, {'id': 'https://openalex.org/C41168302', 'wikidata': 'https://www.wikidata.org/wiki/Q3772859', 'display_name': 'Computational phylogenetics', 'level': 5, 'score': 0.43941164}, {'id': 'https://openalex.org/C45484198', 'wikidata': 'https://www.wikidata.org/wiki/Q827246', 'display_name': 'Sequence alignment', 'level': 4, 'score': 0.43881854}, {'id': 'https://openalex.org/C164866538', 'wikidata': 'https://www.wikidata.org/wiki/Q367351', 'display_name': 'Cluster (spacecraft)', 'level': 2, 'score': 0.42407563}, {'id': 'https://openalex.org/C2776214188', 'wikidata': 'https://www.wikidata.org/wiki/Q408386', 'display_name': 'Inference', 'level': 2, 'score': 0.41744822}, {'id': 'https://openalex.org/C26619641', 'wikidata': 'https://www.wikidata.org/wiki/Q3142246', 'display_name': 'Phylogenetic network', 'level': 4, 'score': 0.41447294}, {'id': 'https://openalex.org/C88031987', 'wikidata': 'https://www.wikidata.org/wiki/Q1377767', 'display_name': 'Multiple sequence alignment', 'level': 5, 'score': 0.4109585}, {'id': 'https://openalex.org/C70721500', 'wikidata': 'https://www.wikidata.org/wiki/Q177005', 'display_name': 'Computational biology', 'level': 1, 'score': 0.361238}, {'id': 'https://openalex.org/C124101348', 'wikidata': 'https://www.wikidata.org/wiki/Q172491', 'display_name': 'Data mining', 'level': 1, 'score': 0.34679145}, {'id': 'https://openalex.org/C86803240', 'wikidata': 'https://www.wikidata.org/wiki/Q420', 'display_name': 'Biology', 'level': 0, 'score': 0.34509236}, {'id': 'https://openalex.org/C33923547', 'wikidata': 'https://www.wikidata.org/wiki/Q395', 'display_name': 'Mathematics', 'level': 0, 'score': 0.2850331}, {'id': 'https://openalex.org/C154945302', 'wikidata': 'https://www.wikidata.org/wiki/Q11660', 'display_name': 'Artificial intelligence', 'level': 1, 'score': 0.27207065}, {'id': 'https://openalex.org/C114614502', 'wikidata': 'https://www.wikidata.org/wiki/Q76592', 'display_name': 'Combinatorics', 'level': 1, 'score': 0.27026802}, {'id': 'https://openalex.org/C54355233', 'wikidata': 'https://www.wikidata.org/wiki/Q7162', 'display_name': 'Genetics', 'level': 1, 'score': 0.14628711}, {'id': 'https://openalex.org/C167625842', 'wikidata': 'https://www.wikidata.org/wiki/Q899763', 'display_name': 'Peptide sequence', 'level': 3, 'score': 0.085427105}, {'id': 'https://openalex.org/C115961682', 'wikidata': 'https://www.wikidata.org/wiki/Q860623', 'display_name': 'Image (mathematics)', 'level': 2, 'score': 0.0}, {'id': 'https://openalex.org/C104317684', 'wikidata': 'https://www.wikidata.org/wiki/Q7187', 'display_name': 'Gene', 'level': 2, 'score': 0.0}, {'id': 'https://openalex.org/C199360897', 'wikidata': 'https://www.wikidata.org/wiki/Q9143', 'display_name': 'Programming language', 'level': 1, 'score': 0.0}], 'mesh': [{'descriptor_ui': 'D064307', 'descriptor_name': 'Microbiota', 'qualifier_ui': 'Q000235', 'qualifier_name': 'genetics', 'is_major_topic': True}, {'descriptor_ui': 'D016415', 'descriptor_name': 'Sequence Alignment', 'qualifier_ui': 'Q000706', 'qualifier_name': 'statistics & numerical data', 'is_major_topic': True}, {'descriptor_ui': 'D000465', 'descriptor_name': 'Algorithms', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D001483', 'descriptor_name': 'Base Sequence', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D016000', 'descriptor_name': 'Cluster Analysis', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D019295', 'descriptor_name': 'Computational Biology', 'qualifier_ui': 'Q000379', 'qualifier_name': 'methods', 'is_major_topic': False}, {'descriptor_ui': 'D006678', 'descriptor_name': 'HIV', 'qualifier_ui': 'Q000145', 'qualifier_name': 'classification', 'is_major_topic': False}, {'descriptor_ui': 'D015658', 'descriptor_name': 'HIV Infections', 'qualifier_ui': 'Q000453', 'qualifier_name': 'epidemiology', 'is_major_topic': False}, {'descriptor_ui': 'D006801', 'descriptor_name': 'Humans', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D010802', 'descriptor_name': 'Phylogeny', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D012984', 'descriptor_name': 'Software', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}], 'locations_count': 9, 'locations': [{'is_oa': True, 'landing_page_url': 'https://doi.org/10.1371/journal.pone.0221068', 'pdf_url': 'https://journals.plos.org/plosone/article/file?id=10.1371/journal.pone.0221068&type=printable', 'source': {'id': 'https://openalex.org/S202381698', 'display_name': 'PLoS ONE', 'issn_l': '1932-6203', 'issn': ['1932-6203'], 'is_oa': True, 'is_in_doaj': True, 'is_core': True, 'host_organization': 'https://openalex.org/P4310315706', 'host_organization_name': 'Public Library of Science', 'host_organization_lineage': ['https://openalex.org/P4310315706'], 'host_organization_lineage_names': ['Public Library of Science'], 'type': 'journal'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, {'is_oa': False, 'landing_page_url': 'https://doaj.org/article/63f7fd8299ac4724b7c004a928ee9044', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S4306401280', 'display_name': 'DOAJ (DOAJ: Directory of Open Access Journals)', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': None, 'host_organization_name': None, 'host_organization_lineage': [], 'host_organization_lineage_names': [], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}, {'is_oa': True, 'landing_page_url': 'https://europepmc.org/articles/pmc6705769', 'pdf_url': 'https://europepmc.org/articles/pmc6705769?pdf=render', 'source': {'id': 'https://openalex.org/S4306400806', 'display_name': 'Europe PMC (PubMed Central)', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I1303153112', 'host_organization_name': 'European Bioinformatics Institute', 'host_organization_lineage': ['https://openalex.org/I1303153112'], 'host_organization_lineage_names': ['European Bioinformatics Institute'], 'type': 'repository'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, {'is_oa': True, 'landing_page_url': 'https://escholarship.org/uc/item/1cr5c0zg', 'pdf_url': 'https://escholarship.org/content/qt1cr5c0zg/qt1cr5c0zg.pdf?t=qmh0tm', 'source': {'id': 'https://openalex.org/S4306400115', 'display_name': 'eScholarship (California Digital Library)', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I2801248553', 'host_organization_name': 'California Digital Library', 'host_organization_lineage': ['https://openalex.org/I2801248553'], 'host_organization_lineage_names': ['California Digital Library'], 'type': 'repository'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, {'is_oa': True, 'landing_page_url': 'https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6705769', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S2764455111', 'display_name': 'PubMed Central', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I1299303238', 'host_organization_name': 'National Institutes of Health', 'host_organization_lineage': ['https://openalex.org/I1299303238'], 'host_organization_lineage_names': ['National Institutes of Health'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1101/261354', 'pdf_url': 'https://www.biorxiv.org/content/biorxiv/early/2018/02/21/261354.full.pdf', 'source': None, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'submittedVersion', 'is_accepted': False, 'is_published': False}, {'is_oa': True, 'landing_page_url': 'https://figshare.com/articles/dataset/TreeCluster_Clustering_biological_sequences_using_phylogenetic_trees/9718997', 'pdf_url': 'https://figshare.com/ndownloader/files/17408555', 'source': {'id': 'https://openalex.org/S4306400572', 'display_name': 'OPAL (Open@LaTrobe) (La Trobe University)', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I196829312', 'host_organization_name': 'La Trobe University', 'host_organization_lineage': ['https://openalex.org/I196829312'], 'host_organization_lineage_names': ['La Trobe University'], 'type': 'repository'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'submittedVersion', 'is_accepted': False, 'is_published': False}, {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1101/591388', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S4306402567', 'display_name': 'bioRxiv (Cold Spring Harbor Laboratory)', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I2750212522', 'host_organization_name': 'Cold Spring Harbor Laboratory', 'host_organization_lineage': ['https://openalex.org/I2750212522'], 'host_organization_lineage_names': ['Cold Spring Harbor Laboratory'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': 'submittedVersion', 'is_accepted': False, 'is_published': False}, {'is_oa': False, 'landing_page_url': 'https://pubmed.ncbi.nlm.nih.gov/31437182', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S4306525036', 'display_name': 'PubMed', 'issn_l': None, 'issn': None, 'is_oa': False, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I1299303238', 'host_organization_name': 'National Institutes of Health', 'host_organization_lineage': ['https://openalex.org/I1299303238'], 'host_organization_lineage_names': ['National Institutes of Health'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}], 'best_oa_location': {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1371/journal.pone.0221068', 'pdf_url': 'https://journals.plos.org/plosone/article/file?id=10.1371/journal.pone.0221068&type=printable', 'source': {'id': 'https://openalex.org/S202381698', 'display_name': 'PLoS ONE', 'issn_l': '1932-6203', 'issn': ['1932-6203'], 'is_oa': True, 'is_in_doaj': True, 'is_core': True, 'host_organization': 'https://openalex.org/P4310315706', 'host_organization_name': 'Public Library of Science', 'host_organization_lineage': ['https://openalex.org/P4310315706'], 'host_organization_lineage_names': ['Public Library of Science'], 'type': 'journal'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, 'sustainable_development_goals': [], 'grants': [], 'datasets': [], 'versions': [], 'referenced_works_count': 60, 'referenced_works': ['https://openalex.org/W1593676244', 'https://openalex.org/W1748508858', 'https://openalex.org/W1982447955', 'https://openalex.org/W1987526988', 'https://openalex.org/W1988925586', 'https://openalex.org/W2007668764', 'https://openalex.org/W2008856488', 'https://openalex.org/W2010981336', 'https://openalex.org/W2031611770', 'https://openalex.org/W2032678548', 'https://openalex.org/W2034285706', 'https://openalex.org/W2036509718', 'https://openalex.org/W2036862358', 'https://openalex.org/W2052857100', 'https://openalex.org/W2053400346', 'https://openalex.org/W2056251063', 'https://openalex.org/W2063273460', 'https://openalex.org/W2088481129', 'https://openalex.org/W2113434524', 'https://openalex.org/W2119284380', 'https://openalex.org/W2119362018', 'https://openalex.org/W2124166542', 'https://openalex.org/W2124351063', 'https://openalex.org/W2124493654', 'https://openalex.org/W2127504354', 'https://openalex.org/W2137597742', 'https://openalex.org/W2140638310', 'https://openalex.org/W2140890018', 'https://openalex.org/W2141052558', 'https://openalex.org/W2141669774', 'https://openalex.org/W2142802314', 'https://openalex.org/W2144775551', 'https://openalex.org/W2147461064', 'https://openalex.org/W2154730959', 'https://openalex.org/W2156125289', 'https://openalex.org/W2156619206', 'https://openalex.org/W2159638180', 'https://openalex.org/W2162315106', 'https://openalex.org/W2164842493', 'https://openalex.org/W2327639708', 'https://openalex.org/W2340423564', 'https://openalex.org/W2401404581', 'https://openalex.org/W2538509698', 'https://openalex.org/W2593591803', 'https://openalex.org/W2743986353', 'https://openalex.org/W2753968175', 'https://openalex.org/W2766813858', 'https://openalex.org/W2793085614', 'https://openalex.org/W2811244727', 'https://openalex.org/W2884242568', 'https://openalex.org/W2892206041', 'https://openalex.org/W2899210784', 'https://openalex.org/W2949210352', 'https://openalex.org/W2950954328', 'https://openalex.org/W2951878836', 'https://openalex.org/W3009335848', 'https://openalex.org/W3100709263', 'https://openalex.org/W3145289798', 'https://openalex.org/W4231579661', 'https://openalex.org/W4241328656'], 'related_works': ['https://openalex.org/W4389053053', 'https://openalex.org/W4253346505', 'https://openalex.org/W4248019281', 'https://openalex.org/W3113335767', 'https://openalex.org/W2903170547', 'https://openalex.org/W2739032002', 'https://openalex.org/W2588883198', 'https://openalex.org/W2194132979', 'https://openalex.org/W2079145549', 'https://openalex.org/W2064153754'], 'abstract_inverted_index': {'Clustering': [0], 'homologous': [1], 'sequences': [2, 19], 'based': [3], 'on': [4, 57, 100, 175], 'their': [5, 26, 101], 'similarity': [6], 'is': [7, 21, 73, 214], 'a': [8, 38, 51, 77, 168], 'problem': [9], 'that': [10, 18, 70, 94, 136], 'appears': [11], 'in': [12, 36, 64, 134, 157, 167], 'many': [13], 'bioinformatics': [14], 'applications.': [15, 212], 'The': [16], 'fact': [17], 'cluster': [20], 'ultimately': [22], 'the': [23, 33, 88, 110, 116, 140, 143, 149, 152, 158, 208], 'result': [24], 'of': [25, 45, 79, 91, 112, 118, 125, 142, 148, 210], 'phylogenetic': [27, 52, 66], 'relationships.': [28], 'Despite': [29], 'this': [30], 'observation': [31], 'and': [32, 54, 145, 186, 206], 'natural': [34], 'ways': [35], 'which': [37, 172], 'tree': [39, 53], 'can': [40, 131], 'define': [41, 76], 'clusters,': [42], 'most': [43], 'applications': [44], 'sequence': [46, 59, 189], 'clustering': [47, 72, 179], 'do': [48], 'not': [49], 'use': [50], 'instead': [55], 'operate': [56], 'pairwise': [58, 126], 'distances.': [60, 127], 'Due': [61], 'to': [62, 98], 'advances': [63], 'large-scale': [65], 'inference,': [67], 'we': [68, 173], 'argue': [69], 'tree-based': [71, 196], 'under-utilized.': [74], 'We': [75, 103, 163, 191], 'family': [78], 'optimization': [80], 'problems': [81, 130], 'that,': [82, 193], 'given': [83], 'an': [84], 'arbitrary': [85], 'tree,': [86, 144], 'return': [87], 'minimum': [89], 'number': [90], 'clusters': [92, 96, 203], 'such': [93], 'all': [95], 'adhere': [97], 'constraints': [99], 'heterogeneity.': [102], 'study': [104], 'three': [105, 129, 150, 176], 'specific': [106], 'constraints,': [107], 'limiting': [108], '(1)': [109], 'diameter': [111], 'each': [113], 'cluster,': [114], '(2)': [115], 'sum': [117], 'its': [119], 'branch': [120], 'lengths,': [121], 'or': [122], '(3)': [123], 'chains': [124], 'These': [128], 'be': [132], 'solved': [133], 'time': [135], 'increases': [137], 'linearly': [138], 'with': [139], 'size': [141], 'for': [146, 180], 'two': [147], 'criteria,': [151], 'algorithms': [153, 166], 'have': [154], 'been': [155], 'known': [156], 'theoretical': [159], 'computer': [160], 'scientist': [161], 'literature.': [162], 'implement': [164], 'these': [165], 'tool': [169], 'called': [170], 'TreeCluster,': [171], 'test': [174], 'applications:': [177], 'OTU': [178], 'microbiome': [181], 'data,': [182], 'HIV': [183], 'transmission': [184], 'clustering,': [185], 'divide-and-conquer': [187], 'multiple': [188], 'alignment.': [190], 'show': [192], 'by': [194], 'using': [195], 'distances,': [197], 'TreeCluster': [198, 213], 'generates': [199], 'more': [200], 'internally': [201], 'consistent': [202], 'than': [204], 'alternatives': [205], 'improves': [207], 'effectiveness': [209], 'downstream': [211], 'available': [215], 'at': [216], 'https://github.com/niemasd/TreeCluster.': [217]}, 'cited_by_api_url': 'https://api.openalex.org/works?filter=cites:W2969491951', 'counts_by_year': [{'year': 2024, 'cited_by_count': 25}, {'year': 2023, 'cited_by_count': 24}, {'year': 2022, 'cited_by_count': 33}, {'year': 2021, 'cited_by_count': 24}, {'year': 2020, 'cited_by_count': 14}, {'year': 2019, 'cited_by_count': 2}], 'updated_date': '2024-09-13T14:37:16.131791', 'created_date': '2019-08-29'}