Get quick answers to your questions about the article from our AI researcher chatbot
{'id': 'https://openalex.org/W2054254276', 'doi': 'https://doi.org/10.1186/1471-2105-9-18', 'title': 'LTRharvest, an efficient and flexible software for de novo detection of LTR retrotransposons', 'display_name': 'LTRharvest, an efficient and flexible software for de novo detection of LTR retrotransposons', 'publication_year': 2008, 'publication_date': '2008-01-14', 'ids': {'openalex': 'https://openalex.org/W2054254276', 'doi': 'https://doi.org/10.1186/1471-2105-9-18', 'mag': '2054254276', 'pmid': 'https://pubmed.ncbi.nlm.nih.gov/18194517', 'pmcid': 'https://www.ncbi.nlm.nih.gov/pmc/articles/2253517'}, 'language': 'en', 'primary_location': {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1186/1471-2105-9-18', 'pdf_url': 'https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-18', 'source': {'id': 'https://openalex.org/S19032547', 'display_name': 'BMC Bioinformatics', 'issn_l': '1471-2105', 'issn': ['1471-2105'], 'is_oa': True, 'is_in_doaj': True, 'is_core': True, 'host_organization': 'https://openalex.org/P4310320256', 'host_organization_name': 'BioMed Central', 'host_organization_lineage': ['https://openalex.org/P4310319965', 'https://openalex.org/P4310320256'], 'host_organization_lineage_names': ['Springer Nature', 'BioMed Central'], 'type': 'journal'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, 'type': 'article', 'type_crossref': 'journal-article', 'indexed_in': ['crossref', 'pubmed'], 'open_access': {'is_oa': True, 'oa_status': 'gold', 'oa_url': 'https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-18', 'any_repository_has_fulltext': True}, 'authorships': [{'author_position': 'first', 'author': {'id': 'https://openalex.org/A5012331187', 'display_name': 'David Ellinghaus', 'orcid': 'https://orcid.org/0000-0002-4332-6110'}, 'institutions': [{'id': 'https://openalex.org/I159176309', 'display_name': 'Universität Hamburg', 'ror': 'https://ror.org/00g30e956', 'country_code': 'DE', 'type': 'education', 'lineage': ['https://openalex.org/I159176309']}], 'countries': ['DE'], 'is_corresponding': False, 'raw_author_name': 'David Ellinghaus', 'raw_affiliation_strings': ['ZBH - Center for Bioinformatics, University of Hamburg , Bundesstrasse 43, 20146 Hamburg, Germany.'], 'affiliations': [{'raw_affiliation_string': 'ZBH - Center for Bioinformatics, University of Hamburg , Bundesstrasse 43, 20146 Hamburg, Germany.', 'institution_ids': ['https://openalex.org/I159176309']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5060071039', 'display_name': 'Stefan Kurtz', 'orcid': 'https://orcid.org/0000-0001-5783-0054'}, 'institutions': [{'id': 'https://openalex.org/I159176309', 'display_name': 'Universität Hamburg', 'ror': 'https://ror.org/00g30e956', 'country_code': 'DE', 'type': 'education', 'lineage': ['https://openalex.org/I159176309']}], 'countries': ['DE'], 'is_corresponding': False, 'raw_author_name': 'Stefan Kurtz', 'raw_affiliation_strings': ['ZBH Center for Bioinformatics, University of Hamburg, Hamburg, Germany'], 'affiliations': [{'raw_affiliation_string': 'ZBH Center for Bioinformatics, University of Hamburg, Hamburg, Germany', 'institution_ids': ['https://openalex.org/I159176309']}]}, {'author_position': 'last', 'author': {'id': 'https://openalex.org/A5064136361', 'display_name': 'Ute Willhoeft', 'orcid': 'https://orcid.org/0000-0003-3313-2125'}, 'institutions': [{'id': 'https://openalex.org/I159176309', 'display_name': 'Universität Hamburg', 'ror': 'https://ror.org/00g30e956', 'country_code': 'DE', 'type': 'education', 'lineage': ['https://openalex.org/I159176309']}], 'countries': ['DE'], 'is_corresponding': False, 'raw_author_name': 'Ute Willhoeft', 'raw_affiliation_strings': ['ZBH Center for Bioinformatics, University of Hamburg, Hamburg, Germany'], 'affiliations': [{'raw_affiliation_string': 'ZBH Center for Bioinformatics, University of Hamburg, Hamburg, Germany', 'institution_ids': ['https://openalex.org/I159176309']}]}], 'institution_assertions': [], 'countries_distinct_count': 1, 'institutions_distinct_count': 1, 'corresponding_author_ids': [], 'corresponding_institution_ids': [], 'apc_list': {'value': 1690, 'currency': 'GBP', 'value_usd': 2072, 'provenance': 'doaj'}, 'apc_paid': {'value': 1690, 'currency': 'GBP', 'value_usd': 2072, 'provenance': 'doaj'}, 'fwci': 8.772, 'has_fulltext': True, 'fulltext_origin': 'pdf', 'cited_by_count': 1297, 'citation_normalized_percentile': {'value': 0.95469, 'is_in_top_1_percent': False, 'is_in_top_10_percent': True}, 'cited_by_percentile_year': {'min': 99, 'max': 100}, 'biblio': {'volume': '9', 'issue': '1', 'first_page': None, 'last_page': None}, 'is_retracted': False, 'is_paratext': False, 'primary_topic': {'id': 'https://openalex.org/T10434', 'display_name': 'Chromosomal and Genetic Variations', 'score': 0.9997, 'subfield': {'id': 'https://openalex.org/subfields/1110', 'display_name': 'Plant Science'}, 'field': {'id': 'https://openalex.org/fields/11', 'display_name': 'Agricultural and Biological Sciences'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, 'topics': [{'id': 'https://openalex.org/T10434', 'display_name': 'Chromosomal and Genetic Variations', 'score': 0.9997, 'subfield': {'id': 'https://openalex.org/subfields/1110', 'display_name': 'Plant Science'}, 'field': {'id': 'https://openalex.org/fields/11', 'display_name': 'Agricultural and Biological Sciences'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, {'id': 'https://openalex.org/T10015', 'display_name': 'Genomics and Phylogenetic Studies', 'score': 0.9983, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, {'id': 'https://openalex.org/T10521', 'display_name': 'RNA and protein synthesis mechanisms', 'score': 0.9893, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}], 'keywords': [{'id': 'https://openalex.org/keywords/retrotransposon', 'display_name': 'Retrotransposon', 'score': 0.852466}], 'concepts': [{'id': 'https://openalex.org/C7029365', 'wikidata': 'https://www.wikidata.org/wiki/Q413988', 'display_name': 'Retrotransposon', 'level': 5, 'score': 0.852466}, {'id': 'https://openalex.org/C4918238', 'wikidata': 'https://www.wikidata.org/wiki/Q121438', 'display_name': 'Transposable element', 'level': 4, 'score': 0.72094345}, {'id': 'https://openalex.org/C141231307', 'wikidata': 'https://www.wikidata.org/wiki/Q7020', 'display_name': 'Genome', 'level': 3, 'score': 0.6467511}, {'id': 'https://openalex.org/C86803240', 'wikidata': 'https://www.wikidata.org/wiki/Q420', 'display_name': 'Biology', 'level': 0, 'score': 0.6166103}, {'id': 'https://openalex.org/C2776321320', 'wikidata': 'https://www.wikidata.org/wiki/Q857525', 'display_name': 'Annotation', 'level': 2, 'score': 0.56708854}, {'id': 'https://openalex.org/C70721500', 'wikidata': 'https://www.wikidata.org/wiki/Q177005', 'display_name': 'Computational biology', 'level': 1, 'score': 0.5564085}, {'id': 'https://openalex.org/C199491388', 'wikidata': 'https://www.wikidata.org/wiki/Q1869477', 'display_name': 'Long terminal repeat', 'level': 4, 'score': 0.48490816}, {'id': 'https://openalex.org/C54355233', 'wikidata': 'https://www.wikidata.org/wiki/Q7162', 'display_name': 'Genetics', 'level': 1, 'score': 0.46879348}, {'id': 'https://openalex.org/C41008148', 'wikidata': 'https://www.wikidata.org/wiki/Q21198', 'display_name': 'Computer science', 'level': 0, 'score': 0.42356303}, {'id': 'https://openalex.org/C2777904410', 'wikidata': 'https://www.wikidata.org/wiki/Q7397', 'display_name': 'Software', 'level': 2, 'score': 0.42228663}, {'id': 'https://openalex.org/C104317684', 'wikidata': 'https://www.wikidata.org/wiki/Q7187', 'display_name': 'Gene', 'level': 2, 'score': 0.20849523}, {'id': 'https://openalex.org/C199360897', 'wikidata': 'https://www.wikidata.org/wiki/Q9143', 'display_name': 'Programming language', 'level': 1, 'score': 0.08678174}], 'mesh': [{'descriptor_ui': 'D000465', 'descriptor_name': 'Algorithms', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': True}, {'descriptor_ui': 'D002874', 'descriptor_name': 'Chromosome Mapping', 'qualifier_ui': 'Q000379', 'qualifier_name': 'methods', 'is_major_topic': True}, {'descriptor_ui': 'D018626', 'descriptor_name': 'Retroelements', 'qualifier_ui': 'Q000235', 'qualifier_name': 'genetics', 'is_major_topic': True}, {'descriptor_ui': 'D016415', 'descriptor_name': 'Sequence Alignment', 'qualifier_ui': 'Q000379', 'qualifier_name': 'methods', 'is_major_topic': True}, {'descriptor_ui': 'D017422', 'descriptor_name': 'Sequence Analysis, DNA', 'qualifier_ui': 'Q000379', 'qualifier_name': 'methods', 'is_major_topic': True}, {'descriptor_ui': 'D012984', 'descriptor_name': 'Software', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': True}, {'descriptor_ui': 'D001483', 'descriptor_name': 'Base Sequence', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D002874', 'descriptor_name': 'Chromosome Mapping', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D008969', 'descriptor_name': 'Molecular Sequence Data', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D011381', 'descriptor_name': 'Programming Languages', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D018626', 'descriptor_name': 'Retroelements', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D016415', 'descriptor_name': 'Sequence Alignment', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}, {'descriptor_ui': 'D017422', 'descriptor_name': 'Sequence Analysis, DNA', 'qualifier_ui': '', 'qualifier_name': None, 'is_major_topic': False}], 'locations_count': 3, 'locations': [{'is_oa': True, 'landing_page_url': 'https://doi.org/10.1186/1471-2105-9-18', 'pdf_url': 'https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-18', 'source': {'id': 'https://openalex.org/S19032547', 'display_name': 'BMC Bioinformatics', 'issn_l': '1471-2105', 'issn': ['1471-2105'], 'is_oa': True, 'is_in_doaj': True, 'is_core': True, 'host_organization': 'https://openalex.org/P4310320256', 'host_organization_name': 'BioMed Central', 'host_organization_lineage': ['https://openalex.org/P4310319965', 'https://openalex.org/P4310320256'], 'host_organization_lineage_names': ['Springer Nature', 'BioMed Central'], 'type': 'journal'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, {'is_oa': True, 'landing_page_url': 'https://www.ncbi.nlm.nih.gov/pmc/articles/PMC2253517', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S2764455111', 'display_name': 'PubMed Central', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I1299303238', 'host_organization_name': 'National Institutes of Health', 'host_organization_lineage': ['https://openalex.org/I1299303238'], 'host_organization_lineage_names': ['National Institutes of Health'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, {'is_oa': False, 'landing_page_url': 'https://pubmed.ncbi.nlm.nih.gov/18194517', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S4306525036', 'display_name': 'PubMed', 'issn_l': None, 'issn': None, 'is_oa': False, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I1299303238', 'host_organization_name': 'National Institutes of Health', 'host_organization_lineage': ['https://openalex.org/I1299303238'], 'host_organization_lineage_names': ['National Institutes of Health'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}], 'best_oa_location': {'is_oa': True, 'landing_page_url': 'https://doi.org/10.1186/1471-2105-9-18', 'pdf_url': 'https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-18', 'source': {'id': 'https://openalex.org/S19032547', 'display_name': 'BMC Bioinformatics', 'issn_l': '1471-2105', 'issn': ['1471-2105'], 'is_oa': True, 'is_in_doaj': True, 'is_core': True, 'host_organization': 'https://openalex.org/P4310320256', 'host_organization_name': 'BioMed Central', 'host_organization_lineage': ['https://openalex.org/P4310319965', 'https://openalex.org/P4310320256'], 'host_organization_lineage_names': ['Springer Nature', 'BioMed Central'], 'type': 'journal'}, 'license': 'cc-by', 'license_id': 'https://openalex.org/licenses/cc-by', 'version': 'publishedVersion', 'is_accepted': True, 'is_published': True}, 'sustainable_development_goals': [{'score': 0.58, 'id': 'https://metadata.un.org/sdg/9', 'display_name': 'Industry, innovation and infrastructure'}], 'grants': [], 'datasets': [], 'versions': [], 'referenced_works_count': 26, 'referenced_works': ['https://openalex.org/W1953861638', 'https://openalex.org/W1963918196', 'https://openalex.org/W1966585515', 'https://openalex.org/W2011632873', 'https://openalex.org/W2040386650', 'https://openalex.org/W2055043387', 'https://openalex.org/W2055666215', 'https://openalex.org/W2070797653', 'https://openalex.org/W2082330286', 'https://openalex.org/W2085708372', 'https://openalex.org/W2097937009', 'https://openalex.org/W2108031629', 'https://openalex.org/W2109289454', 'https://openalex.org/W2122774081', 'https://openalex.org/W2122954888', 'https://openalex.org/W2124281279', 'https://openalex.org/W2127384606', 'https://openalex.org/W2133767259', 'https://openalex.org/W2134283755', 'https://openalex.org/W2146055754', 'https://openalex.org/W2151464048', 'https://openalex.org/W2151899848', 'https://openalex.org/W2158874082', 'https://openalex.org/W2162216089', 'https://openalex.org/W2163960662', 'https://openalex.org/W2168909179'], 'related_works': ['https://openalex.org/W3145616024', 'https://openalex.org/W2955897131', 'https://openalex.org/W2402665505', 'https://openalex.org/W2375807013', 'https://openalex.org/W2089350008', 'https://openalex.org/W2064967612', 'https://openalex.org/W2054036000', 'https://openalex.org/W2019364734', 'https://openalex.org/W2004644512', 'https://openalex.org/W113856995'], 'abstract_inverted_index': {'Transposable': [0], 'elements': [1], 'are': [2, 27, 34, 65], 'abundant': [3], 'in': [4, 94, 186, 224], 'eukaryotic': [5, 30], 'genomes': [6], 'and': [7, 22, 113, 129, 139, 141, 145, 194, 239, 242, 261, 263], 'it': [8], 'is': [9, 47, 149, 168, 203], 'believed': [10], 'that': [11], 'they': [12, 72], 'have': [13, 78], 'a': [14, 48, 80, 122, 133, 229, 247], 'significant': [15], 'impact': [16], 'on': [17, 105, 228], 'the': [18, 85, 192, 220, 258, 264], 'evolution': [19], 'of': [20, 42, 54, 62, 89, 119, 135, 143, 163, 212, 235, 281], 'gene': [21], 'chromosome': [23, 223], 'structure.': [24], 'While': [25], 'there': [26, 33, 46], 'several': [28], 'completed': [29], 'genome': [31, 39, 181], 'projects,': [32, 182], 'only': [35], 'few': [36], 'high': [37, 101, 209], 'quality': [38, 102, 117, 210], 'wide': [40], 'annotations': [41, 103, 155], 'transposable': [43, 55, 63], 'elements.': [44, 56], 'Therefore,': [45], 'considerable': [49], 'demand': [50], 'for': [51, 68, 84, 126, 156, 217, 251, 273], 'computational': [52, 69], 'identification': [53], 'LTR': [57, 92, 107, 213, 253, 282], 'retrotransposons,': [58], 'an': [59, 199, 204, 270], 'important': [60], 'subclass': [61], 'elements,': [64], 'well': [66], 'suited': [67], 'identification,': [70], 'as': [71, 198, 266], 'contain': [73], 'long': [74], 'terminal': [75], 'repeats': [76], '(LTRs).We': [77], 'developed': [79], 'software': [81, 158, 206], 'tool': [82, 207], 'LTRharvest': [83, 98, 120, 164, 246], 'de': [86], 'novo': [87], 'detection': [88], 'full': [90], 'length': [91], 'retrotransposons': [93], 'large': [95, 175], 'sequence': [96, 114, 189], 'sets.': [97], 'efficiently': [99, 173], 'delivers': [100], 'based': [104], 'known': [106, 188], 'transposon': [108], 'features': [109, 190], 'like': [110], 'length,': [111], 'distance,': [112], 'motifs.': [115], 'A': [116], 'validation': [118], 'against': [121], 'gold': [123], 'standard': [124], 'annotation': [125, 211, 255], 'Saccharomyces': [127], 'cerevisae': [128], 'Drosophila': [130], 'melanogaster': [131], 'shows': [132], 'sensitivity': [134], 'up': [136], 'to': [137, 172, 277], '90%': [138], '97%': [140], 'specificity': [142], '100%': [144], '72%,': [146], 'respectively.': [147], 'This': [148], 'comparable': [150], 'or': [151, 179], 'slightly': [152], 'better': [153], 'than': [154], 'previous': [157, 166], 'tools.': [159], 'The': [160], 'main': [161], 'advantage': [162], 'over': [165], 'tools': [167], '(a)': [169], 'its': [170, 184, 196], 'ability': [171], 'handle': [174], 'datasets': [176], 'from': [177], 'finished': [178], 'unfinished': [180], '(b)': [183], 'flexibility': [185, 238], 'incorporating': [187, 274], 'into': [191], 'prediction,': [193], '(c)': [195], 'availability': [197, 265], 'open': [200, 267], 'source': [201, 268], 'software.LTRharvest': [202], 'efficient': [205], 'delivering': [208], 'retrotransposons.': [214, 283], 'It': [215], 'can,': [216], 'example,': [218], 'process': [219], 'largest': [221], 'human': [222], 'approx.': [225], '8': [226], 'minutes': [227], 'Linux': [230], 'PC': [231], 'with': [232], '4': [233], 'GB': [234], 'memory.': [236], 'Its': [237], 'small': [240], 'space': [241], 'run-time': [243], 'requirements': [244], 'makes': [245], 'very': [248], 'competitive': [249], 'candidate': [250], 'future': [252], 'retrotransposon': [254], 'projects.': [256], 'Moreover,': [257], 'structured': [259], 'design': [260], 'implementation': [262], 'provides': [269], 'excellent': [271], 'base': [272], 'novel': [275], 'concepts': [276], 'further': [278], 'improve': [279], 'prediction': [280]}, 'cited_by_api_url': 'https://api.openalex.org/works?filter=cites:W2054254276', 'counts_by_year': [{'year': 2024, 'cited_by_count': 186}, {'year': 2023, 'cited_by_count': 234}, {'year': 2022, 'cited_by_count': 214}, {'year': 2021, 'cited_by_count': 160}, {'year': 2020, 'cited_by_count': 128}, {'year': 2019, 'cited_by_count': 100}, {'year': 2018, 'cited_by_count': 72}, {'year': 2017, 'cited_by_count': 49}, {'year': 2016, 'cited_by_count': 35}, {'year': 2015, 'cited_by_count': 24}, {'year': 2014, 'cited_by_count': 17}, {'year': 2013, 'cited_by_count': 18}, {'year': 2012, 'cited_by_count': 23}], 'updated_date': '2024-12-21T10:59:44.852571', 'created_date': '2016-06-24'}