Get quick answers to your questions about the article from our AI researcher chatbot
{'id': 'https://openalex.org/W2070071798', 'doi': 'https://doi.org/10.1142/9781848161092_0020', 'title': 'CLASSIFICATION OF PROTEIN SEQUENCES BASED ON WORD SEGMENTATION METHODS', 'display_name': 'CLASSIFICATION OF PROTEIN SEQUENCES BASED ON WORD SEGMENTATION METHODS', 'publication_year': 2007, 'publication_date': '2007-12-01', 'ids': {'openalex': 'https://openalex.org/W2070071798', 'doi': 'https://doi.org/10.1142/9781848161092_0020', 'mag': '2070071798'}, 'language': 'en', 'primary_location': {'is_oa': False, 'landing_page_url': 'https://doi.org/10.1142/9781848161092_0020', 'pdf_url': None, 'source': None, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}, 'type': 'article', 'type_crossref': 'proceedings-article', 'indexed_in': ['crossref'], 'open_access': {'is_oa': True, 'oa_status': 'green', 'oa_url': 'http://www.comp.nus.edu.sg/~wongls/psZ/apbc2008/apbc065a.pdf', 'any_repository_has_fulltext': True}, 'authorships': [{'author_position': 'first', 'author': {'id': 'https://openalex.org/A5100397381', 'display_name': 'Yang Yang', 'orcid': 'https://orcid.org/0000-0001-5720-773X'}, 'institutions': [{'id': 'https://openalex.org/I183067930', 'display_name': 'Shanghai Jiao Tong University', 'ror': 'https://ror.org/0220qvk04', 'country_code': 'CN', 'type': 'education', 'lineage': ['https://openalex.org/I183067930']}], 'countries': ['CN'], 'is_corresponding': False, 'raw_author_name': 'YANG YANG', 'raw_affiliation_strings': ['Department of Computer Science and Engineering, Shanghai Jiao Tong University, 800 Dong Chuan Road, Shanghai 200240, China'], 'affiliations': [{'raw_affiliation_string': 'Department of Computer Science and Engineering, Shanghai Jiao Tong University, 800 Dong Chuan Road, Shanghai 200240, China', 'institution_ids': ['https://openalex.org/I183067930']}]}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5040440605', 'display_name': 'Bao‐Liang Lu', 'orcid': 'https://orcid.org/0000-0001-8359-0058'}, 'institutions': [{'id': 'https://openalex.org/I183067930', 'display_name': 'Shanghai Jiao Tong University', 'ror': 'https://ror.org/0220qvk04', 'country_code': 'CN', 'type': 'education', 'lineage': ['https://openalex.org/I183067930']}], 'countries': ['CN'], 'is_corresponding': False, 'raw_author_name': 'BAO-LIANG LU', 'raw_affiliation_strings': ['Department of Computer Science and Engineering, Shanghai Jiao Tong University, 800 Dong Chuan Road, Shanghai 200240, China; Laboratory for Computational Biology, Shanghai Center for Systems Biomedicine, 800 Dong Chuan Road, Shanghai 200240, China', 'Laboratory for Computational Biology, Shanghai Center for Systems Biomedicine, 800 Dong Chuan Road, Shanghai 200240, China'], 'affiliations': [{'raw_affiliation_string': 'Department of Computer Science and Engineering, Shanghai Jiao Tong University, 800 Dong Chuan Road, Shanghai 200240, China; Laboratory for Computational Biology, Shanghai Center for Systems Biomedicine, 800 Dong Chuan Road, Shanghai 200240, China', 'institution_ids': ['https://openalex.org/I183067930']}, {'raw_affiliation_string': 'Laboratory for Computational Biology, Shanghai Center for Systems Biomedicine, 800 Dong Chuan Road, Shanghai 200240, China', 'institution_ids': []}]}, {'author_position': 'last', 'author': {'id': 'https://openalex.org/A5010877916', 'display_name': 'Wen-Yun Yang', 'orcid': 'https://orcid.org/0009-0006-4551-7996'}, 'institutions': [{'id': 'https://openalex.org/I183067930', 'display_name': 'Shanghai Jiao Tong University', 'ror': 'https://ror.org/0220qvk04', 'country_code': 'CN', 'type': 'education', 'lineage': ['https://openalex.org/I183067930']}], 'countries': ['CN'], 'is_corresponding': False, 'raw_author_name': 'WEN-YUN YANG', 'raw_affiliation_strings': ['Department of Computer Science and Engineering, Shanghai Jiao Tong University, 800 Dong Chuan Road, Shanghai 200240, China'], 'affiliations': [{'raw_affiliation_string': 'Department of Computer Science and Engineering, Shanghai Jiao Tong University, 800 Dong Chuan Road, Shanghai 200240, China', 'institution_ids': ['https://openalex.org/I183067930']}]}], 'institution_assertions': [], 'countries_distinct_count': 1, 'institutions_distinct_count': 1, 'corresponding_author_ids': [], 'corresponding_institution_ids': [], 'apc_list': None, 'apc_paid': None, 'fwci': 0.0, 'has_fulltext': False, 'cited_by_count': 14, 'citation_normalized_percentile': {'value': 0.887779, 'is_in_top_1_percent': False, 'is_in_top_10_percent': False}, 'cited_by_percentile_year': {'min': 85, 'max': 86}, 'biblio': {'volume': None, 'issue': None, 'first_page': '177', 'last_page': '186'}, 'is_retracted': False, 'is_paratext': False, 'primary_topic': {'id': 'https://openalex.org/T12254', 'display_name': 'Machine Learning in Bioinformatics', 'score': 0.9998, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, 'topics': [{'id': 'https://openalex.org/T12254', 'display_name': 'Machine Learning in Bioinformatics', 'score': 0.9998, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, {'id': 'https://openalex.org/T10015', 'display_name': 'Genomics and Phylogenetic Studies', 'score': 0.9983, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}, {'id': 'https://openalex.org/T10521', 'display_name': 'RNA and protein synthesis mechanisms', 'score': 0.9967, 'subfield': {'id': 'https://openalex.org/subfields/1312', 'display_name': 'Molecular Biology'}, 'field': {'id': 'https://openalex.org/fields/13', 'display_name': 'Biochemistry, Genetics and Molecular Biology'}, 'domain': {'id': 'https://openalex.org/domains/1', 'display_name': 'Life Sciences'}}], 'keywords': [{'id': 'https://openalex.org/keywords/substring', 'display_name': 'Substring', 'score': 0.6022855}, {'id': 'https://openalex.org/keywords/text-segmentation', 'display_name': 'Text segmentation', 'score': 0.49948716}], 'concepts': [{'id': 'https://openalex.org/C182407805', 'wikidata': 'https://www.wikidata.org/wiki/Q2626534', 'display_name': 'Substring', 'level': 3, 'score': 0.6022855}, {'id': 'https://openalex.org/C89600930', 'wikidata': 'https://www.wikidata.org/wiki/Q1423946', 'display_name': 'Segmentation', 'level': 2, 'score': 0.56951106}, {'id': 'https://openalex.org/C98501671', 'wikidata': 'https://www.wikidata.org/wiki/Q1948408', 'display_name': 'Text segmentation', 'level': 3, 'score': 0.49948716}, {'id': 'https://openalex.org/C191935318', 'wikidata': 'https://www.wikidata.org/wiki/Q148', 'display_name': 'China', 'level': 2, 'score': 0.47544193}, {'id': 'https://openalex.org/C154945302', 'wikidata': 'https://www.wikidata.org/wiki/Q11660', 'display_name': 'Artificial intelligence', 'level': 1, 'score': 0.46825466}, {'id': 'https://openalex.org/C41008148', 'wikidata': 'https://www.wikidata.org/wiki/Q21198', 'display_name': 'Computer science', 'level': 0, 'score': 0.45156008}, {'id': 'https://openalex.org/C204321447', 'wikidata': 'https://www.wikidata.org/wiki/Q30642', 'display_name': 'Natural language processing', 'level': 1, 'score': 0.36469713}, {'id': 'https://openalex.org/C161191863', 'wikidata': 'https://www.wikidata.org/wiki/Q199655', 'display_name': 'Library science', 'level': 1, 'score': 0.33623976}, {'id': 'https://openalex.org/C205649164', 'wikidata': 'https://www.wikidata.org/wiki/Q1071', 'display_name': 'Geography', 'level': 0, 'score': 0.23750183}, {'id': 'https://openalex.org/C162319229', 'wikidata': 'https://www.wikidata.org/wiki/Q175263', 'display_name': 'Data structure', 'level': 2, 'score': 0.12882376}, {'id': 'https://openalex.org/C166957645', 'wikidata': 'https://www.wikidata.org/wiki/Q23498', 'display_name': 'Archaeology', 'level': 1, 'score': 0.09918797}, {'id': 'https://openalex.org/C199360897', 'wikidata': 'https://www.wikidata.org/wiki/Q9143', 'display_name': 'Programming language', 'level': 1, 'score': 0.0}], 'mesh': [], 'locations_count': 2, 'locations': [{'is_oa': False, 'landing_page_url': 'https://doi.org/10.1142/9781848161092_0020', 'pdf_url': None, 'source': None, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}, {'is_oa': True, 'landing_page_url': 'http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.143.8460', 'pdf_url': 'http://www.comp.nus.edu.sg/~wongls/psZ/apbc2008/apbc065a.pdf', 'source': {'id': 'https://openalex.org/S4306400349', 'display_name': 'CiteSeer X (The Pennsylvania State University)', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I130769515', 'host_organization_name': 'Pennsylvania State University', 'host_organization_lineage': ['https://openalex.org/I130769515'], 'host_organization_lineage_names': ['Pennsylvania State University'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': 'submittedVersion', 'is_accepted': False, 'is_published': False}], 'best_oa_location': {'is_oa': True, 'landing_page_url': 'http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.143.8460', 'pdf_url': 'http://www.comp.nus.edu.sg/~wongls/psZ/apbc2008/apbc065a.pdf', 'source': {'id': 'https://openalex.org/S4306400349', 'display_name': 'CiteSeer X (The Pennsylvania State University)', 'issn_l': None, 'issn': None, 'is_oa': True, 'is_in_doaj': False, 'is_core': False, 'host_organization': 'https://openalex.org/I130769515', 'host_organization_name': 'Pennsylvania State University', 'host_organization_lineage': ['https://openalex.org/I130769515'], 'host_organization_lineage_names': ['Pennsylvania State University'], 'type': 'repository'}, 'license': None, 'license_id': None, 'version': 'submittedVersion', 'is_accepted': False, 'is_published': False}, 'sustainable_development_goals': [], 'grants': [], 'datasets': [], 'versions': [], 'referenced_works_count': 11, 'referenced_works': ['https://openalex.org/W1982481323', 'https://openalex.org/W1991022130', 'https://openalex.org/W1991256448', 'https://openalex.org/W2020816856', 'https://openalex.org/W2106575335', 'https://openalex.org/W2107427637', 'https://openalex.org/W2107725114', 'https://openalex.org/W2150666695', 'https://openalex.org/W2153635508', 'https://openalex.org/W2156455118', 'https://openalex.org/W2283504545'], 'related_works': ['https://openalex.org/W2978383222', 'https://openalex.org/W2785359773', 'https://openalex.org/W2384559435', 'https://openalex.org/W2380773642', 'https://openalex.org/W2337707338', 'https://openalex.org/W2251446894', 'https://openalex.org/W2172629291', 'https://openalex.org/W2101674824', 'https://openalex.org/W2058548953', 'https://openalex.org/W1597333669'], 'abstract_inverted_index': {'Series': [0], 'on': [1, 157, 245, 293], 'Advances': [2], 'in': [3, 167, 224, 264, 278, 398], 'Bioinformatics': [4, 12, 458], 'and': [5, 30, 37, 55, 101, 107, 144, 182, 197, 220, 231, 257, 312, 319, 346, 364, 374, 391, 400, 415, 425, 448], 'Computational': [6, 69], 'BiologyProceedings': [7], 'of': [8, 34, 52, 94, 104, 164, 174, 191, 217, 254, 266, 326, 331, 352, 409, 440, 454], 'the': [9, 89, 97, 168, 189, 218, 238, 258, 272, 290, 304, 438, 455], '6th': [10, 456], 'Asia-Pacific': [11, 457], 'Conference,': [13], 'pp.': [14], '177-186': [15], '(2007)': [16], 'No': [17], 'AccessCLASSIFICATION': [18], 'OF': [19], 'PROTEIN': [20], 'SEQUENCES': [21], 'BASED': [22], 'ON': [23], 'WORD': [24], 'SEGMENTATION': [25], 'METHODSYANG': [26], 'YANG,': [27], 'BAO-LIANG': [28, 50], 'LU,': [29], 'WEN-YUN': [31, 102], 'YANGYANG': [32], 'YANGDepartment': [33, 103], 'Computer': [35, 53, 105], 'Science': [36, 54, 92, 106], 'Engineering,': [38, 56, 108], 'Shanghai': [39, 47, 57, 65, 71, 80, 109, 117], 'Jiao': [40, 58, 110], 'Tong': [41, 59, 111], 'University,': [42, 60, 112], '800': [43, 61, 76, 113], 'Dong': [44, 62, 77, 114], 'Chuan': [45, 63, 78, 115], 'Road,': [46, 64, 79, 116], '200240,': [48, 66, 81, 118], 'China,': [49], 'LUDepartment': [51], 'ChinaLaboratory': [67], 'for': [68, 73, 308, 383, 406, 437], 'Biology,': [70], 'Center': [72], 'Systems': [74], 'Biomedicine,': [75], 'ChinaCorresponding': [82], 'author.This': [83], 'work': [84], 'was': [85], 'partially': [86], 'supported': [87], 'by': [88, 194, 329], 'National': [90], 'Natural': [91], 'Foundation': [93], 'China': [95], 'via': [96], 'grant': [98], 'NSFC': [99], '60473040.,': [100], 'Chinahttps://doi.org/10.1142/9781848161092_0020Cited': [119], 'by:5': [120], 'PreviousNext': [121], 'AboutSectionsPDF/EPUB': [122], 'ToolsAdd': [123], 'to': [124, 128, 180, 303], 'favoritesDownload': [125], 'CitationsTrack': [126], 'CitationsRecommend': [127], 'Library': [129], 'ShareShare': [130], 'onFacebookTwitterLinked': [131], 'InRedditEmail': [132], 'Abstract:': [133], 'Protein': [134, 327], 'sequences': [135, 149, 355], 'contain': [136], 'great': [137], 'potential': [138], 'revealing': [139], 'protein': [140, 148, 184, 247, 268, 353, 385, 410], 'function,': [141], 'structure': [142], 'families': [143, 155, 269], 'evolution': [145], 'information.': [146], 'Classifying': [147], 'into': [150], 'different': [151], 'functional': [152], 'groups': [153], 'or': [154], 'based': [156, 292], 'their': [158, 232], 'sequence': [159, 386], 'patterns': [160], 'has': [161], 'attracted': [162], 'lots': [163], 'research': [165], 'efforts': [166], 'last': [169], 'decade.': [170], 'A': [171], 'key': [172], 'issue': [173], 'these': [175], 'classification': [176, 196, 265], 'systems': [177], 'is': [178, 251, 260], 'how': [179], 'interpret': [181], 'represent': [183], 'sequences,': [185, 219], 'which': [186], 'largely': [187], 'determines': [188], 'performance': [190], 'classifiers.': [192], 'Inspired': [193], 'text': [195], 'Chinese': [198], 'word': [199], 'segmentation': [200], 'techniques,': [201], 'we': [202], 'propose': [203], 'a': [204, 252, 434], 'segmentation-based': [205], 'feature': [206, 239, 282, 296], 'extraction': [207], 'method.': [208], 'The': [209], 'extracted': [210], 'features': [211], 'include': [212], 'selected': [213], 'words,': [214], 'i.e.,': [215], 'substrings': [216], 'also': [221, 285, 300], 'motifs': [222], 'specified': [223], 'public': [225], 'database.': [226], 'They': [227], 'are': [228, 235], 'segmented': [229], 'out': [230], 'occurrence': [233], 'frequencies': [234], 'recorded': [236], 'as': [237], 'vector': [240], 'values.': [241], 'We': [242], 'conducted': [243], 'experiments': [244], 'two': [246], 'data': [248, 387], 'sets.': [249], 'One': [250], 'set': [253, 283], 'SCOP': [255, 267], 'families,': [256], 'other': [259], 'GPCR': [261, 309], 'family.': [262], 'Experiments': [263], 'show': [270], 'that': [271], 'proposed': [273], 'method': [274, 405], 'not': [275], 'only': [276], 'results': [277], 'an': [279, 332, 336], 'extremely': [280], 'condensed': [281], 'but': [284], 'achieves': [286], 'higher': [287], 'accuracy': [288], 'than': [289], 'methods': [291], 'whole': [294], 'k-spectrum': [295], 'space.': [297], 'And': [298], 'it': [299], 'performs': [301], 'comparably': [302], 'most': [305], 'powerful': [306], 'classifiers': [307], 'level': [310, 313], 'I': [311], 'II': [314], 'subfamily': [315], 'recognition': [316], 'with': [317, 335, 356], '92.6': [318], '88.8%': [320], 'accuracy,': [321], 'respectively.': [322], 'FiguresReferencesRelatedDetailsCited': [323], 'By': [324], '5Classification': [325], 'Sequences': [328], 'Means': [330], 'Ensemble': [333], 'Classifier': [334], 'Improved': [337], 'Feature': [338], 'Selection': [339], 'StrategyAditya': [340], 'Sriram,': [341], 'Mounica': [342], 'Sanapala,': [343], 'Ronak': [344], 'Patel': [345], 'Nagamma': [347], 'Patil5': [348], 'November': [349], '2018Comparative': [350], 'analysis': [351, 408], 'primary': [354], 'graph': [357], 'energyHaiyan': [358], 'Wu,': [359], 'Yusen': [360, 416], 'Zhang,': [361], 'Wei': [362], 'Chen': [363], 'Zengchao': [365], 'Mu1': [366], 'Nov': [367], '2015': [368], '|': [369, 396, 420], 'Physica': [370, 421], 'A:': [371, 422], 'Statistical': [372, 423], 'Mechanics': [373, 424], 'its': [375, 426], 'Applications,': [376, 427], 'Vol.': [377, 402, 428], '437A': [378], 'fast': [379], 'hierarchical': [380], 'clustering': [381], 'algorithm': [382], 'large-scale': [384], 'setsSándor': [388], 'M.': [389], 'Szilágyi': [390], 'László': [392], 'Szilágyi1': [393], 'May': [394], '2014': [395], 'Computers': [397], 'Biology': [399], 'Medicine,': [401], '48A': [403], 'novel': [404], 'similarity/dissimilarity': [407], 'sequencesZengchao': [411], 'Mu,': [412], 'Jing': [413], 'Wu': [414], 'Zhang1': [417], 'Dec': [418], '2013': [419], '392,': [429], 'No.': [430], '24Feature': [431], 'Reduction': [432], 'Using': [433], 'Topic': [435], 'Model': [436], 'Prediction': [439], 'Type': [441], 'III': [442], 'Secreted': [443], 'EffectorsSihui': [444], 'Qi,': [445], 'Yang': [446, 447], 'Anjun': [449], 'Song1': [450], 'Jan': [451], '2011': [452], 'Proceedings': [453], 'ConferenceMetrics': [459], 'History': [460], 'PDF': [461], 'download': [462]}, 'cited_by_api_url': 'https://api.openalex.org/works?filter=cites:W2070071798', 'counts_by_year': [{'year': 2024, 'cited_by_count': 1}, {'year': 2021, 'cited_by_count': 2}, {'year': 2018, 'cited_by_count': 2}, {'year': 2017, 'cited_by_count': 1}, {'year': 2016, 'cited_by_count': 1}, {'year': 2015, 'cited_by_count': 1}, {'year': 2014, 'cited_by_count': 3}, {'year': 2013, 'cited_by_count': 2}], 'updated_date': '2024-12-23T11:20:28.175328', 'created_date': '2016-06-24'}