Get quick answers to your questions about the article from our AI researcher chatbot
{'id': 'https://openalex.org/W2112520519', 'doi': 'https://doi.org/10.1142/s0219427905001304', 'title': 'Improving Domain Dictionary-Based Text Categorization Using Self-Partition Model', 'display_name': 'Improving Domain Dictionary-Based Text Categorization Using Self-Partition Model', 'publication_year': 2005, 'publication_date': '2005-09-01', 'ids': {'openalex': 'https://openalex.org/W2112520519', 'doi': 'https://doi.org/10.1142/s0219427905001304', 'mag': '2112520519'}, 'language': 'en', 'primary_location': {'is_oa': False, 'landing_page_url': 'https://doi.org/10.1142/s0219427905001304', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S50006202', 'display_name': 'International Journal of Computer Processing Of Languages', 'issn_l': '1793-8406', 'issn': ['1793-8406', '2010-0205'], 'is_oa': False, 'is_in_doaj': False, 'is_core': True, 'host_organization': 'https://openalex.org/P4310319815', 'host_organization_name': 'World Scientific', 'host_organization_lineage': ['https://openalex.org/P4310319815'], 'host_organization_lineage_names': ['World Scientific'], 'type': 'journal'}, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}, 'type': 'article', 'type_crossref': 'journal-article', 'indexed_in': ['crossref'], 'open_access': {'is_oa': False, 'oa_status': 'closed', 'oa_url': None, 'any_repository_has_fulltext': False}, 'authorships': [{'author_position': 'first', 'author': {'id': 'https://openalex.org/A5101847965', 'display_name': 'Wenliang Chen', 'orcid': 'https://orcid.org/0000-0001-5141-325X'}, 'institutions': [], 'countries': [], 'is_corresponding': False, 'raw_author_name': 'WENLIANG CHEN', 'raw_affiliation_strings': [], 'affiliations': []}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5100370155', 'display_name': 'Jingbo Zhu', 'orcid': 'https://orcid.org/0000-0002-6537-7007'}, 'institutions': [], 'countries': [], 'is_corresponding': False, 'raw_author_name': 'JINGBO ZHU', 'raw_affiliation_strings': [], 'affiliations': []}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5101923144', 'display_name': 'Muhua Zhu', 'orcid': 'https://orcid.org/0000-0002-6519-2379'}, 'institutions': [], 'countries': [], 'is_corresponding': False, 'raw_author_name': 'MUHUA ZHU', 'raw_affiliation_strings': [], 'affiliations': []}, {'author_position': 'middle', 'author': {'id': 'https://openalex.org/A5100425448', 'display_name': 'Li Zhang', 'orcid': 'https://orcid.org/0000-0001-7914-0679'}, 'institutions': [], 'countries': [], 'is_corresponding': False, 'raw_author_name': 'LI ZHANG', 'raw_affiliation_strings': [], 'affiliations': []}, {'author_position': 'last', 'author': {'id': 'https://openalex.org/A5100885321', 'display_name': 'Tianshun Yao', 'orcid': None}, 'institutions': [], 'countries': [], 'is_corresponding': False, 'raw_author_name': 'TIANSHUN YAO', 'raw_affiliation_strings': [], 'affiliations': []}], 'institution_assertions': [], 'countries_distinct_count': 0, 'institutions_distinct_count': 0, 'corresponding_author_ids': [], 'corresponding_institution_ids': [], 'apc_list': None, 'apc_paid': None, 'fwci': 0.415, 'has_fulltext': True, 'fulltext_origin': 'ngrams', 'cited_by_count': 1, 'citation_normalized_percentile': {'value': 0.566245, 'is_in_top_1_percent': False, 'is_in_top_10_percent': False}, 'cited_by_percentile_year': {'min': 61, 'max': 68}, 'biblio': {'volume': '18', 'issue': '03', 'first_page': '197', 'last_page': '210'}, 'is_retracted': False, 'is_paratext': False, 'primary_topic': {'id': 'https://openalex.org/T11550', 'display_name': 'Text and Document Classification Technologies', 'score': 0.9996, 'subfield': {'id': 'https://openalex.org/subfields/1702', 'display_name': 'Artificial Intelligence'}, 'field': {'id': 'https://openalex.org/fields/17', 'display_name': 'Computer Science'}, 'domain': {'id': 'https://openalex.org/domains/3', 'display_name': 'Physical Sciences'}}, 'topics': [{'id': 'https://openalex.org/T11550', 'display_name': 'Text and Document Classification Technologies', 'score': 0.9996, 'subfield': {'id': 'https://openalex.org/subfields/1702', 'display_name': 'Artificial Intelligence'}, 'field': {'id': 'https://openalex.org/fields/17', 'display_name': 'Computer Science'}, 'domain': {'id': 'https://openalex.org/domains/3', 'display_name': 'Physical Sciences'}}, {'id': 'https://openalex.org/T12016', 'display_name': 'Web Data Mining and Analysis', 'score': 0.9879, 'subfield': {'id': 'https://openalex.org/subfields/1710', 'display_name': 'Information Systems'}, 'field': {'id': 'https://openalex.org/fields/17', 'display_name': 'Computer Science'}, 'domain': {'id': 'https://openalex.org/domains/3', 'display_name': 'Physical Sciences'}}, {'id': 'https://openalex.org/T10181', 'display_name': 'Natural Language Processing Techniques', 'score': 0.9658, 'subfield': {'id': 'https://openalex.org/subfields/1702', 'display_name': 'Artificial Intelligence'}, 'field': {'id': 'https://openalex.org/fields/17', 'display_name': 'Computer Science'}, 'domain': {'id': 'https://openalex.org/domains/3', 'display_name': 'Physical Sciences'}}], 'keywords': [{'id': 'https://openalex.org/keywords/text-categorization', 'display_name': 'Text Categorization', 'score': 0.5484855}], 'concepts': [{'id': 'https://openalex.org/C41008148', 'wikidata': 'https://www.wikidata.org/wiki/Q21198', 'display_name': 'Computer science', 'level': 0, 'score': 0.873212}, {'id': 'https://openalex.org/C94124525', 'wikidata': 'https://www.wikidata.org/wiki/Q912550', 'display_name': 'Categorization', 'level': 2, 'score': 0.63090324}, {'id': 'https://openalex.org/C42812', 'wikidata': 'https://www.wikidata.org/wiki/Q1082910', 'display_name': 'Partition (number theory)', 'level': 2, 'score': 0.58382034}, {'id': 'https://openalex.org/C204321447', 'wikidata': 'https://www.wikidata.org/wiki/Q30642', 'display_name': 'Natural language processing', 'level': 1, 'score': 0.55955684}, {'id': 'https://openalex.org/C2986744138', 'wikidata': 'https://www.wikidata.org/wiki/Q302088', 'display_name': 'Text categorization', 'level': 3, 'score': 0.5484855}, {'id': 'https://openalex.org/C154945302', 'wikidata': 'https://www.wikidata.org/wiki/Q11660', 'display_name': 'Artificial intelligence', 'level': 1, 'score': 0.50867254}, {'id': 'https://openalex.org/C36503486', 'wikidata': 'https://www.wikidata.org/wiki/Q11235244', 'display_name': 'Domain (mathematical analysis)', 'level': 2, 'score': 0.5012293}, {'id': 'https://openalex.org/C23123220', 'wikidata': 'https://www.wikidata.org/wiki/Q816826', 'display_name': 'Information retrieval', 'level': 1, 'score': 0.4529563}, {'id': 'https://openalex.org/C124101348', 'wikidata': 'https://www.wikidata.org/wiki/Q172491', 'display_name': 'Data mining', 'level': 1, 'score': 0.32041144}, {'id': 'https://openalex.org/C134306372', 'wikidata': 'https://www.wikidata.org/wiki/Q7754', 'display_name': 'Mathematical analysis', 'level': 1, 'score': 0.0}, {'id': 'https://openalex.org/C33923547', 'wikidata': 'https://www.wikidata.org/wiki/Q395', 'display_name': 'Mathematics', 'level': 0, 'score': 0.0}, {'id': 'https://openalex.org/C114614502', 'wikidata': 'https://www.wikidata.org/wiki/Q76592', 'display_name': 'Combinatorics', 'level': 1, 'score': 0.0}], 'mesh': [], 'locations_count': 1, 'locations': [{'is_oa': False, 'landing_page_url': 'https://doi.org/10.1142/s0219427905001304', 'pdf_url': None, 'source': {'id': 'https://openalex.org/S50006202', 'display_name': 'International Journal of Computer Processing Of Languages', 'issn_l': '1793-8406', 'issn': ['1793-8406', '2010-0205'], 'is_oa': False, 'is_in_doaj': False, 'is_core': True, 'host_organization': 'https://openalex.org/P4310319815', 'host_organization_name': 'World Scientific', 'host_organization_lineage': ['https://openalex.org/P4310319815'], 'host_organization_lineage_names': ['World Scientific'], 'type': 'journal'}, 'license': None, 'license_id': None, 'version': None, 'is_accepted': False, 'is_published': False}], 'best_oa_location': None, 'sustainable_development_goals': [{'score': 0.61, 'id': 'https://metadata.un.org/sdg/4', 'display_name': 'Quality education'}], 'grants': [], 'datasets': [], 'versions': [], 'referenced_works_count': 10, 'referenced_works': ['https://openalex.org/W1568869800', 'https://openalex.org/W1984802689', 'https://openalex.org/W2005422315', 'https://openalex.org/W2060683726', 'https://openalex.org/W2064580901', 'https://openalex.org/W2098750402', 'https://openalex.org/W2104421947', 'https://openalex.org/W2118020653', 'https://openalex.org/W2127314673', 'https://openalex.org/W2435251607'], 'related_works': ['https://openalex.org/W2390857744', 'https://openalex.org/W2390698788', 'https://openalex.org/W2383063829', 'https://openalex.org/W2360898036', 'https://openalex.org/W2138922887', 'https://openalex.org/W2133651098', 'https://openalex.org/W2125109223', 'https://openalex.org/W2082678934', 'https://openalex.org/W2078570174', 'https://openalex.org/W2035261173'], 'abstract_inverted_index': {'International': [0], 'Journal': [1, 658], 'of': [2, 5, 157, 188, 237, 259, 272, 280, 284, 302, 453, 469, 498, 505, 540, 638, 659], 'Computer': [3, 451], 'Processing': [4, 34, 54, 74, 94, 115, 452, 545, 634, 662], 'LanguagesVol.': [6], '18,': [7, 687], 'No.': [8, 688], '03,': [9], 'pp.': [10, 322, 400, 457, 509, 621], '197-210': [11], '(2005)': [12], 'No': [13], 'AccessImproving': [14], 'Domain': [15, 158, 189, 219], 'Dictionary-Based': [16], 'Text': [17, 483, 529], 'Categorization': [18], 'Using': [19, 191], 'Self-Partition': [20, 168], 'ModelWENLIANG': [21], 'CHEN,': [22], 'JINGBO': [23, 51], 'ZHU,': [24, 26], 'MUHUA': [25, 71], 'LI': [27, 91], 'ZHANG,': [28], 'and': [29, 111, 241, 261, 276, 296, 316, 348, 379, 442, 464, 493, 526, 554, 590, 601, 612, 655, 680], 'TIANSHUN': [30, 112], 'YAOWENLIANG': [31], 'CHENNatural': [32], 'Language': [33, 53, 73, 93, 114, 428, 544, 633], 'Lab,': [35, 55, 75, 95, 116], 'Northeastern': [36, 56, 76, 96, 117], 'University,': [37, 57, 77, 97, 118, 433], 'Shenyang,': [38, 58, 78, 98, 119], '110004,': [39, 59, 79, 99, 120], 'P.': [40, 60, 80, 100, 121, 556], 'R.': [41, 61, 81, 101, 122, 327, 613], 'China': [42, 62, 82, 102, 123, 260, 273, 410], 'Search': [43, 63, 83, 103, 124], 'for': [44, 64, 84, 104, 125, 153, 304, 336, 385, 472, 482, 672], 'more': [45, 65, 85, 105, 126], 'papers': [46, 66, 86, 106, 127], 'by': [47, 67, 87, 107, 128, 253], 'this': [48, 68, 88, 108, 129, 146], 'author': [49, 69, 89, 109, 130], ',': [50, 70, 90, 110, 331, 339, 353, 363, 631, 648], 'ZHUNatural': [52, 72], 'ZHANGNatural': [92], 'YAONatural': [113], 'https://doi.org/10.1142/S0219427905001304Cited': [131], 'by:1': [132], 'PreviousNext': [133], 'AboutSectionsPDF/EPUB': [134], 'ToolsAdd': [135], 'to': [136, 140, 185, 426], 'favoritesDownload': [137], 'CitationsTrack': [138], 'CitationsRecommend': [139], 'Library': [141, 411, 416], 'ShareShare': [142], 'onFacebookTwitterLinked': [143], 'InRedditEmail': [144], 'AbstractIn': [145], 'paper,': [147], 'we': [148, 197], 'present': [149], 'a': [150, 199], 'novel': [151, 200], 'model': [152, 164], 'improving': [154], 'the': [155, 174, 178, 186, 208, 218, 229, 235, 242, 254, 267, 277, 281, 506], 'performance': [156], 'Dictionary-based': [159, 220], 'text': [160, 201, 210, 212, 221, 305, 337, 386, 475, 565, 675], 'categorization.': [161], 'The': [162, 203], 'proposed': [163, 198, 209], 'is': [165, 239, 246], 'named': [166], 'as': [167, 195], 'Model': [169], '(SPM).': [170], 'SPM': [171], 'can': [172], 'group': [173], 'candidate': [175], 'words': [176, 303], 'into': [177], 'predefined': [179], 'clusters,': [180], 'which': [181], 'are': [182], 'generated': [183], 'according': [184], 'structure': [187], 'Dictionary.': [190], 'these': [192], 'learned': [193], 'clusters': [194], 'features,': [196], 'representation.': [202], 'experimental': [204], 'results': [205], 'show': [206], 'that': [207], 'representation-based': [211], 'categorization': [213, 222, 338, 387, 566], 'system': [214, 230], 'performs': [215, 226], 'better': [216, 227], 'than': [217, 228], 'system.': [223], 'It': [224], 'also': [225], 'based': [231, 447], 'on': [232, 314, 346, 448, 480, 538, 561, 572, 599], 'Bag-of-Words': [233], 'when': [234], 'number': [236], 'features': [238], 'small': [240], 'training': [243], 'corpus': [244], 'size': [245], 'small.This': [247], 'research': [248, 637], 'was': [249], 'supported': [250], 'in': [251, 307, 318, 350, 391, 477, 501, 534, 542, 564, 567, 603], 'part': [252], 'National': [255, 268], 'Natural': [256, 269, 427, 543, 632], 'Science': [257, 270], 'Foundation': [258, 271], 'Microsoft': [262], 'Asia': [263, 393], 'Research': [264, 315, 347, 600], '(No.': [265, 274, 286], '60203019),': [266], '60473140)': [275], 'Key': [278], 'Project': [279], 'Chinese': [282, 660], 'Ministry': [283], 'Education': [285], '104065).Keywords:Text': [287], 'CategorizationText': [288, 693], 'RepresentationDomain': [289, 694], 'KnowledgeWord': [290, 695], 'Clustering': [291], 'References': [292], 'L.': [293, 406, 422, 494], 'D.': [294], 'Baker': [295], 'A.': [297, 462, 608], 'K.': [298, 465], 'McCallum,': [299], 'Distributional': [300, 496], 'clustering': [301, 335, 384, 497], 'classification,': [306, 476], 'Proc.': [308, 340, 535, 568, 593], '21st': [309], 'Int.': [310, 344, 570, 597], 'ACM': [311, 343, 361, 515, 596], 'SIGIR': [312], 'Conf.': [313, 345, 571, 598], 'Development': [317, 349, 602], 'Information': [319, 351, 394, 604, 661], 'Retrieval,': [320, 605], '1998,': [321], '96–103': [323], '.': [324, 368, 402, 437, 459, 486, 511, 549, 586, 651], 'Google': [325, 369, 403, 420, 438, 460, 487, 512, 522, 550, 587, 624, 652, 665], 'Scholar': [326, 370, 404, 421, 439, 461, 488, 523, 551, 625, 666], 'Bekkerman': [328], 'et': [329, 358, 629], 'al.': [330, 359, 630], 'On': [332], 'feature': [333, 562, 670], 'distributional': [334], 'SIGIR-01,': [341], '24th': [342], 'Retrieval': [352, 395], 'eds.': [354, 606], 'W.': [355, 371], 'B.': [356], 'Croft': [357], '(': [360, 644], 'Press': [362, 647], 'New': [364, 617], 'York,': [365, 618], 'USA': [366], ')': [367, 650], 'Chen,': [372], 'X.': [373, 591], 'Chang,': [374], 'H.': [375, 578], 'Wang,': [376, 677], 'J.': [377, 555], 'Zhu': [378, 654, 679], 'T.': [380, 626, 656], 'Yao,': [381, 657], 'Automatic': [382], 'word': [383], 'using': [388, 531], 'global': [389], 'information,': [390], 'First': [392], 'Symposium': [396], '(AIRS': [397], '2004),': [398], '2004,': [399], '1–6': [401], 'C.': [405, 407], 'E.': [408], 'Board,': [409], 'Categorization,': [412, 484], '4th': [413], 'edn.': [414], '(Beijing': [415], 'Press,': [417, 616], 'Beijing,': [418], '1999).': [419], 'Lee,': [423, 495], 'Similarity-Based': [424], 'Approaches': [425], 'Processing,': [429], 'Ph.D.': [430], 'thesis,': [431], 'Harvard': [432], 'Cambridge,': [434], 'MA,': [435], '1997': [436, 585], 'S.': [440, 627], 'Lee': [441], 'M.': [443, 607], 'Shishibori,': [444], 'Passage': [445], 'segmentation': [446], 'topic': [449], 'matter,': [450], 'Oriental': [454], 'Languages': [455], '15(3),': [456], '305–340': [458], 'McCallum': [463], 'Nigam,': [466], 'A': [467, 558, 636], 'comparison': [468], 'event': [470], 'models': [471], 'naïve': [473], 'Bayes': [474, 674], 'AAAI–98': [478], 'Workshop': [479, 537], 'Learning': [481, 574], '1998': [485, 548], 'F.': [489, 610], 'Pereira,': [490], 'N.': [491], 'Tishby': [492], 'English': [499], 'words,': [500], '30th': [502], 'Annual': [503], 'Meeting': [504], 'ACL,': [507], '1993,': [508], '183–190': [510], 'ScholarF.': [513], 'Sebastiani,': [514], 'Computing': [516], 'Surveys': [517], '34,': [518], '1': [519], '(2002).': [520, 664], 'Crossref,': [521, 623], 'Scott,': [524], 'Sam': [525], 'Stan': [527], 'Matwin,': [528], 'classification': [530], 'WordNet': [532, 541], 'hypernyms,': [533], 'COLING/ACL': [536], 'Usage': [539], 'Systems,': [546], 'Montreal,': [547], 'Y.': [552], 'Yang': [553, 589], 'Pedersen,': [557], 'comparative': [559], 'study': [560], 'selection': [563, 671], '14th': [569], 'Machine': [573], "(ICML'97),": [575], 'Jr.': [576], 'Doughals': [577], 'Fisher': [579], '(ed.),': [580], 'Nashville,': [581], 'TN,': [582], 'July': [583], '8–12,': [584], 'ScholarY.': [588], 'Liu,': [592], 'SIGIR-99,': [594], '22nd': [595], 'Hearst,': [609], 'Gey': [611], 'Tong': [614], '(ACM': [615], 'USA,': [619], '1999)': [620], '42–49.': [622], 'Yao': [628], '—': [635], 'making': [639], 'computers': [640], 'understand': [641], 'human': [642], 'languages': [643], 'Tsinghua': [645], 'University': [646], '2002': [649], 'ScholarJ.': [653], '16(3),': [663], 'FiguresReferencesRelatedDetailsCited': [667], 'By': [668], '1Divergence-based': [669], 'naïve': [673], 'classificationHuizhen': [676], 'Jingbo': [678], 'Keh-Yih': [681], 'Su1': [682], 'Oct': [683], '2008': [684], 'Recommended': [685], 'Vol.': [686], '03': [689], 'Metrics': [690], 'History': [691], 'KeywordsText': [692], 'ClusteringPDF': [696], 'download': [697]}, 'cited_by_api_url': 'https://api.openalex.org/works?filter=cites:W2112520519', 'counts_by_year': [], 'updated_date': '2024-12-13T20:44:00.694774', 'created_date': '2016-06-24'}