{"id":"https://openalex.org/W2883127447","doi":"https://doi.org/10.1016/j.bdr.2018.05.007","title":"Lossless Pruned Naive Bayes for Big Data Classifications","display_name":"Lossless Pruned Naive Bayes for Big Data Classifications","publication_year":2018,"publication_date":"2018-07-17","ids":{"openalex":"https://openalex.org/W2883127447","doi":"https://doi.org/10.1016/j.bdr.2018.05.007","mag":"2883127447"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1016/j.bdr.2018.05.007","pdf_url":null,"source":{"id":"https://openalex.org/S2491565770","display_name":"Big Data Research","issn_l":"2214-5796","issn":["2214-5796","2214-580X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027285085","display_name":"Nanfei Sun","orcid":"https://orcid.org/0000-0002-4010-1514"},"institutions":[{"id":"https://openalex.org/I52913039","display_name":"University of Houston - Clear Lake","ror":"https://ror.org/01t817z14","country_code":"US","type":"education","lineage":["https://openalex.org/I52913039"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nanfei Sun","raw_affiliation_strings":["Management Information Systems, University of Houston - Clear Lake, 2700 Bay Area Blvd., Houston, TX 77058, United States"],"affiliations":[{"raw_affiliation_string":"Management Information Systems, University of Houston - Clear Lake, 2700 Bay Area Blvd., Houston, TX 77058, United States","institution_ids":["https://openalex.org/I52913039"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036757754","display_name":"Bingjun Sun","orcid":"https://orcid.org/0000-0002-6036-3730"},"institutions":[{"id":"https://openalex.org/I113979032","display_name":"Twitter (United States)","ror":"https://ror.org/04wt43v05","country_code":"US","type":"company","lineage":["https://openalex.org/I113979032"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bingjun Sun","raw_affiliation_strings":["Twitter, 1355 Market Street, Suite 900, San Francisco, CA 94103, United States"],"affiliations":[{"raw_affiliation_string":"Twitter, 1355 Market Street, Suite 900, San Francisco, CA 94103, United States","institution_ids":["https://openalex.org/I113979032"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102026686","display_name":"Jian Lin","orcid":"https://orcid.org/0000-0002-7102-7978"},"institutions":[{"id":"https://openalex.org/I52913039","display_name":"University of Houston - Clear Lake","ror":"https://ror.org/01t817z14","country_code":"US","type":"education","lineage":["https://openalex.org/I52913039"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jian (Denny) Lin","raw_affiliation_strings":["Management Information Systems, University of Houston - Clear Lake, 2700 Bay Area Blvd., Houston, TX 77058, United States"],"affiliations":[{"raw_affiliation_string":"Management Information Systems, University of Houston - Clear Lake, 2700 Bay Area Blvd., Houston, TX 77058, United States","institution_ids":["https://openalex.org/I52913039"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034615694","display_name":"Michael Wu","orcid":"https://orcid.org/0009-0000-4659-2548"},"institutions":[{"id":"https://openalex.org/I52913039","display_name":"University of Houston - Clear Lake","ror":"https://ror.org/01t817z14","country_code":"US","type":"education","lineage":["https://openalex.org/I52913039"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Yu-Chi Wu","raw_affiliation_strings":["Management Information Systems, University of Houston - Clear Lake, 2700 Bay Area Blvd., Houston, TX 77058, United States"],"affiliations":[{"raw_affiliation_string":"Management Information Systems, University of Houston - Clear Lake, 2700 Bay Area Blvd., Houston, TX 77058, United States","institution_ids":["https://openalex.org/I52913039"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5102026686"],"corresponding_institution_ids":["https://openalex.org/I52913039"],"apc_list":{"value":2500,"currency":"USD","value_usd":2500,"provenance":"doaj"},"apc_paid":null,"fwci":2.126,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":24,"citation_normalized_percentile":{"value":0.847305,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":92,"max":93},"biblio":{"volume":"14","issue":null,"first_page":"27","last_page":"36"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Multi-label Text Classification in Machine Learning","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Multi-label Text Classification in Machine Learning","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Extraction and Crawling Techniques","score":0.997,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Text Compression and Indexing Algorithms","score":0.991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lossy-compression","display_name":"Lossy compression","score":0.6115603},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.5784017},{"id":"https://openalex.org/keywords/machine-learning-algorithms","display_name":"Machine Learning Algorithms","score":0.541454},{"id":"https://openalex.org/keywords/multi-label-learning","display_name":"Multi-label Learning","score":0.536207},{"id":"https://openalex.org/keywords/web-data-extraction","display_name":"Web Data Extraction","score":0.530364},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information Retrieval","score":0.528483},{"id":"https://openalex.org/keywords/text-indexing","display_name":"Text Indexing","score":0.527661}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.81293976},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.7793671},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.6987721},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.696034},{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.6115603},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.5784017},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5259792},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.52161753},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46192047},{"id":"https://openalex.org/C140745168","wikidata":"https://www.wikidata.org/wiki/Q1210082","display_name":"Tree traversal","level":2,"score":0.44910455},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.24636349},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.17124179},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.14045113},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1016/j.bdr.2018.05.007","pdf_url":null,"source":{"id":"https://openalex.org/S2491565770","display_name":"Big Data Research","issn_l":"2214-5796","issn":["2214-5796","2214-580X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":18,"referenced_works":["https://openalex.org/W1550206324","https://openalex.org/W1620204465","https://openalex.org/W1973520416","https://openalex.org/W2010581776","https://openalex.org/W2014566476","https://openalex.org/W2025047573","https://openalex.org/W2029296527","https://openalex.org/W2036553810","https://openalex.org/W2063862666","https://openalex.org/W2065472179","https://openalex.org/W2066667100","https://openalex.org/W2071423279","https://openalex.org/W2073830447","https://openalex.org/W2105573333","https://openalex.org/W2107008379","https://openalex.org/W2108079923","https://openalex.org/W2143774383","https://openalex.org/W2154610494"],"related_works":["https://openalex.org/W4205915047","https://openalex.org/W3180760233","https://openalex.org/W2978432024","https://openalex.org/W2276828234","https://openalex.org/W2148203918","https://openalex.org/W2132019419","https://openalex.org/W2118338613","https://openalex.org/W2071387875","https://openalex.org/W1995805316","https://openalex.org/W1568381040"],"abstract_inverted_index":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2883127447","counts_by_year":[{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":3}],"updated_date":"2024-11-20T22:18:46.851840","created_date":"2018-08-03"}