{"id":"https://openalex.org/W2001459151","doi":"https://doi.org/10.1021/ci4006595","title":"Assessment of Machine Learning Reliability Methods for Quantifying the Applicability Domain of QSAR Regression Models","display_name":"Assessment of Machine Learning Reliability Methods for Quantifying the Applicability Domain of QSAR Regression Models","publication_year":2014,"publication_date":"2014-02-03","ids":{"openalex":"https://openalex.org/W2001459151","doi":"https://doi.org/10.1021/ci4006595","mag":"2001459151","pmid":"https://pubmed.ncbi.nlm.nih.gov/24490838"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci4006595","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080831166","display_name":"Marko Toplak","orcid":"https://orcid.org/0000-0003-4413-1603"},"institutions":[{"id":"https://openalex.org/I153976015","display_name":"University of Ljubljana","ror":"https://ror.org/05njb9z20","country_code":"SI","type":"education","lineage":["https://openalex.org/I153976015"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Marko Toplak","raw_affiliation_strings":["Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia","institution_ids":["https://openalex.org/I153976015"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086624431","display_name":"Rok Mo\u010dnik","orcid":null},"institutions":[{"id":"https://openalex.org/I153976015","display_name":"University of Ljubljana","ror":"https://ror.org/05njb9z20","country_code":"SI","type":"education","lineage":["https://openalex.org/I153976015"]},{"id":"https://openalex.org/I204778367","display_name":"Norwegian University of Science and Technology","ror":"https://ror.org/05xg72x27","country_code":"NO","type":"education","lineage":["https://openalex.org/I204778367"]}],"countries":["NO","SI"],"is_corresponding":false,"raw_author_name":"Rok Mo\u010dnik","raw_affiliation_strings":["Department\rof Cancer Research and Molecular Medicine, Norwegian University of Science and Technology, Olav Kyrres gate 9, 7489 Trondheim, Norway","Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia","institution_ids":["https://openalex.org/I153976015"]},{"raw_affiliation_string":"Department\rof Cancer Research and Molecular Medicine, Norwegian University of Science and Technology, Olav Kyrres gate 9, 7489 Trondheim, Norway","institution_ids":["https://openalex.org/I204778367"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076143672","display_name":"Matija Polajnar","orcid":null},"institutions":[{"id":"https://openalex.org/I153976015","display_name":"University of Ljubljana","ror":"https://ror.org/05njb9z20","country_code":"SI","type":"education","lineage":["https://openalex.org/I153976015"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Matija Polajnar","raw_affiliation_strings":["Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia","institution_ids":["https://openalex.org/I153976015"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045389796","display_name":"Zoran Bosni\u0107","orcid":"https://orcid.org/0000-0003-0501-7146"},"institutions":[{"id":"https://openalex.org/I153976015","display_name":"University of Ljubljana","ror":"https://ror.org/05njb9z20","country_code":"SI","type":"education","lineage":["https://openalex.org/I153976015"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Zoran Bosni\u0107","raw_affiliation_strings":["Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia","institution_ids":["https://openalex.org/I153976015"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072219201","display_name":"Lars Carlsson","orcid":"https://orcid.org/0000-0001-9491-4134"},"institutions":[{"id":"https://openalex.org/I4210143795","display_name":"AstraZeneca (Sweden)","ror":"https://ror.org/04wwrrg31","country_code":"SE","type":"company","lineage":["https://openalex.org/I105036370","https://openalex.org/I4210143795"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Lars Carlsson","raw_affiliation_strings":["Computational Toxicology, Global Safety Assessment, AstraZeneca R&D, Pepparedsleden 1, 43183 M\u00f6lndal, Sweden"],"affiliations":[{"raw_affiliation_string":"Computational Toxicology, Global Safety Assessment, AstraZeneca R&D, Pepparedsleden 1, 43183 M\u00f6lndal, Sweden","institution_ids":["https://openalex.org/I4210143795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031085910","display_name":"Catrin Hasselgren","orcid":null},"institutions":[{"id":"https://openalex.org/I4210143795","display_name":"AstraZeneca (Sweden)","ror":"https://ror.org/04wwrrg31","country_code":"SE","type":"company","lineage":["https://openalex.org/I105036370","https://openalex.org/I4210143795"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Catrin Hasselgren","raw_affiliation_strings":["Computational Toxicology, Global Safety Assessment, AstraZeneca R&D, Pepparedsleden 1, 43183 M\u00f6lndal, Sweden"],"affiliations":[{"raw_affiliation_string":"Computational Toxicology, Global Safety Assessment, AstraZeneca R&D, Pepparedsleden 1, 43183 M\u00f6lndal, Sweden","institution_ids":["https://openalex.org/I4210143795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024075429","display_name":"Janez Dem\u0161ar","orcid":"https://orcid.org/0000-0002-1256-1687"},"institutions":[{"id":"https://openalex.org/I153976015","display_name":"University of Ljubljana","ror":"https://ror.org/05njb9z20","country_code":"SI","type":"education","lineage":["https://openalex.org/I153976015"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Janez Dem\u0161ar","raw_affiliation_strings":["Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia","institution_ids":["https://openalex.org/I153976015"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030997667","display_name":"Scott Boyer","orcid":null},"institutions":[{"id":"https://openalex.org/I4210143795","display_name":"AstraZeneca (Sweden)","ror":"https://ror.org/04wwrrg31","country_code":"SE","type":"company","lineage":["https://openalex.org/I105036370","https://openalex.org/I4210143795"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Scott Boyer","raw_affiliation_strings":["Computational Toxicology, Global Safety Assessment, AstraZeneca R&D, Pepparedsleden 1, 43183 M\u00f6lndal, Sweden"],"affiliations":[{"raw_affiliation_string":"Computational Toxicology, Global Safety Assessment, AstraZeneca R&D, Pepparedsleden 1, 43183 M\u00f6lndal, Sweden","institution_ids":["https://openalex.org/I4210143795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073792028","display_name":"Bla\u017e Zupan","orcid":"https://orcid.org/0000-0002-5864-7056"},"institutions":[{"id":"https://openalex.org/I153976015","display_name":"University of Ljubljana","ror":"https://ror.org/05njb9z20","country_code":"SI","type":"education","lineage":["https://openalex.org/I153976015"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Bla\u017e Zupan","raw_affiliation_strings":["Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Faculty\rof Computer and Information Science, University of Ljubljana, Tr\u017ea\u0161ka\r25, 1000 Ljubljana, Slovenia","institution_ids":["https://openalex.org/I153976015"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063376974","display_name":"Jonna St\u00e5lring","orcid":null},"institutions":[{"id":"https://openalex.org/I4210143795","display_name":"AstraZeneca (Sweden)","ror":"https://ror.org/04wwrrg31","country_code":"SE","type":"company","lineage":["https://openalex.org/I105036370","https://openalex.org/I4210143795"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Jonna St\u00e5lring","raw_affiliation_strings":["Computational Toxicology, Global Safety Assessment, AstraZeneca R&D, Pepparedsleden 1, 43183 M\u00f6lndal, Sweden"],"affiliations":[{"raw_affiliation_string":"Computational Toxicology, Global Safety Assessment, AstraZeneca R&D, Pepparedsleden 1, 43183 M\u00f6lndal, Sweden","institution_ids":["https://openalex.org/I4210143795"]}]}],"institution_assertions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.834,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":58,"citation_normalized_percentile":{"value":0.958053,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"54","issue":"2","first_page":"431","last_page":"441"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Methods in Drug Discovery","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Methods in Drug Discovery","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Accelerating Materials Innovation through Informatics","score":0.9951,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Advances in Metabolomics Research","score":0.9158,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/applicability-domain","display_name":"Applicability domain","score":0.7693176},{"id":"https://openalex.org/keywords/qsar-modeling","display_name":"QSAR Modeling","score":0.608874},{"id":"https://openalex.org/keywords/chemical-space","display_name":"Chemical space","score":0.4837887}],"concepts":[{"id":"https://openalex.org/C164126121","wikidata":"https://www.wikidata.org/wiki/Q766383","display_name":"Quantitative structure\u2013activity relationship","level":2,"score":0.87022054},{"id":"https://openalex.org/C107908354","wikidata":"https://www.wikidata.org/wiki/Q4781456","display_name":"Applicability domain","level":3,"score":0.7693176},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.67277753},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.62280214},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.584216},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5414074},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49859023},{"id":"https://openalex.org/C99726746","wikidata":"https://www.wikidata.org/wiki/Q906396","display_name":"Chemical space","level":3,"score":0.4837887},{"id":"https://openalex.org/C12362212","wikidata":"https://www.wikidata.org/wiki/Q728435","display_name":"Linear subspace","level":2,"score":0.43591794},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.4272287},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.41384587},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18375695},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.16353726},{"id":"https://openalex.org/C74187038","wikidata":"https://www.wikidata.org/wiki/Q1418791","display_name":"Drug discovery","level":2,"score":0.12309557},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.09875956},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D021281","descriptor_name":"Quantitative Structure-Activity Relationship","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012044","descriptor_name":"Regression Analysis","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013997","descriptor_name":"Time Factors","qualifier_ui":"","qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci4006595","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/24490838","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":25,"referenced_works":["https://openalex.org/W1480376833","https://openalex.org/W1540105270","https://openalex.org/W1554944419","https://openalex.org/W1970334426","https://openalex.org/W1988037271","https://openalex.org/W2011006316","https://openalex.org/W2014854068","https://openalex.org/W2015931265","https://openalex.org/W2019500309","https://openalex.org/W2023294425","https://openalex.org/W2025421550","https://openalex.org/W2048611698","https://openalex.org/W2054111413","https://openalex.org/W2074681440","https://openalex.org/W2085087514","https://openalex.org/W2085890279","https://openalex.org/W2115104712","https://openalex.org/W2122183194","https://openalex.org/W2126022166","https://openalex.org/W2129512921","https://openalex.org/W2130764285","https://openalex.org/W2131850886","https://openalex.org/W2604272474","https://openalex.org/W2787894218","https://openalex.org/W28412257"],"related_works":["https://openalex.org/W3005120176","https://openalex.org/W2985099987","https://openalex.org/W2746158299","https://openalex.org/W2309296013","https://openalex.org/W2090257471","https://openalex.org/W2057392260","https://openalex.org/W2055287694","https://openalex.org/W1977382278","https://openalex.org/W1970841929","https://openalex.org/W1969085205"],"abstract_inverted_index":{"The":[0,31,166,215],"vastness":[1],"of":[2,33,45,87,91,107,114,131,173,197,208],"chemical":[3],"space":[4],"and":[5,41,127,183],"the":[6,51,55,96,108,112,129,163,171,185,195,234],"relatively":[7],"small":[8],"coverage":[9],"by":[10,136,206],"experimental":[11,56,79],"data":[12,122,180,236],"recording":[13],"molecular":[14],"properties":[15],"require":[16],"us":[17],"to":[18,73,160,179,184,233],"identify":[19],"subspaces,":[20],"or":[21],"domains,":[22],"for":[23,68],"which":[24],"we":[25,82],"can":[26,150,203],"confidently":[27],"apply":[28],"QSAR":[29,34,61,121],"models.":[30],"prediction":[32,103,109,141],"models":[35],"in":[36,60,75,95,162,189,220,226],"these":[37,146,201],"domains":[38],"is":[39,177],"reliable,":[40],"potential":[42],"subsequent":[43],"investigations":[44],"such":[46],"compounds":[47,69,161],"would":[48],"find":[49],"that":[50,63,70,145,155,170,193],"predictions":[52,64],"closely":[53],"match":[54],"values.":[57],"Standard":[58],"approaches":[59,149],"assume":[62],"are":[65,71],"more":[66],"reliable":[67],"\"similar\"":[72],"those":[74],"subspaces":[76],"with":[77,124,140],"denser":[78],"data.":[80],"Here,":[81],"report":[83],"on":[84,158],"a":[85],"study":[86,117],"an":[88,227],"alternative":[89,148],"set":[90,181],"techniques":[92,218],"recently":[93],"proposed":[94],"machine":[97],"learning":[98],"community.":[99],"These":[100],"methods":[101,135,176],"quantify":[102],"confidence":[104],"through":[105],"estimation":[106,213,217],"error":[110],"at":[111,194],"point":[113],"interest.":[115],"Our":[116],"includes":[118],"20":[119],"public":[120],"sets":[123],"continuous":[125],"response":[126],"assesses":[128],"quality":[130,172],"10":[132],"reliability":[133,153,174,212,216],"scoring":[134,175],"observing":[137],"their":[138],"correlation":[139],"error.":[142],"We":[143,191],"show":[144],"new":[147],"outperform":[151],"standard":[152],"scores":[154,209],"rely":[156],"only":[157],"similarity":[159],"training":[164],"set.":[165],"results":[167],"also":[168],"indicate":[169],"sensitive":[178],"characteristics":[182],"regression":[186],"method":[187],"used":[188],"QSAR.":[190],"demonstrate":[192],"cost":[196],"increased":[198],"computational":[199],"complexity":[200],"dependencies":[202],"be":[204],"leveraged":[205],"integration":[207],"from":[210],"various":[211],"approaches.":[214],"described":[219],"this":[221],"paper":[222],"have":[223],"been":[224],"implemented":[225],"open":[228],"source":[229],"add-on":[230],"package":[231],"(https://bitbucket.org/biolab/orange-reliability)":[232],"Orange":[235],"mining":[237],"suite.":[238]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2001459151","counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":8},{"year":2018,"cited_by_count":8},{"year":2017,"cited_by_count":7},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":2}],"updated_date":"2024-11-03T17:01:16.957114","created_date":"2016-06-24"}