{"id":"https://openalex.org/W4403788141","doi":"https://doi.org/10.48550/arxiv.2409.16183","title":"Expert-level vision-language foundation model for real-world radiology\n and comprehensive evaluation","display_name":"Expert-level vision-language foundation model for real-world radiology\n and comprehensive evaluation","publication_year":2024,"publication_date":"2024-09-24","ids":{"openalex":"https://openalex.org/W4403788141","doi":"https://doi.org/10.48550/arxiv.2409.16183"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.16183","pdf_url":"http://arxiv.org/pdf/2409.16183","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2409.16183","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100321192","display_name":"Xiaohong Liu","orcid":"https://orcid.org/0000-0002-0818-1059"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiaohong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101633476","display_name":"Guoxing Yang","orcid":"https://orcid.org/0000-0002-1019-2021"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Guoxing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100521856","display_name":"Yulin Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Yulin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113306648","display_name":"Jiaji Mao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mao, Jiaji","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100368805","display_name":"Xiang Zhang","orcid":"https://orcid.org/0000-0001-5097-2113"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075501144","display_name":"Ming Gao","orcid":"https://orcid.org/0000-0003-3397-5659"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Ming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013030532","display_name":"Shanghang Zhang","orcid":"https://orcid.org/0000-0003-4047-3526"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shanghang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100722023","display_name":"Jun Shen","orcid":"https://orcid.org/0000-0002-8881-9189"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100458577","display_name":"Guangyu Wang","orcid":"https://orcid.org/0000-0003-1312-884X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Guangyu","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":{"min":0,"max":86},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T13062","display_name":"Theoretical Framework of Cognitive Informatics and Computational Intelligence","score":0.6003,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13062","display_name":"Theoretical Framework of Cognitive Informatics and Computational Intelligence","score":0.6003,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.80485857},{"id":"https://openalex.org/keywords/knowledge-representation","display_name":"Knowledge Representation","score":0.482345}],"concepts":[{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.80485857},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.505318},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42751133},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38023517},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.34462026},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.20154634},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.11518985}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.16183","pdf_url":"http://arxiv.org/pdf/2409.16183","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.16183","pdf_url":"http://arxiv.org/pdf/2409.16183","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391913857","https://openalex.org/W4391375266","https://openalex.org/W3204019825","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2381393187","https://openalex.org/W2358668433","https://openalex.org/W2358060160","https://openalex.org/W2332779545"],"abstract_inverted_index":{"Radiology":[0],"is":[1,93],"a":[2,30,82,142,158,184],"vital":[3],"and":[4,11,54,65,84,105,114,123,137,141,205,222],"complex":[5],"component":[6],"of":[7,100,229],"modern":[8],"clinical":[9,244],"workflow":[10],"covers":[12],"many":[13],"tasks.":[14,36],"Recently,":[15],"vision-language":[16,52,86,167],"(VL)":[17],"foundation":[18,87,216],"models":[19,43,217],"in":[20,25,62,73,234],"medicine":[21],"have":[22],"shown":[23],"potential":[24,240],"processing":[26],"multimodal":[27,60,121],"information,":[28,140],"offering":[29],"unified":[31,143],"solution":[32],"for":[33,90,241],"various":[34],"radiology":[35,63,162,235],"However,":[37],"existing":[38],"studies":[39],"either":[40],"pre-trained":[41],"VL":[42,215],"on":[44,95,190,218],"natural":[45],"data":[46],"or":[47],"did":[48],"not":[49],"fully":[50,151],"integrate":[51],"architecture":[53],"pretraining,":[55],"often":[56],"neglecting":[57],"the":[58,96,153,191,227],"unique":[59],"complexity":[61],"images":[64,104,199,203,207],"their":[66,70],"textual":[67],"contexts.":[68],"Additionally,":[69],"practical":[71],"applicability":[72,239],"real-world":[74,192],"scenarios":[75],"remains":[76],"underexplored.":[77],"Here,":[78],"we":[79,156],"present":[80],"RadFound,":[81],"large":[83],"open-source":[85],"model":[88],"tailored":[89,147],"radiology,":[91],"that":[92],"trained":[94],"most":[97],"extensive":[98],"dataset":[99],"over":[101],"8.1":[102],"million":[103],"250,000":[106],"image-text":[107],"pairs,":[108],"covering":[109],"19":[110],"major":[111],"organ":[112],"systems":[113],"10":[115],"imaging":[116],"modalities.":[117],"To":[118,150],"establish":[119],"expert-level":[120],"perception":[122],"generation":[124,173],"capabilities,":[125],"RadFound":[126,211,230],"introduces":[127],"an":[128,232],"enhanced":[129],"vision":[130],"encoder":[131],"to":[132,148,178],"capture":[133],"intra-image":[134],"local":[135],"features":[136],"inter-image":[138],"contextual":[139],"cross-modal":[144],"learning":[145],"design":[146],"radiology.":[149],"assess":[152],"models'":[154],"capability,":[155],"construct":[157],"benchmark,":[159],"RadVLBench,":[160],"including":[161],"interpretation":[163],"tasks":[164,174],"like":[165],"medical":[166],"question-answering,":[168],"as":[169,171],"well":[170],"text":[172],"ranging":[175],"from":[176],"captioning":[177],"report":[179],"generation.":[180],"We":[181],"also":[182],"propose":[183],"human":[185,223],"evaluation":[186],"framework.":[187],"When":[188],"evaluated":[189],"benchmark":[193],"involving":[194],"three":[195],"representative":[196],"modalities,":[197],"2D":[198],"(chest":[200],"X-rays),":[201],"multi-view":[202],"(mammograms),":[204],"3D":[206],"(thyroid":[208],"CT":[209],"scans),":[210],"significantly":[212],"outperforms":[213],"other":[214],"both":[219],"quantitative":[220],"metrics":[221],"evaluation.":[224],"In":[225],"summary,":[226],"development":[228],"represents":[231],"advancement":[233],"generalists,":[236],"demonstrating":[237],"broad":[238],"integration":[242],"into":[243],"workflows.":[245]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4403788141","counts_by_year":[],"updated_date":"2024-10-27T08:44:17.138187","created_date":"2024-10-26"}