{"id":"https://openalex.org/W1835571316","doi":"https://doi.org/10.1186/1471-2105-7-170","title":"BioWarehouse: a bioinformatics database warehouse toolkit","display_name":"BioWarehouse: a bioinformatics database warehouse toolkit","publication_year":2006,"publication_date":"2006-03-23","ids":{"openalex":"https://openalex.org/W1835571316","doi":"https://doi.org/10.1186/1471-2105-7-170","mag":"1835571316","pmid":"https://pubmed.ncbi.nlm.nih.gov/16556315","pmcid":"https://www.ncbi.nlm.nih.gov/pmc/articles/1444936"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-7-170","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-7-170","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-7-170","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013728691","display_name":"Thomas J. Lee","orcid":"https://orcid.org/0009-0006-1831-2485"},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thomas J Lee","raw_affiliation_strings":["Bioinformatics Research Group, SRI International, Menlo Park, USA."],"affiliations":[{"raw_affiliation_string":"Bioinformatics Research Group, SRI International, Menlo Park, USA.","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020288433","display_name":"Yannick Pouliot","orcid":"https://orcid.org/0000-0002-0344-1923"},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yannick Pouliot","raw_affiliation_strings":["Bioinformatics Research Group, SRI International, Menlo Park, USA."],"affiliations":[{"raw_affiliation_string":"Bioinformatics Research Group, SRI International, Menlo Park, USA.","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063604640","display_name":"Valerie Wagner","orcid":"https://orcid.org/0000-0002-4782-2664"},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Valerie Wagner","raw_affiliation_strings":["Bioinformatics Research Group, SRI International, Menlo Park, USA."],"affiliations":[{"raw_affiliation_string":"Bioinformatics Research Group, SRI International, Menlo Park, USA.","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042213306","display_name":"Priyanka Gupta","orcid":"https://orcid.org/0000-0003-2726-9766"},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Priyanka Gupta","raw_affiliation_strings":["Bioinformatics Research Group, SRI International, Menlo Park, USA."],"affiliations":[{"raw_affiliation_string":"Bioinformatics Research Group, SRI International, Menlo Park, USA.","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049616607","display_name":"David WJ Stringer-Calvert","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David WJ Stringer-Calvert","raw_affiliation_strings":["Computer Science Laboratory, Menlo Park, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Laboratory, Menlo Park, USA","institution_ids":["https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052549427","display_name":"Jessica D. Tenenbaum","orcid":"https://orcid.org/0000-0003-3532-565X"},"institutions":[{"id":"https://openalex.org/I4210137306","display_name":"Stanford Medicine","ror":"https://ror.org/03mtd9a03","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210137306","https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jessica D Tenenbaum","raw_affiliation_strings":["Stanford Medical Informatics, Stanford University, Stanford, USA"],"affiliations":[{"raw_affiliation_string":"Stanford Medical Informatics, Stanford University, Stanford, USA","institution_ids":["https://openalex.org/I4210137306"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082071104","display_name":"Peter D. Karp","orcid":"https://orcid.org/0000-0002-5876-6418"},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Peter D Karp","raw_affiliation_strings":["Bioinformatics Research Group, SRI International, Menlo Park, USA."],"affiliations":[{"raw_affiliation_string":"Bioinformatics Research Group, SRI International, Menlo Park, USA.","institution_ids":["https://openalex.org/I1298353152"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072,"provenance":"doaj"},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072,"provenance":"doaj"},"fwci":7.114,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":186,"citation_normalized_percentile":{"value":0.927411,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"7","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10932","display_name":"Microbial Metabolic Engineering and Bioproduction","score":0.9971,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10932","display_name":"Microbial Metabolic Engineering and Bioproduction","score":0.9971,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9918,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9846,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C135572916","wikidata":"https://www.wikidata.org/wiki/Q193351","display_name":"Data warehouse","level":2,"score":0.61007196},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.59301996},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5789132},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.4467231},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.32943684},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.32895055},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.21570608}],"mesh":[{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D003628","descriptor_name":"Database Management Systems","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015202","descriptor_name":"Protein Engineering","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D015202","descriptor_name":"Protein Engineering","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012660","descriptor_name":"Semantics","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015398","descriptor_name":"Signal Transduction","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D015398","descriptor_name":"Signal Transduction","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":"","qualifier_name":null,"is_major_topic":false}],"locations_count":5,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-7-170","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-7-170","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://www.osti.gov/biblio/1626315","pdf_url":null,"source":{"id":"https://openalex.org/S4306402487","display_name":"OSTI OAI (U.S. Department of Energy Office of Scientific and Technical Information)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I139351228","host_organization_name":"Office of Scientific and Technical Information","host_organization_lineage":["https://openalex.org/I139351228"],"host_organization_lineage_names":["Office of Scientific and Technical Information"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://europepmc.org/articles/pmc1444936","pdf_url":"https://europepmc.org/articles/pmc1444936?pdf=render","source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":["European Bioinformatics Institute"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC1444936","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/16556315","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-7-170","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-7-170","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310319965","https://openalex.org/P4310320256"],"host_organization_lineage_names":["Springer Nature","BioMed Central"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.42,"id":"https://metadata.un.org/sdg/9"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":42,"referenced_works":["https://openalex.org/W1569620237","https://openalex.org/W1603241183","https://openalex.org/W1604281503","https://openalex.org/W1968766436","https://openalex.org/W1973415432","https://openalex.org/W1981671919","https://openalex.org/W1983594585","https://openalex.org/W1984345785","https://openalex.org/W1995077427","https://openalex.org/W2003144438","https://openalex.org/W2013171416","https://openalex.org/W2016758618","https://openalex.org/W2033532845","https://openalex.org/W2035923305","https://openalex.org/W2063133646","https://openalex.org/W2070980736","https://openalex.org/W2087157049","https://openalex.org/W2094258495","https://openalex.org/W2096525273","https://openalex.org/W2103017472","https://openalex.org/W2105941683","https://openalex.org/W2111973517","https://openalex.org/W2118579925","https://openalex.org/W2125816119","https://openalex.org/W2132754077","https://openalex.org/W2133034723","https://openalex.org/W2146453000","https://openalex.org/W2158784643","https://openalex.org/W2159482845","https://openalex.org/W2160453515","https://openalex.org/W2160948978","https://openalex.org/W22005843","https://openalex.org/W2255714488","https://openalex.org/W2917140582","https://openalex.org/W31971057","https://openalex.org/W4213149192","https://openalex.org/W4230903726","https://openalex.org/W4231551535","https://openalex.org/W4247964656","https://openalex.org/W4248664566","https://openalex.org/W4285719527","https://openalex.org/W4294216483"],"related_works":["https://openalex.org/W6138692","https://openalex.org/W4200307027","https://openalex.org/W3167309973","https://openalex.org/W2759027785","https://openalex.org/W2543282246","https://openalex.org/W2531755459","https://openalex.org/W2384867819","https://openalex.org/W2373884155","https://openalex.org/W2359411520","https://openalex.org/W1535822977"],"abstract_inverted_index":{"Abstract":[0],"Background":[1],"This":[2],"article":[3],"addresses":[4],"the":[5,27,55,79,95,104,111,146,182,195,225,249,252,265],"problem":[6,268],"of":[7,9,65,81,85,132,184,208,227,243,248,251],"interoperation":[8],"heterogeneous":[10],"bioinformatics":[11,23,148,257],"databases.":[12,198],"Results":[13],"We":[14],"introduce":[15],"BioWarehouse,":[16],"an":[17,174],"open":[18],"source":[19,138],"toolkit":[20],"for":[21,189,206,211,238,269],"constructing":[22],"database":[24,32,47,66,124,266],"warehouses":[25],"using":[26,54],"MySQL":[28],"and":[29,73,90,92,100,103,113,117,164,170,230,234],"Oracle":[30],"relational":[31,123],"managers.":[33],"BioWarehouse":[34,76,179,260],"integrates":[35],"its":[36],"component":[37],"databases":[38,86,120],"into":[39,121],"a":[40,45,63,82,122,130,236],"common":[41],"representational":[42],"framework":[43],"within":[44],"single":[46],"management":[48],"system,":[49],"thus":[50],"enabling":[51],"multi-database":[52],"queries":[53,242],"Structured":[56],"Query":[57],"Language":[58],"(SQL)":[59],"but":[60],"also":[61,128],"facilitating":[62],"variety":[64],"integration":[67,80,267],"tasks":[68],"such":[69],"as":[70],"comparative":[71],"analysis":[72],"data":[74,222,253],"mining.":[75],"currently":[77],"supports":[78,145],"pathway-centric":[83],"set":[84],"including":[87],"ENZYME,":[88],"KEGG,":[89],"BioCyc,":[91],"in":[93,110,194,220],"addition":[94],"UniProt,":[96],"GenBank,":[97],"NCBI":[98],"Taxonomy,":[99],"CMR":[101],"databases,":[102],"Gene":[105],"Ontology.":[106],"Loader":[107],"tools,":[108],"written":[109],"C":[112],"JAVA":[114],"languages,":[115],"parse":[116],"load":[118],"these":[119],"schema.":[125],"The":[126,143,199],"loaders":[127],"apply":[129],"degree":[131],"semantic":[133,141],"normalization":[134],"to":[135,180,256],"their":[136],"respective":[137],"data,":[139],"decreasing":[140],"heterogeneity.":[142],"schema":[144],"following":[147],"datatypes:":[149],"chemical":[150],"compounds,":[151],"biochemical":[152],"reactions,":[153],"metabolic":[154,231,239],"pathways,":[155],"proteins,":[156],"genes,":[157],"nucleic":[158],"acid":[159],"sequences,":[160,166],"features":[161],"on":[162,264],"protein":[163],"nucleic-acid":[165],"organisms,":[167],"organism":[168],"taxonomies,":[169],"controlled":[171],"vocabularies.":[172],"As":[173],"application":[175],"example,":[176],"we":[177],"applied":[178],"determine":[181],"fraction":[183],"biochemically":[185],"characterized":[186],"enzyme":[187,209],"activities":[188,210],"which":[190,212],"no":[191,203],"sequences":[192],"exist":[193],"public":[196],"sequence":[197,204,221],"answer":[200],"is":[201],"that":[202],"exists":[205],"36%":[207],"EC":[213],"numbers":[214],"have":[215],"been":[216],"assigned.":[217],"These":[218],"gaps":[219],"significantly":[223],"limit":[224],"accuracy":[226],"genome":[228],"annotation":[229],"pathway":[232],"prediction,":[233],"are":[235],"barrier":[237],"engineering.":[240],"Complex":[241],"this":[244],"type":[245],"provide":[246],"examples":[247],"value":[250],"warehousing":[254],"approach":[255],"research.":[258],"Conclusion":[259],"embodies":[261],"significant":[262],"progress":[263],"bioinformatics.":[270]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1835571316","counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":6},{"year":2016,"cited_by_count":8},{"year":2015,"cited_by_count":8},{"year":2014,"cited_by_count":7},{"year":2013,"cited_by_count":18},{"year":2012,"cited_by_count":20}],"updated_date":"2024-12-11T12:22:16.344091","created_date":"2016-06-24"}