{"id":"https://openalex.org/W4361280319","doi":"https://doi.org/10.3389/fbinf.2023.1143014","title":"EGAsubmitter: A software to automate submission of nucleic acid sequencing data to the European Genome-phenome Archive","display_name":"EGAsubmitter: A software to automate submission of nucleic acid sequencing data to the European Genome-phenome Archive","publication_year":2023,"publication_date":"2023-03-30","ids":{"openalex":"https://openalex.org/W4361280319","doi":"https://doi.org/10.3389/fbinf.2023.1143014","pmid":"https://pubmed.ncbi.nlm.nih.gov/37063647"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.3389/fbinf.2023.1143014","pdf_url":"https://www.frontiersin.org/articles/10.3389/fbinf.2023.1143014/pdf","source":{"id":"https://openalex.org/S4210219554","display_name":"Frontiers in Bioinformatics","issn_l":"2673-7647","issn":["2673-7647"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.frontiersin.org/articles/10.3389/fbinf.2023.1143014/pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013652847","display_name":"Marco Viviani","orcid":"https://orcid.org/0000-0003-4698-8870"},"institutions":[{"id":"https://openalex.org/I4210153126","display_name":"Istituti di Ricovero e Cura a Carattere Scientifico","ror":"https://ror.org/04tfzc498","country_code":"IT","type":"healthcare","lineage":["https://openalex.org/I4210153126"]},{"id":"https://openalex.org/I4210151091","display_name":"Candiolo Cancer Institute","ror":"https://ror.org/04wadq306","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210151091","https://openalex.org/I4210153126","https://openalex.org/I4210167100"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Viviani","raw_affiliation_strings":["Candiolo Cancer Institute\u2014FPO IRCCS, Candiolo, Italy","Department of Oncology, University of Torino, Candiolo, Italy"],"affiliations":[{"raw_affiliation_string":"Candiolo Cancer Institute\u2014FPO IRCCS, Candiolo, Italy","institution_ids":["https://openalex.org/I4210153126","https://openalex.org/I4210151091"]},{"raw_affiliation_string":"Department of Oncology, University of Torino, Candiolo, Italy","institution_ids":["https://openalex.org/I4210151091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054523097","display_name":"Marilisa Montemurro","orcid":"https://orcid.org/0000-0001-5643-1385"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Polytechnic University of Turin","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marilisa Montemurro","raw_affiliation_strings":["Politecnico di Torino, Turin, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Torino, Turin, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049302590","display_name":"Livio Trusolino","orcid":"https://orcid.org/0000-0002-6379-3365"},"institutions":[{"id":"https://openalex.org/I4210153126","display_name":"Istituti di Ricovero e Cura a Carattere Scientifico","ror":"https://ror.org/04tfzc498","country_code":"IT","type":"healthcare","lineage":["https://openalex.org/I4210153126"]},{"id":"https://openalex.org/I4210151091","display_name":"Candiolo Cancer Institute","ror":"https://ror.org/04wadq306","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210151091","https://openalex.org/I4210153126","https://openalex.org/I4210167100"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Livio Trusolino","raw_affiliation_strings":["Candiolo Cancer Institute\u2014FPO IRCCS, Candiolo, Italy","Department of Oncology, University of Torino, Candiolo, Italy"],"affiliations":[{"raw_affiliation_string":"Candiolo Cancer Institute\u2014FPO IRCCS, Candiolo, Italy","institution_ids":["https://openalex.org/I4210153126","https://openalex.org/I4210151091"]},{"raw_affiliation_string":"Department of Oncology, University of Torino, Candiolo, Italy","institution_ids":["https://openalex.org/I4210151091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031287599","display_name":"Andrea Bertotti","orcid":"https://orcid.org/0000-0001-8196-7608"},"institutions":[{"id":"https://openalex.org/I4210153126","display_name":"Istituti di Ricovero e Cura a Carattere Scientifico","ror":"https://ror.org/04tfzc498","country_code":"IT","type":"healthcare","lineage":["https://openalex.org/I4210153126"]},{"id":"https://openalex.org/I4210151091","display_name":"Candiolo Cancer Institute","ror":"https://ror.org/04wadq306","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210151091","https://openalex.org/I4210153126","https://openalex.org/I4210167100"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Andrea Bertotti","raw_affiliation_strings":["Candiolo Cancer Institute\u2014FPO IRCCS, Candiolo, Italy","Department of Oncology, University of Torino, Candiolo, Italy"],"affiliations":[{"raw_affiliation_string":"Candiolo Cancer Institute\u2014FPO IRCCS, Candiolo, Italy","institution_ids":["https://openalex.org/I4210153126","https://openalex.org/I4210151091"]},{"raw_affiliation_string":"Department of Oncology, University of Torino, Candiolo, Italy","institution_ids":["https://openalex.org/I4210151091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011857762","display_name":"Gianvito Urgese","orcid":"https://orcid.org/0000-0003-2672-7593"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Polytechnic University of Turin","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Gianvito Urgese","raw_affiliation_strings":["Politecnico di Torino, Turin, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Torino, Turin, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049648750","display_name":"Elena Grassi","orcid":"https://orcid.org/0000-0003-1066-927X"},"institutions":[{"id":"https://openalex.org/I4210151091","display_name":"Candiolo Cancer Institute","ror":"https://ror.org/04wadq306","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210151091","https://openalex.org/I4210153126","https://openalex.org/I4210167100"]},{"id":"https://openalex.org/I4210153126","display_name":"Istituti di Ricovero e Cura a Carattere Scientifico","ror":"https://ror.org/04tfzc498","country_code":"IT","type":"healthcare","lineage":["https://openalex.org/I4210153126"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Elena Grassi","raw_affiliation_strings":["Candiolo Cancer Institute\u2014FPO IRCCS, Candiolo, Italy","Department of Oncology, University of Torino, Candiolo, Italy"],"affiliations":[{"raw_affiliation_string":"Candiolo Cancer Institute\u2014FPO IRCCS, Candiolo, Italy","institution_ids":["https://openalex.org/I4210151091","https://openalex.org/I4210153126"]},{"raw_affiliation_string":"Department of Oncology, University of Torino, Candiolo, Italy","institution_ids":["https://openalex.org/I4210151091"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5049648750"],"corresponding_institution_ids":["https://openalex.org/I4210151091","https://openalex.org/I4210153126"],"apc_list":{"value":1900,"currency":"USD","value_usd":1900,"provenance":"doaj"},"apc_paid":{"value":1900,"currency":"USD","value_usd":1900,"provenance":"doaj"},"fwci":0.0,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":70},"biblio":{"volume":"3","issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11937","display_name":"Data Sharing and Stewardship in Science","score":0.9975,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11937","display_name":"Data Sharing and Stewardship in Science","score":0.9975,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Management and Reproducibility of Scientific Workflows","score":0.9962,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10015","display_name":"RNA Sequencing Data Analysis","score":0.9676,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.77610135},{"id":"https://openalex.org/keywords/genome-annotation","display_name":"genome annotation","score":0.511435},{"id":"https://openalex.org/keywords/data-sharing","display_name":"Data Sharing","score":0.507971},{"id":"https://openalex.org/keywords/perl","display_name":"Perl","score":0.49126524}],"concepts":[{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.7769145},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.77610135},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6750081},{"id":"https://openalex.org/C20136886","wikidata":"https://www.wikidata.org/wiki/Q749647","display_name":"Interoperability","level":2,"score":0.5856115},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.51293916},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.50136137},{"id":"https://openalex.org/C153048206","wikidata":"https://www.wikidata.org/wiki/Q3454922","display_name":"Metadata repository","level":3,"score":0.49719194},{"id":"https://openalex.org/C2777002779","wikidata":"https://www.wikidata.org/wiki/Q42478","display_name":"Perl","level":2,"score":0.49126524},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4601304},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4350793},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.41701388},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.106506586},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.3389/fbinf.2023.1143014","pdf_url":"https://www.frontiersin.org/articles/10.3389/fbinf.2023.1143014/pdf","source":{"id":"https://openalex.org/S4210219554","display_name":"Frontiers in Bioinformatics","issn_l":"2673-7647","issn":["2673-7647"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC10098081","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37063647","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.3389/fbinf.2023.1143014","pdf_url":"https://www.frontiersin.org/articles/10.3389/fbinf.2023.1143014/pdf","source":{"id":"https://openalex.org/S4210219554","display_name":"Frontiers in Bioinformatics","issn_l":"2673-7647","issn":["2673-7647"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"score":0.45,"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":18,"referenced_works":["https://openalex.org/W2017952818","https://openalex.org/W2021037350","https://openalex.org/W2108234281","https://openalex.org/W2110417468","https://openalex.org/W2116041602","https://openalex.org/W2117608012","https://openalex.org/W2129455748","https://openalex.org/W2302501749","https://openalex.org/W2406493898","https://openalex.org/W2530682065","https://openalex.org/W2884419303","https://openalex.org/W3012529551","https://openalex.org/W3027376788","https://openalex.org/W3102028509","https://openalex.org/W3199620625","https://openalex.org/W3213275415","https://openalex.org/W4206412709","https://openalex.org/W4298139967"],"related_works":["https://openalex.org/W3023161639","https://openalex.org/W2972511296","https://openalex.org/W2782431616","https://openalex.org/W2394393789","https://openalex.org/W2379265733","https://openalex.org/W2374379029","https://openalex.org/W2183628870","https://openalex.org/W2008531296","https://openalex.org/W1552553528","https://openalex.org/W1503116306"],"abstract_inverted_index":{"Making":[0],"raw":[1,25],"data":[2,26,50,60,149],"available":[3],"to":[4,27,61,69,136,142,150],"the":[5,11,22,49,53,62,91,123,127,144],"research":[6],"community":[7],"is":[8,67,140],"one":[9],"of":[10,13,24,88,93,108,147],"pillars":[12],"Findability,":[14],"Accessibility,":[15],"Interoperability,":[16],"and":[17,40,52,74,90,134,155],"Reuse":[18],"(FAIR)":[19],"research.":[20],"However,":[21],"submission":[23,128,146],"public":[28],"databases":[29],"still":[30],"involves":[31],"many":[32],"manually":[33],"operated":[34],"procedures":[35],"that":[36,84,121],"are":[37,101],"intrinsically":[38],"time-consuming":[39],"error-prone,":[41],"which":[42,100],"raises":[43],"potential":[44],"reliability":[45],"issues":[46],"for":[47,81],"both":[48],"themselves":[51],"ensuing":[54],"metadata.":[55],"For":[56],"example,":[57],"submitting":[58],"sequencing":[59,148],"European":[63],"Genome-phenome":[64],"Archive":[65],"(EGA)":[66],"estimated":[68],"take":[70],"1":[71],"month":[72],"overall,":[73],"mainly":[75],"relies":[76],"on":[77],"a":[78,105,118],"web":[79],"interface":[80],"metadata":[82,137],"management":[83],"requires":[85],"manual":[86],"completion":[87],"forms":[89],"upload":[92],"several":[94],"comma":[95],"separated":[96],"values":[97],"(CSV)":[98],"files,":[99],"not":[102],"structured":[103],"from":[104,131],"formal":[106],"point":[107],"view.":[109],"To":[110],"tackle":[111],"these":[112],"limitations,":[113],"here":[114],"we":[115],"present":[116],"EGAsubmitter,":[117],"Snakemake-based":[119],"pipeline":[120],"guides":[122],"user":[124,153],"across":[125],"all":[126],"steps,":[129],"ranging":[130],"files":[132],"encryption":[133],"upload,":[135],"submission.":[138],"EGASubmitter":[139],"expected":[141],"streamline":[143],"automated":[145],"EGA,":[151],"minimizing":[152],"errors":[154],"ensuring":[156],"higher":[157],"end":[158],"product":[159],"fidelity.":[160]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4361280319","counts_by_year":[],"updated_date":"2024-10-10T19:27:50.553549","created_date":"2023-03-31"}