<!-- CINXE.COM
BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes | Molecular Biology and Evolution | Oxford Academic -->
<!DOCTYPE html> <html lang="en" class="no-js"> <head> <!-- charset must appear in the first 1024 bytes of the document --> <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> <title>BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes | Molecular Biology and Evolution | Oxford Academic</title> <script type='text/javascript' defer src='//js.trendmd.com/trendmd.min.js' data-trendmdconfig='{"element":"#trendmd-suggestions"}' class='optanon-category-C0002'></script> <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.7.1/jquery.min.js" type="text/javascript"></script> <script>window.jQuery || document.write('<script src="//oup.silverchair-cdn.com/Themes/Silver/app/js/jquery.3.7.1.min.js" type="text/javascript">\x3C/script>')</script> <script src="//oup.silverchair-cdn.com/Themes/Silver/app/vendor/v-638654880267142888/jquery-migrate-1.4.1.min.js" type="text/javascript"></script> <script type='text/javascript' src='https://platform-api.sharethis.com/js/sharethis.js#property=643701de45aa460012e1032e&product=sop' async='async' class='optanon-category-C0004'></script> <meta name="viewport" content="width=device-width, initial-scale=1, maximum-scale=10" /> <meta http-equiv="X-UA-Compatible" content="IE=Edge" /> <!-- Turn off telephone number detection. 
--> <meta name="format-detection" content="telephone=no" />
<!-- Bookmark Icons -->
<link rel="apple-touch-icon" sizes="180x180" href="//oup.silverchair-cdn.com/UI/app/img/v-638654879241847311/apple-touch-icon.png">
<link rel="icon" type="image/png" href="//oup.silverchair-cdn.com/UI/app/img/v-638654879242047735/favicon-32x32.png" sizes="32x32">
<link rel="icon" type="image/png" href="//oup.silverchair-cdn.com/UI/app/img/v-638654879241997236/favicon-16x16.png" sizes="16x16">
<link rel="mask-icon" href="//oup.silverchair-cdn.com/UI/app/img/v-638654879242697268/safari-pinned-tab.svg" color="#001C54">
<link rel="icon" href="//oup.silverchair-cdn.com/UI/app/img/v-638654879242147229/favicon.ico">
<link rel="manifest" href="//oup.silverchair-cdn.com/UI/app/img/v-638654879242447968/manifest.json">
<meta name="msapplication-config" content="//oup.silverchair-cdn.com/UI/app/img/v-638654879241847311/browserconfig.xml">
<meta name="theme-color" content="#002f65">
<!-- Stylesheets. The Google Fonts sheet is fetched as a preload and switched to rel="stylesheet" by its onload handler. -->
<link rel="stylesheet" type="text/css" href="//oup.silverchair-cdn.com/UI/app/fonts/icons.css" />
<link rel="stylesheet" type="text/css" href="//oup.silverchair-cdn.com/Themes/Client/app/css/v-638669719594245124/site.min.css" />
<link rel="preload" href="https://fonts.googleapis.com/css?family=Merriweather:300,400,400italic,700,700italic|Source+Sans+Pro:400,400italic,700,700italic" as="style" onload="this.onload=null;this.rel='stylesheet'">
<link href="//oup.silverchair-cdn.com/data/SiteBuilderAssetsOriginals/Live/CSS/journals/v-638647548564311250/global.css" rel="stylesheet" type="text/css" />
<link href="//oup.silverchair-cdn.com/data/SiteBuilderAssets/Live/CSS/mbe/v-637435494140226869/Site.css" rel="stylesheet" type="text/css" />
<script>
  /* Article metadata seeded into the global dataLayer array.
     Line breaks are placed only BETWEEN members: a raw line break inside a
     quoted string literal is a SyntaxError and would leave dataLayer undefined. */
  var dataLayer = [{
    "full_title":"BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes",
    "short_title":"BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes",
    "authors":"Mosè Manni,Matthew R Berkeley,Mathieu Seppey,Felipe A Simão,Evgeny M Zdobnov",
    "issue_and_volume":"Volume 38 | Issue 10",
    "type":"letter",
    "online_publication_date":"2021-07-28",
    "access_type":"Open Access",
    "license_type":"cc-by",
    "event_type":"full-text",
    "discipline_ot_level_1":"Science and Mathematics",
    "discipline_ot_level_2":"Biological Sciences",
    "supplier_tag":"SC_Journals",
    "object_type":"Article",
    "taxonomy":"taxId%3a39%7ctaxLabel%3aAcademicSubjects%7cnodeId%3aSCI01180%7cnodeLabel%3aMolecular+and+Cell+Biology%7cnodeLevel%3a3%3btaxId%3a39%7ctaxLabel%3aAcademicSubjects%7cnodeId%3aSCI01130%7cnodeLabel%3aEvolutionary+Biology%7cnodeLevel%3a3",
    "siteid":"molbev",
    "authzrequired":"false",
    "doi":"10.1093/molbev/msab199"
  }];
</script>
<script>
  /* Tag-manager loader: records a 'gtm.start' event on w[l], then builds an
     async script element j that is inserted before the first script element f. */
  (function (w, d, s, l, i) {
    w[l] = w[l] || [];
    w[l].push({ 'gtm.start': new Date().getTime(), event: 'gtm.js' });
    var f = d.getElementsByTagName(s)[0],
      j = d.createElement(s),
      dl = l != 'dataLayer' ?
'&l=' + l : '';
    j.async = true;
    j.src = 'https://www.googletagmanager.com/gtm.js?id=' + i + dl;
    f.parentNode.insertBefore(j, f);
  })(window, document, 'script', 'dataLayer', 'GTM-W6DD7HV');
</script>
<script type="text/javascript">
  /* Global App namespace: login flags plus the journal subdomain and site URL. */
  var App = App || {};
  App.LoginUserInfo = { isInstLoggedIn: 0, isIndividualLoggedIn: 0 };
  App.CurrentSubdomain = 'mbe';
  App.SiteURL = 'academic.oup.com/mbe';
</script>
<!-- Chartist CSS is requested with media="print" and switched to all media by its onload handler. -->
<link href="https://cdn.jsdelivr.net/chartist.js/latest/chartist.min.css" media="print" onload="this.onload=null;this.removeAttribute('media');" rel="stylesheet" type="text/css" />
<!-- schema.org description of the article. JSON has no comment syntax and forbids raw
     line breaks inside string values, so lines are broken only between members. -->
<script type="application/ld+json">
{
  "@context":"https://schema.org",
  "@type":"ScholarlyArticle",
  "@id":"https://academic.oup.com/mbe/article/38/10/4647/6329644",
  "name":"BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes",
  "datePublished":"2021-07-28",
  "isPartOf":{"@id":"https://academic.oup.com/mbe/issue/38/10","@type":"PublicationIssue","issueNumber":"10","datePublished":"2021-09-27","isPartOf":{"@id":"https://academic.oup.com/mbe/mbe","@type":"Periodical","name":"Molecular Biology and Evolution","issn":["1537-1719"]}},
  "url":"https://dx.doi.org/10.1093/molbev/msab199",
  "keywords":["quality assessment","completeness","genome","transcriptome","prokaryotes","eukaryotes","viruses","microbes","metagenomes"],
  "inLanguage":"en",
  "copyrightHolder":"Society for Molecular Biology and Evolution",
  "copyrightYear":"2024",
  "publisher":"Oxford University Press",
  "author":[
    {"name":"Manni, Mosè","affiliation":"Department of Genetic Medicine and Development, University of Geneva , Geneva, Switzerland Swiss Institute of Bioinformatics , Geneva, Switzerland","@type":"Person","sameAs":"https://orcid.org/0000-0002-4146-6523"},
    {"name":"Berkeley, Matthew R","affiliation":"Department of Genetic Medicine and Development, University of Geneva , Geneva, Switzerland Swiss Institute of Bioinformatics , Geneva, Switzerland","@type":"Person"},
    {"name":"Seppey, Mathieu","affiliation":"Department of Genetic Medicine and Development, University of Geneva , Geneva, Switzerland Swiss Institute of Bioinformatics , Geneva, Switzerland","@type":"Person"},
    {"name":"Simão, Felipe A","affiliation":"Department of Genetic Medicine and Development, University of Geneva , Geneva, Switzerland Swiss Institute of Bioinformatics , Geneva, Switzerland","@type":"Person"},
    {"name":"Zdobnov, Evgeny M","affiliation":"Department of Genetic Medicine and Development, University of Geneva , Geneva, Switzerland Swiss Institute of Bioinformatics , Geneva, Switzerland","@type":"Person"}
  ],
  "description":"Abstract. Methods for evaluating the quality of genomic and metagenomic data are essential to aid genome assembly procedures and to correctly interpret the",
  "pageStart":"4647",
  "pageEnd":"4654",
  "siteName":"OUP Academic",
  "thumbnailURL":"https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f1.jpeg?Expires=1794517789&Signature=eWh7HHHsCYWezRFtAFWvRluAqs7ihfBK1ywy~T3hpQgJYqVXx3JbKxXf70K4y7jC31FHEUbKDhlkWFwIRIluyMgbbzXndgNn6ZfbAfZjQAd-O316IMijKLMZmTOb5M7Y2b-898e9zuDENQViMXzYWW2uxzwN29O1Aqq4yShaCfBHqA4lnIxoQ5Rj87IAGxI9Rgf8DPVCVPziLHOvv2edjOV-gQRpjy9e0JSpC9cp9GmuwwYVFeQXhdbdbo34b7hQhh9ySRE1TQSNcy9t61Wy6cgV-kXyHu0VHKL99eFHyKxBouWDtZ8mgRcjhVkLIccSgX7s2d5nA9LFJyngqJsJUg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA",
  "headline":"BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes",
  "image":"https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f1.jpeg?Expires=1794517789&Signature=eWh7HHHsCYWezRFtAFWvRluAqs7ihfBK1ywy~T3hpQgJYqVXx3JbKxXf70K4y7jC31FHEUbKDhlkWFwIRIluyMgbbzXndgNn6ZfbAfZjQAd-O316IMijKLMZmTOb5M7Y2b-898e9zuDENQViMXzYWW2uxzwN29O1Aqq4yShaCfBHqA4lnIxoQ5Rj87IAGxI9Rgf8DPVCVPziLHOvv2edjOV-gQRpjy9e0JSpC9cp9GmuwwYVFeQXhdbdbo34b7hQhh9ySRE1TQSNcy9t61Wy6cgV-kXyHu0VHKL99eFHyKxBouWDtZ8mgRcjhVkLIccSgX7s2d5nA9LFJyngqJsJUg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA",
  "image:alt":"Comparison of the number of complete BUSCOs obtained by running BUSCO v5 and v3 with BUSCO odb_10 and odb_9 data sets on (a) bacterial, (b) fungal, and (c) metazoan gene sets."
}
</script>
<!-- Open Graph metadata -->
<meta property="og:site_name" content="OUP Academic" />
<meta property="og:title" content="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" />
<meta property="og:description" content="Abstract.
Methods for evaluating the quality of genomic and metagenomic data are essential to aid genome assembly procedures and to correctly interpret the" /> <meta property="og:type" content="article" /> <meta property="og:url" content="https://dx.doi.org/10.1093/molbev/msab199" /> <meta property="og:updated_time" content="" /> <meta property="og:image" content="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f1.jpeg?Expires=1794517789&Signature=eWh7HHHsCYWezRFtAFWvRluAqs7ihfBK1ywy~T3hpQgJYqVXx3JbKxXf70K4y7jC31FHEUbKDhlkWFwIRIluyMgbbzXndgNn6ZfbAfZjQAd-O316IMijKLMZmTOb5M7Y2b-898e9zuDENQViMXzYWW2uxzwN29O1Aqq4yShaCfBHqA4lnIxoQ5Rj87IAGxI9Rgf8DPVCVPziLHOvv2edjOV-gQRpjy9e0JSpC9cp9GmuwwYVFeQXhdbdbo34b7hQhh9ySRE1TQSNcy9t61Wy6cgV-kXyHu0VHKL99eFHyKxBouWDtZ8mgRcjhVkLIccSgX7s2d5nA9LFJyngqJsJUg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA" /> <meta property="og:image:url" content="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f1.jpeg?Expires=1794517789&Signature=eWh7HHHsCYWezRFtAFWvRluAqs7ihfBK1ywy~T3hpQgJYqVXx3JbKxXf70K4y7jC31FHEUbKDhlkWFwIRIluyMgbbzXndgNn6ZfbAfZjQAd-O316IMijKLMZmTOb5M7Y2b-898e9zuDENQViMXzYWW2uxzwN29O1Aqq4yShaCfBHqA4lnIxoQ5Rj87IAGxI9Rgf8DPVCVPziLHOvv2edjOV-gQRpjy9e0JSpC9cp9GmuwwYVFeQXhdbdbo34b7hQhh9ySRE1TQSNcy9t61Wy6cgV-kXyHu0VHKL99eFHyKxBouWDtZ8mgRcjhVkLIccSgX7s2d5nA9LFJyngqJsJUg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA" /> <meta property="og:image:secure_url" 
content="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f1.jpeg?Expires=1794517789&Signature=eWh7HHHsCYWezRFtAFWvRluAqs7ihfBK1ywy~T3hpQgJYqVXx3JbKxXf70K4y7jC31FHEUbKDhlkWFwIRIluyMgbbzXndgNn6ZfbAfZjQAd-O316IMijKLMZmTOb5M7Y2b-898e9zuDENQViMXzYWW2uxzwN29O1Aqq4yShaCfBHqA4lnIxoQ5Rj87IAGxI9Rgf8DPVCVPziLHOvv2edjOV-gQRpjy9e0JSpC9cp9GmuwwYVFeQXhdbdbo34b7hQhh9ySRE1TQSNcy9t61Wy6cgV-kXyHu0VHKL99eFHyKxBouWDtZ8mgRcjhVkLIccSgX7s2d5nA9LFJyngqJsJUg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA" /> <meta property="og:image:alt" content="Comparison of the number of complete BUSCOs obtained by running BUSCO v5 and v3 with BUSCO odb_10 and odb_9 data sets on (a) bacterial, (b) fungal, and (c) metazoan gene sets." /> <meta name="twitter:card" content="summary_large_image" /> <meta name="citation_author" content="Manni, Mosè" /><meta name="citation_author_institution" content="Department of Genetic Medicine and Development, University of Geneva, Geneva, Switzerland" /><meta name="citation_author_institution" content="Swiss Institute of Bioinformatics, Geneva, Switzerland" /><meta name="citation_author" content="Berkeley, Matthew R" /><meta name="citation_author_institution" content="Department of Genetic Medicine and Development, University of Geneva, Geneva, Switzerland" /><meta name="citation_author_institution" content="Swiss Institute of Bioinformatics, Geneva, Switzerland" /><meta name="citation_author" content="Seppey, Mathieu" /><meta name="citation_author_institution" content="Department of Genetic Medicine and Development, University of Geneva, Geneva, Switzerland" /><meta name="citation_author_institution" content="Swiss Institute of Bioinformatics, Geneva, Switzerland" /><meta name="citation_author" content="Simão, Felipe A" /><meta name="citation_author_institution" content="Department of Genetic Medicine and Development, University of Geneva, Geneva, Switzerland" /><meta name="citation_author_institution" content="Swiss 
Institute of Bioinformatics, Geneva, Switzerland" /><meta name="citation_author" content="Zdobnov, Evgeny M" /><meta name="citation_author_institution" content="Department of Genetic Medicine and Development, University of Geneva, Geneva, Switzerland" /><meta name="citation_author_institution" content="Swiss Institute of Bioinformatics, Geneva, Switzerland" /><meta name="citation_title" content="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" /><meta name="citation_firstpage" content="4647" /><meta name="citation_lastpage" content="4654" /><meta name="citation_doi" content="10.1093/molbev/msab199" /><meta name="citation_journal_title" content="Molecular Biology and Evolution" /><meta name="citation_journal_abbrev" content="Mol Biol Evol" /><meta name="citation_volume" content="38" /><meta name="citation_issue" content="10" /><meta name="citation_publication_date" content="2021/09/27" /><meta name="citation_publisher" content="Oxford Academic" /><meta name="citation_reference" content="citation_title=NCBI viral genomes resource; citation_author=Brister JR; citation_author=Ako-adjei D; citation_author=Bao Y; citation_author=Blinkova O.; citation_journal_title=Nucleic Acids Res; citation_year=2015; citation_volume=43(Database issue; citation_pages=D571-D577; " /><meta name="citation_reference" content="citation_title=Anvi’o: an advanced analysis and visualization platform for ‘omics data; citation_author=Eren AM; citation_author=Esen ÖC; citation_author=Quince C; citation_author=Vineis JH; citation_author=Morrison HG; citation_author=Sogin ML; citation_author=Delmont TO.; citation_journal_title=PeerJ; citation_year=2015; citation_volume=3; citation_pages=e1319" /><meta name="citation_reference" content="citation_title=Bioconda: sustainable and comprehensive software distribution for the life sciences; citation_author=Grüning B; citation_author=Dale R; 
citation_author=Sjödin A; citation_author=Chapman BA; citation_author=Rowe J; citation_author=Tomkins-Tinch CH; citation_author=Valieris R; citation_author=Köster J; citation_journal_title=Nat Methods; citation_year=2018; citation_volume=15; citation_issue=7; citation_pages=475-476; " /><meta name="citation_reference" content="citation_title=Prodigal: prokaryotic gene recognition and translation initiation site identification; citation_author=Hyatt D; citation_author=Chen G-L; citation_author=LoCascio PF; citation_author=Land ML; citation_author=Larimer FW; citation_author=Hauser LJ.; citation_journal_title=BMC Bioinformatics; citation_year=2010; citation_volume=11; citation_pages=119" /><meta name="citation_reference" content="citation_title=OrthoDB v10: sampling the diversity of animal, plant, fungal, protist, bacterial and viral genomes for evolutionary and functional annotations of orthologs; citation_author=Kriventseva EV; citation_author=Kuznetsov D; citation_author=Tegenfeldt F; citation_author=Manni M; citation_author=Dias R; citation_author=Simão FA; citation_author=Zdobnov EM.; citation_journal_title=Nucleic Acids Res; citation_year=2019; citation_volume=47; citation_issue=D1; citation_pages=D807-D811; " /><meta name="citation_reference" content="citation_title=MetaEuk—sensitive, high-throughput gene discovery, and annotation for large-scale eukaryotic metagenomics; citation_author=Levy Karin E; citation_author=Mirdita M; citation_author=Söding J.; citation_journal_title=Microbiome; citation_year=2020; citation_volume=8; citation_issue=1; citation_pages=48" /><meta name="citation_reference" content="citation_title=pplacer: linear time maximum-likelihood and Bayesian phylogenetic placement of sequences onto a fixed reference tree; citation_author=Matsen FA; citation_author=Kodner RB; citation_author=Armbrust EV.; citation_journal_title=BMC Bioinformatics; citation_year=2010; citation_volume=11; citation_pages=538" /><meta name="citation_reference" 
content="citation_title=Docker: lightweight Linux containers for consistent development and deployment; citation_author=Merkel D.; citation_journal_title=Linux J; citation_year=2014; citation_volume=2; citation_pages=2" /><meta name="citation_reference" content="citation_author=Mirarab S; citation_author=Nguyen N; citation_author=Warnow T.; citation_publisher=World Scientific, Kohala Coast (HI; citation_title=SEPP: SATé-enabled phylogenetic placement; citation_year=2011; citation_pages=247-258; " /><meta name="citation_reference" content="citation_title=Sustainable data analysis with Snakemake; citation_author=Mölder F; citation_author=Jablonski KP; citation_author=Letcher B; citation_author=Hall MB; citation_author=Tomkins-Tinch CH; citation_author=Sochat V; citation_author=Forster J; citation_author=Lee S; citation_author=Twardziok SO; citation_author=Kanitz A; citation_journal_title=F1000Res; citation_year=2021; citation_volume=10; citation_pages=33" /><meta name="citation_reference" content="citation_title=CheckV assesses the quality and completeness of metagenome-assembled viral genomes; citation_author=Nayfach S; citation_author=Camargo AP; citation_author=Schulz F; citation_author=Eloe-Fadrosh E; citation_author=Roux S; citation_author=Kyrpides NC.; citation_journal_title=Nat Biotechnol; citation_year=2021; citation_volume=39; citation_pages=578-585; " /><meta name="citation_reference" content="citation_title=Reference sequence (RefSeq) database at NCBI: current status, taxonomic expansion, and functional annotation; citation_author=O’Leary NA; citation_author=Wright MW; citation_author=Brister JR; citation_author=Ciufo S; citation_author=Haddad D; citation_author=McVeigh R; citation_author=Rajput B; citation_author=Robbertse B; citation_author=Smith-White B; citation_author=Ako-Adjei D; citation_journal_title=Nucleic Acids Res; citation_year=2016; citation_volume=44; citation_issue=D1; citation_pages=D733-D745; " /><meta name="citation_reference" 
content="citation_title=CheckM: assessing the quality of microbial genomes recovered from isolates, single cells, and metagenomes; citation_author=Parks DH; citation_author=Imelfort M; citation_author=Skennerton CT; citation_author=Hugenholtz P; citation_author=Tyson GW.; citation_journal_title=Genome Res; citation_year=2015; citation_volume=25; citation_issue=7; citation_pages=1043-1055; " /><meta name="citation_reference" content="citation_title=CEGMA: a pipeline to accurately annotate core genes in eukaryotic genomes; citation_author=Parra G; citation_author=Bradnam K; citation_author=Korf I.; citation_journal_title=Bioinformatics; citation_year=2007; citation_volume=23; citation_issue=9; citation_pages=1061-1067; " /><meta name="citation_reference" content="citation_publisher=R Foundation for Statistical Computing, Vienna (Austria; citation_title=R: a language and environment for statistical computing; citation_year=2020; " /><meta name="citation_reference" content="citation_title=Estimating the quality of eukaryotic genomes recovered from metagenomic analysis with EukCC; citation_author=Saary P; citation_author=Mitchell AL; citation_author=Finn RD.; citation_journal_title=Genome Biol; citation_year=2020; citation_volume=21; citation_issue=1; citation_pages=244" /><meta name="citation_reference" content="citation_title=BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs; citation_author=Simão FA; citation_author=Waterhouse RM; citation_author=Ioannidis P; citation_author=Kriventseva EV; citation_author=Zdobnov EM.; citation_journal_title=Bioinformatics; citation_year=2015; citation_volume=31; citation_issue=19; citation_pages=3210-3212; " /><meta name="citation_reference" content="citation_title=Using native and syntenically mapped cDNA alignments to improve de novo gene finding; citation_author=Stanke M; citation_author=Diekhans M; citation_author=Baertsch R; citation_author=Haussler D.; 
citation_journal_title=Bioinformatics; citation_year=2008; citation_volume=24; citation_issue=5; citation_pages=637-644; " /><meta name="citation_reference" content="citation_title=MMseqs2 enables sensitive protein sequence searching for the analysis of massive data sets; citation_author=Steinegger M; citation_author=Söding J.; citation_journal_title=Nat Biotechnol; citation_year=2017; citation_volume=35; citation_issue=11; citation_pages=1026-1028; " /><meta name="citation_reference" content="citation_title=Evolution of microsporidia: an extremely successful group of eukaryotic intracellular parasites; citation_author=Wadi L; citation_author=Reinke AW.; citation_journal_title=PLoS Pathog; citation_year=2020; citation_volume=16; citation_issue=2; citation_pages=e1008276" /><meta name="citation_reference" content="citation_title=BUSCO applications from quality assessments to gene prediction and phylogenomics; citation_author=Waterhouse RM; citation_author=Seppey M; citation_author=Simão FA; citation_author=Manni M; citation_author=Ioannidis P; citation_author=Klioutchnikov G; citation_author=Kriventseva EV; citation_author=Zdobnov EM.; citation_journal_title=Mol Biol Evol; citation_year=2018; citation_volume=35; citation_issue=3; citation_pages=543-548; " /><meta name="citation_reference" content="citation_author=Wickham H.; citation_publisher=Springer-Verlag, New York; citation_title=ggplot2: elegant graphics for data analysis; citation_year=2009; " /><meta name="citation_reference" content="citation_title=OrthoDB in 2020: evolutionary and functional annotations of orthologs; citation_author=Zdobnov EM; citation_author=Kuznetsov D; citation_author=Tegenfeldt F; citation_author=Manni M; citation_author=Berkeley M; citation_author=Kriventseva EV.; citation_journal_title=Nucleic Acids Res; citation_year=2021; citation_volume=49; citation_issue=D1; citation_pages=D389-D393; " /><meta name="citation_fulltext_world_readable" content="" /><meta name="citation_pdf_url" 
content="https://academic.oup.com/mbe/article-pdf/38/10/4647/40449445/msab199.pdf" />
<meta name="description" content="Abstract. Methods for evaluating the quality of genomic and metagenomic data are essential to aid genome assembly procedures and to correctly interpret the" />
<meta name="citation_xml_url" content="https://academic.oup.com/mbe/article-xml/38/10/4647/6329644" />
<link rel="canonical" href="https://academic.oup.com/mbe/article/38/10/4647/6329644" />
<!-- A meta element with a name must also carry content; an empty value matches the earlier tag of the same name. -->
<meta name="citation_fulltext_world_readable" content="" />
<meta name="product_code" content="J_MOLBEV_2021_01_12" />
<meta name="product_code" content="J_MOLBEV_1996_01_9999" />
<meta name="product_code" content="J_MOLBEV_2020_12_13" />
<meta name="product_code" content="J_MOLBEV_2021_02_13" />
<meta name="product_code" content="J_MOLBEV_2020_11_13" />
<meta name="product_code" content="OPEN_ACCESS" />
<meta name="product_code" content="j_ALLJOURNALS" />
<meta name="product_code" content="MBE_all_free" />
<meta name="product_code" content="SOLR_FACET_FREE" />
<meta name="product_code" content="J_6329644" />
<meta name="product_code" content="I_131323" />
<script>
  var SCM = SCM || {};
  SCM.pubGradeAdsEnabled = true;
  SCM.pubGradeJSLibrary = 'https://cdn.pbgrd.com/core-oup-new.js';
</script>
<script async="async" src="https://securepubads.g.doubleclick.net/tag/js/gpt.js"></script>
<script>
  /* Command queue stub so calls can be queued before gpt.js has loaded. */
  var googletag = googletag || {};
  googletag.cmd = googletag.cmd || [];
</script>
<script type='text/javascript'>
  /* Ad slot registry, keyed by slot name ("ad1", "ad2", ...). Declared as an array
     in the original and kept that way because other scripts may read this global. */
  var gptAdSlots = [];
  googletag.cmd.push(function() {
    /* Header banner. */
    var mapping_ad1 = googletag.sizeMapping()
      .addSize([1024, 0], [[970, 90], [728, 90]])
      .addSize([768, 0], [728, 90])
      .addSize([0, 0], [320, 50])
      .build();
    gptAdSlots["ad1"] = googletag.defineSlot('/116097782/mbe_Supplement_Ad1', [[970, 90], [728, 90], [320, 50]], 'adBlockHeader')
      .defineSizeMapping(mapping_ad1)
      .addService(googletag.pubads());

    /* Main body, top. */
    var mapping_ad2 = googletag.sizeMapping()
      .addSize([768, 0], [[300, 250], [300, 600], [160, 600]])
      .build();
    gptAdSlots["ad2"] = googletag.defineSlot('/116097782/mbe_Supplement_Ad2', [[300, 250], [160, 600], [300, 600]], 'adBlockMainBodyTop')
      .defineSizeMapping(mapping_ad2)
      .addService(googletag.pubads());

    /* Main body, bottom. */
    var mapping_ad3 = googletag.sizeMapping()
      .addSize([768, 0], [[300, 250], [300, 600], [160, 600]])
      .build();
    gptAdSlots["ad3"] = googletag.defineSlot('/116097782/mbe_Supplement_Ad3', [[300, 250], [160, 600], [300, 600]], 'adBlockMainBodyBottom')
      .defineSizeMapping(mapping_ad3)
      .addService(googletag.pubads());

    /* Footer. */
    var mapping_ad4 = googletag.sizeMapping()
      .addSize([0,0], [320, 50])
      .addSize([768, 0], [728, 90])
      .build();
    gptAdSlots["ad4"] = googletag.defineSlot('/116097782/mbe_Supplement_Ad4', [728, 90], 'adBlockFooter')
      .defineSizeMapping(mapping_ad4)
      .addService(googletag.pubads());

    /* Sticky footer. */
    var mapping_ad6 = googletag.sizeMapping()
      .addSize([1024, 0], [[970, 90], [728, 90]])
      .addSize([768, 0], [728, 90])
      .addSize([0, 0], [320, 50])
      .build();
    gptAdSlots["ad6"] = googletag.defineSlot('/116097782/mbe_Supplement_Ad6', [[728, 90], [970, 90]], 'adBlockStickyFooter')
      .defineSizeMapping(mapping_ad6)
      .addService(googletag.pubads());

    /* Interstitial. defineOutOfPageSlot can return null when the format is not
       supported; chaining .addService on null would throw and skip every listener
       and targeting call below, so the slot is registered only when it exists. */
    var interstitialSlot = googletag.defineOutOfPageSlot('/116097782/mbe_Interstitial_Ad', googletag.enums.OutOfPageFormat.INTERSTITIAL);
    if (interstitialSlot) {
      gptAdSlots["adInterstitial"] = interstitialSlot.addService(googletag.pubads());
    }

    /* Un-hide the wrapper(s) of a slot once it rendered an iframe. */
    googletag.pubads().addEventListener('slotRenderEnded', function (event) {
      if (!event.isEmpty) {
        $('.js-' + event.slot.getSlotElementId()).each(function () {
          if ($(this).find('iframe').length) {
            $(this).removeClass('hide');
          }
        });
      }
    });

    /* Toggle the "Advertisement" caption and start the sticky-footer logic. */
    googletag.pubads().addEventListener('impressionViewable', function (event) {
      /* NOTE(review): isEmpty is documented for slotRenderEnded events; confirm it
         is ever set on impressionViewable events. The check is kept as written. */
      if (!event.isEmpty) {
        $('.js-' + event.slot.getSlotElementId()).each(function () {
          var $adblockDiv = $(this).find('.js-adblock');
          var $adText = $(this).find('.js-adblock-advertisement-text');
          if ($adblockDiv && $adblockDiv.is(':visible') && $adblockDiv.find('*').length > 1) {
            $adText.removeClass('hide');
            App.CenterAdBlock.Init($adblockDiv, $adText);
          } else {
            $adText.addClass('hide');
          }
          /* Initialize logic for Sticky Footer Ad.
             Block comment on purpose: the original line comment was split by a line
             wrap, leaving its tail as live code and breaking the whole script. */
          var $stickyFooterDiv = $(this).parents('.js-sticky-footer-ad');
          if ($stickyFooterDiv && $stickyFooterDiv.is(':visible') && $stickyFooterDiv.find('*').length > 1) {
            App.StickyFooterAd.Init();
          }
        });
      }
    });

    googletag.pubads().setTargeting("jnlspage", "article");
    googletag.pubads().setTargeting("jnlsurl", "mbe/article/38/10/4647/6329644");
    googletag.pubads().enableSingleRequest();
    googletag.pubads().disableInitialLoad();
    googletag.pubads().collapseEmptyDivs();
  });
</script>
<script type="text/javascript">
  googletag.cmd.push(function () {
    googletag.pubads().setTargeting("jnlsdoi", "10.1093/molbev/msab199");
    googletag.enableServices();
  });
</script>
<script type="text/javascript">
  var NTPT_PGEXTRA= 'event_type=full-text&discipline_ot_level_1=Science and Mathematics&discipline_ot_level_2=Biological Sciences&supplier_tag=SC_Journals&object_type=Article&taxonomy=taxId%3a39%7ctaxLabel%3aAcademicSubjects%7cnodeId%3aSCI01180%7cnodeLabel%3aMolecular+and+Cell+Biology%7cnodeLevel%3a3%3btaxId%3a39%7ctaxLabel%3aAcademicSubjects%7cnodeId%3aSCI01130%7cnodeLabel%3aEvolutionary+Biology%7cnodeLevel%3a3&siteid=molbev&authzrequired=false&doi=10.1093/molbev/msab199';
</script>
<script src="https://scholar.google.com/scholar_js/casa.js" async></script>
</head>
<body data-sitename="molecularbiologyandevolution" class="off-canvas pg_Article pg_article " theme-mbe data-sitestyletemplate="Journal" >
<noscript>
  <iframe src="https://www.googletagmanager.com/ns.html?id=GTM-W6DD7HV" title="Google Tag Manager" height="0" width="0" style="display:none;visibility:hidden"></iframe>
</noscript>
<a href="#skipNav" class="skipnav">Skip to Main Content</a>
<!-- Interstitial configuration. Moved out of the head: an input element is not valid
     there and makes the parser end the head early. -->
<input type="hidden" class="hfInterstitial" data-interstitiallinks="mbe/issue,mbe/advance-articles,mbe/advance-article,mbe/supplements,mbe/article,mbe/article-abstract,mbe/pages" data-subdomain="mbe" />
<input id="hdnSiteID" name="hdnSiteID" type="hidden" value="5325" />
<input id="hdnAdDelaySeconds" name="hdnAdDelaySeconds" type="hidden" value="5000" />
<input
id="hdnAdConfigurationTop" name="hdnAdConfigurationTop" type="hidden" value="default" /><input id="hdnAdConfigurationRightRail" name="hdnAdConfigurationRightRail" type="hidden" value="sticky" /> <div class="master-container js-master-container"> <section class="master-header row js-master-header vt-site-page-header"> <div class="widget widget-SitePageHeader widget-instance-SitePageHeader"> <div class="ad-banner js-ad-banner-header"> <div class="widget widget-AdBlock widget-instance-HeaderAd"> <div class="js-adBlock-parent-wrap adblock-parent-wrap"> <div class="adBlockHeader-wrap js-adBlockHeader hide"> <div id="adBlockHeader" class="js-adblock at-adblock" data-lazy-load-margin="150"> <script> googletag.cmd.push(function () { googletag.display('adBlockHeader'); }); </script> </div> <div class="advertisement-text at-adblock js-adblock-advertisement-text hide">Advertisement</div> </div> </div> </div> </div> <div class="oup-header sigma "> <div class="center-inner-row"> <div class="oup-header-logo"> <a href="/"> <img src="//oup.silverchair-cdn.com/UI/app/svg/umbrella/oxford-academic-logo.svg" alt="Oxford Academic" class="oup-header-image at-oup-header-image " /> </a> </div> <div class="widget widget-CustomNavLinks widget-instance-CustomNavLinksDeskTop"> <div class="custom-nav-links-box"> <div class="custom-nav-link"> <a href="/journals">Journals</a> </div> <div class="custom-nav-link"> <a href="/books">Books</a> </div> </div> </div> <ul class="oup-header-menu account-menu sigma-account-menu "> <li class="oup-header-menu-item mobile"> <a href="javascript:;" class="mobile-dropdown-toggle mobile-search-toggle"> <i class="icon-menu_search"><span class="screenreader-text">Search Menu</span></i> </a> </li> <li class="oup-header-menu-item mobile info-icon-menu-item"> <a href="/pages/information" target="_blank" class="at-info-button sigma-info-wrapper" role="button"> <img class="sigma-info-icon" src="//oup.silverchair-cdn.com/UI/app/svg/i.svg" alt="Information" /> </a> </li> 
<li class="oup-header-menu-item mobile account-icon-menu-item"> <a href="javascript:;" class="account-button js-account-button at-account-button " role="button" data-turnawayparams="journal%3dmbe"> <img class="sigma-account-icon" src="//oup.silverchair-cdn.com/UI/app/svg/account.svg" alt="Account" /> </a> </li> <li class="oup-header-menu-item mobile"> <a href="javascript:;" class="mobile-dropdown-toggle mobile-nav-toggle"> <i class="icon-menu_hamburger"><span class="screenreader-text">Menu</span></i> </a> </li> <li class="oup-header-menu-item desktop info-icon-menu-item"> <a href="/pages/information" target="_blank" class="at-info-button sigma-info-wrapper" role="button"> <img class="sigma-info-icon" src="//oup.silverchair-cdn.com/UI/app/svg/i.svg" alt="Information" /> </a> </li> <li class="oup-header-menu-item desktop account-icon-menu-item"> <a href="javascript:;" class="account-button js-account-button at-account-button sigma-logo-wrapper" role="button" data-turnawayparams="journal%3dmbe"> <img class="sigma-account-icon" src="//oup.silverchair-cdn.com/UI/app/svg/account.svg" alt="Account" /> </a> </li> <li class="oup-header-menu-item desktop account-icon-menu-item"> <div class="widget widget-SeamlessAccess widget-instance-SitePageHeader"> <a href="javascript:;" class="js-shibboleth-action seamless-access-button seamless-button-header button-call-to-action at-institutional-sign-in" rel="nofollow" data-action-type="" data-entity-id=""> <span class="seamless-access-text">Sign in through your institution</span> </a> </div> </li> </ul> <div class="login-box-placeholder js-login-box-placeholder hide"> <div class="spinner"></div> </div> </div> </div> <div class="dropdown-panel-wrap"> <div class="dropdown-panel mobile-search-dropdown"> <div class="mobile-search-inner-wrap"> <div class="navbar-search"> <div class="mobile-microsite-search"> <label for="SitePageHeader-mobile-navbar-search-filter" class="screenreader-text js-mobile-navbar-search-filter-label"> Navbar Search 
Filter </label> <select class="mobile-navbar-search-filter js-mobile-navbar-search-filter at-navbar-search-filter" id="SitePageHeader-mobile-navbar-search-filter"> <option class="navbar-search-filter-option at-navbar-search-filter-option" value="">Molecular Biology and Evolution</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Issue">This issue</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Parent">Society for Molecular Biology and Evolution Journals</option> <optgroup class="navbar-search-optgroup" label="Search across Oxford Academic"> <option class="navbar-search-filter-option at-navbar-search-filter-option" value="AcademicSubjects/SCI01130">Evolutionary Biology</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="AcademicSubjects/SCI01180">Molecular and Cell Biology</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Books">Books</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Journals">Journals</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Umbrella">Oxford Academic</option> </optgroup> </select> <label for="SitePageHeader-mobile-microsite-search-term" class="screenreader-text js-mobile-microsite-search-term-label"> Mobile Enter search term </label> <input class="mobile-search-input mobile-microsite-search-term js-mobile-microsite-search-term at-microsite-search-term" type="text" maxlength="255" placeholder="Search" id="SitePageHeader-mobile-microsite-search-term"> <a href="javascript:;" class="mobile-microsite-search-icon mobile-search-submit icon-menu_search"> <span class="screenreader-text">Search</span> </a> </div> </div> </div> </div> <div class="dropdown-panel mobile-nav-dropdown"> <ul class="site-menu site-menu-lvl-0 at-site-menu"> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" 
id="site-menu-item-1709066"> <a href="/mbe/issue" class="nav-link"> Issues </a> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709063"> <a href="javascript:;" class="nav-link js-nav-dropdown at-nav-dropdown" role="button" aria-expanded="false"> More content <i class="desktop-nav-arrow icon-general-arrow-filled-down arrow-icon"></i> </a> <i class="mobile-nav-arrow icon-general_arrow-down"></i> <ul class="site-menu site-menu-lvl-1 at-site-menu"> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709067"> <a href="/mbe/advance-articles" class="nav-link"> Advance Articles </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709068"> <a href="https://academic.oup.com/mbe/pages/virtual-issues" class="nav-link"> Virtual Issues </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709069"> <a href="https://academic.oup.com/mbe/pages/highly_cited" class="nav-link"> High-Impact Research Collection </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709070"> <a href="https://academic.oup.com/smbejournals/pages/40th-anniversary" class="nav-link"> Celebrate 40 years of MBE </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709071"> <a href="https://academic.oup.com/mbe/search-results?allJournals=1&f_TocHeadingTitleList=Perspective&fl_SiteID=5325&page=1&sort=Date+%e2%80%93+Newest+First" class="nav-link"> Perspectives </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709072"> <a href="https://academic.oup.com/mbe/search-results?sort=Date+%e2%80%93+Newest+First&allJournals=1&f_TocHeadingTitleList=Discoveries&fl_SiteID=5325&page=1" class="nav-link"> Discoveries </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709073"> <a 
href="https://academic.oup.com/mbe/search-results?sort=Date+%e2%80%93+Newest+First&allJournals=1&f_TocHeadingTitleList=METHODS&fl_SiteID=5325&page=1" class="nav-link"> Methods </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709074"> <a href="https://academic.oup.com/mbe/search-results?sort=Date+%e2%80%93+Newest+First&allJournals=1&f_TocHeadingTitleList=Resources&fl_SiteID=5325&page=1" class="nav-link"> Resources </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709075"> <a href="https://academic.oup.com/mbe/search-results?sort=Date+%e2%80%93+Newest+First&f_TocHeadingTitleList=PROTOCOLSANDProtocol&fl_SiteID=5325&page=1" class="nav-link"> Protocols </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709076"> <a href="https://academic.oup.com/mbe/search-results?f_TocHeadingTitleList=HighlightsANDNews&fl_SiteID=5325&page=1" class="nav-link"> Highlights </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709077"> <a href="https://academic.oup.com/mbe/issue-covers" class="nav-link"> Cover Archive </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709078"> <a href="https://academic.oup.com/mbe/search-results?f_TocHeadingTitleList=Brief+CommunicationsANDLetter&fl_SiteID=5325&page=1" class="nav-link"> Brief Communications </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709079"> <a href="https://academic.oup.com/mbe/search-results?f_TocHeadingTitleList=Review" class="nav-link"> Reviews </a> </li> </ul> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709064"> <a href="javascript:;" class="nav-link js-nav-dropdown at-nav-dropdown" role="button" aria-expanded="false"> Submit <i class="desktop-nav-arrow icon-general-arrow-filled-down arrow-icon"></i> </a> <i class="mobile-nav-arrow 
icon-general_arrow-down"></i> <ul class="site-menu site-menu-lvl-1 at-site-menu"> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709080"> <a href="http://mc.manuscriptcentral.com/mbe" class="nav-link"> Submission site </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709081"> <a href="https://academic.oup.com/mbe/pages/author-guidelines" class="nav-link"> Author guidelines </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709082"> <a href="https://academic.oup.com/mbe/pages/Open_Access" class="nav-link"> Open access </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709083"> <a href="https://academic.oup.com/journals/pages/self_archiving_policy_c" class="nav-link"> Self-archiving policy </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709084"> <a href="https://academic.oup.com/mbe/pages/why-publish" class="nav-link"> Reasons to submit </a> </li> </ul> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709085"> <a href="https://academic.oup.com/journals/pages/help/journal_alerts" class="nav-link"> Alerts </a> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709065"> <a href="javascript:;" class="nav-link js-nav-dropdown at-nav-dropdown" role="button" aria-expanded="false"> About <i class="desktop-nav-arrow icon-general-arrow-filled-down arrow-icon"></i> </a> <i class="mobile-nav-arrow icon-general_arrow-down"></i> <ul class="site-menu site-menu-lvl-1 at-site-menu"> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709086"> <a href="/mbe/pages/About" class="nav-link"> About Molecular Biology and Evolution </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709087"> <a href="http://www.smbe.org/smbe/" class="nav-link"> About 
the Society for Molecular Biology and Evolution </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709088"> <a href="/mbe/pages/Editorial_Board" class="nav-link"> Editorial Board </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709089"> <a href="https://academic.oup.com/advertising-and-corporate-services/pages/mbe-media-kit" class="nav-link"> Advertising and Corporate Services </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709090"> <a href="http://medicine-and-health-careernetwork.oxfordjournals.org" class="nav-link"> Journals Career Network </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709091"> <a href="http://www.smbe.org/smbe/" class="nav-link"> Contact Us </a> </li> </ul> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-custom"> <a href="/journals" class="nav-link">Journals on Oxford Academic</a> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-custom"> <a href="/books" class="nav-link">Books on Oxford Academic</a> </li> </ul> </div> </div> <div class="journal-header journal-bg"> <div class="center-inner-row"> <div class="site-parent-link-wrap"> <a href="//academic.oup.com/smbejournals" class="site-parent-link">Society for Molecular Biology and Evolution Journals</a> </div> <a href="/mbe" class="journal-logo-container"> <img id="logo-MolecularBiologyandEvolution" class="journal-logo" src="//oup.silverchair-cdn.com/data/SiteBuilderAssets/Live/Images/mbe/mbe_title188616415.svg" alt="Molecular Biology and Evolution" /> </a> <div class="society-logo-block"> <div class="society-block-inner-wrap"> <a href="http://www.smbe.org/smbe/" target="" class="society-logo-container"> <img id="logo-SocietyforMolecularBiologyandEvolution" class="society-logo" 
src="//oup.silverchair-cdn.com/data/SiteBuilderAssets/Live/Images/mbe/mbe_h1-1277340080.svg" alt="Society for Molecular Biology and Evolution" /> </a> </div> </div> </div> </div> <div class="navbar"> <div class="center-inner-row"> <nav class="navbar-menu"> <ul class="site-menu site-menu-lvl-0 at-site-menu"> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709066"> <a href="/mbe/issue" class="nav-link"> Issues </a> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709063"> <a href="javascript:;" class="nav-link js-nav-dropdown at-nav-dropdown" role="button" aria-expanded="false"> More content <i class="desktop-nav-arrow icon-general-arrow-filled-down arrow-icon"></i> </a> <i class="mobile-nav-arrow icon-general_arrow-down"></i> <ul class="site-menu site-menu-lvl-1 at-site-menu"> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709067"> <a href="/mbe/advance-articles" class="nav-link"> Advance Articles </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709068"> <a href="https://academic.oup.com/mbe/pages/virtual-issues" class="nav-link"> Virtual Issues </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709069"> <a href="https://academic.oup.com/mbe/pages/highly_cited" class="nav-link"> High-Impact Research Collection </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709070"> <a href="https://academic.oup.com/smbejournals/pages/40th-anniversary" class="nav-link"> Celebrate 40 years of MBE </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709071"> <a href="https://academic.oup.com/mbe/search-results?allJournals=1&f_TocHeadingTitleList=Perspective&fl_SiteID=5325&page=1&sort=Date+%e2%80%93+Newest+First" class="nav-link"> Perspectives </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" 
id="site-menu-item-1709072"> <a href="https://academic.oup.com/mbe/search-results?sort=Date+%e2%80%93+Newest+First&allJournals=1&f_TocHeadingTitleList=Discoveries&fl_SiteID=5325&page=1" class="nav-link"> Discoveries </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709073"> <a href="https://academic.oup.com/mbe/search-results?sort=Date+%e2%80%93+Newest+First&allJournals=1&f_TocHeadingTitleList=METHODS&fl_SiteID=5325&page=1" class="nav-link"> Methods </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709074"> <a href="https://academic.oup.com/mbe/search-results?sort=Date+%e2%80%93+Newest+First&allJournals=1&f_TocHeadingTitleList=Resources&fl_SiteID=5325&page=1" class="nav-link"> Resources </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709075"> <a href="https://academic.oup.com/mbe/search-results?sort=Date+%e2%80%93+Newest+First&f_TocHeadingTitleList=PROTOCOLSANDProtocol&fl_SiteID=5325&page=1" class="nav-link"> Protocols </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709076"> <a href="https://academic.oup.com/mbe/search-results?f_TocHeadingTitleList=HighlightsANDNews&fl_SiteID=5325&page=1" class="nav-link"> Highlights </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709077"> <a href="https://academic.oup.com/mbe/issue-covers" class="nav-link"> Cover Archive </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709078"> <a href="https://academic.oup.com/mbe/search-results?f_TocHeadingTitleList=Brief+CommunicationsANDLetter&fl_SiteID=5325&page=1" class="nav-link"> Brief Communications </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709079"> <a href="https://academic.oup.com/mbe/search-results?f_TocHeadingTitleList=Review" class="nav-link"> Reviews </a> </li> </ul> </li> <li 
class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709064"> <a href="javascript:;" class="nav-link js-nav-dropdown at-nav-dropdown" role="button" aria-expanded="false"> Submit <i class="desktop-nav-arrow icon-general-arrow-filled-down arrow-icon"></i> </a> <i class="mobile-nav-arrow icon-general_arrow-down"></i> <ul class="site-menu site-menu-lvl-1 at-site-menu"> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709080"> <a href="http://mc.manuscriptcentral.com/mbe" class="nav-link"> Submission site </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709081"> <a href="https://academic.oup.com/mbe/pages/author-guidelines" class="nav-link"> Author guidelines </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709082"> <a href="https://academic.oup.com/mbe/pages/Open_Access" class="nav-link"> Open access </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709083"> <a href="https://academic.oup.com/journals/pages/self_archiving_policy_c" class="nav-link"> Self-archiving policy </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709084"> <a href="https://academic.oup.com/mbe/pages/why-publish" class="nav-link"> Reasons to submit </a> </li> </ul> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709085"> <a href="https://academic.oup.com/journals/pages/help/journal_alerts" class="nav-link"> Alerts </a> </li> <li class="site-menu-item site-menu-lvl-0 at-site-menu-item" id="site-menu-item-1709065"> <a href="javascript:;" class="nav-link js-nav-dropdown at-nav-dropdown" role="button" aria-expanded="false"> About <i class="desktop-nav-arrow icon-general-arrow-filled-down arrow-icon"></i> </a> <i class="mobile-nav-arrow icon-general_arrow-down"></i> <ul class="site-menu site-menu-lvl-1 at-site-menu"> <li class="site-menu-item 
site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709086"> <a href="/mbe/pages/About" class="nav-link"> About Molecular Biology and Evolution </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709087"> <a href="http://www.smbe.org/smbe/" class="nav-link"> About the Society for Molecular Biology and Evolution </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709088"> <a href="/mbe/pages/Editorial_Board" class="nav-link"> Editorial Board </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709089"> <a href="https://academic.oup.com/advertising-and-corporate-services/pages/mbe-media-kit" class="nav-link"> Advertising and Corporate Services </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709090"> <a href="http://medicine-and-health-careernetwork.oxfordjournals.org" class="nav-link"> Journals Career Network </a> </li> <li class="site-menu-item site-menu-lvl-1 at-site-menu-item" id="site-menu-item-1709091"> <a href="http://www.smbe.org/smbe/" class="nav-link"> Contact Us </a> </li> </ul> </li> </ul> </nav> <div class="navbar-search-container js-navbar-search-container"> <a href="javascript:;" class="navbar-search-close js_close-navsearch">Close</a> <div class="navbar-search"> <div class="microsite-search"> <label for="SitePageHeader-navbar-search-filter" class="screenreader-text js-navbar-search-filter-label"> Navbar Search Filter </label> <select class="navbar-search-filter js-navbar-search-filter at-navbar-search-filter" id="SitePageHeader-navbar-search-filter"> <option class="navbar-search-filter-option at-navbar-search-filter-option" value="">Molecular Biology and Evolution</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Issue">This issue</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Parent">Society for Molecular 
Biology and Evolution Journals</option> <optgroup class="navbar-search-optgroup" label="Search across Oxford Academic"> <option class="navbar-search-filter-option at-navbar-search-filter-option" value="AcademicSubjects/SCI01130">Evolutionary Biology</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="AcademicSubjects/SCI01180">Molecular and Cell Biology</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Books">Books</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Journals">Journals</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Umbrella">Oxford Academic</option> </optgroup> </select> <label for="SitePageHeader-microsite-search-term" class="screenreader-text js-microsite-search-term-label"> Enter search term </label> <input class="navbar-search-input microsite-search-term js-microsite-search-term at-microsite-search-term" type="text" maxlength="255" placeholder="Search" id="SitePageHeader-microsite-search-term"> <a href="javascript:;" class="microsite-search-icon navbar-search-submit icon-menu_search"> <span class="screenreader-text">Search</span> </a> </div> </div> <input id="hfCurrentBookSearch" name="hfCurrentBookSearch" type="hidden" value="" /><input id="hfCurrentBookScope" name="hfCurrentBookScope" type="hidden" value="CurrentBook" /><input id="hfBookSiteScope" name="hfBookSiteScope" type="hidden" value="Books" /><input id="hfSeriesScope" name="hfSeriesScope" type="hidden" value="taxWithOr" /><input id="hfParentSiteName" name="hfParentSiteName" type="hidden" value="Society for Molecular Biology and Evolution Journals" /><input id="hfParentSiteUrl" name="hfParentSiteUrl" type="hidden" value="academic.oup.com/smbejournals" /><input id="hfSiteID" name="hfSiteID" type="hidden" value="5325" /><input id="hfParentSiteID" name="hfParentSiteID" type="hidden" value="6612" /><input id="hfJournalSiteScope" 
name="hfJournalSiteScope" type="hidden" value="Journals" /><input id="hfParentSiteScope" name="hfParentSiteScope" type="hidden" value="Parent" /><input id="hfDefaultSearchURL" name="hfDefaultSearchURL" type="hidden" value="search-results?page=1&q=" /><input id="hfIssueSearch" name="hfIssueSearch" type="hidden" value="&fl_IssueID=131323" /><input id="hfIssueSiteScope" name="hfIssueSiteScope" type="hidden" value="Issue" /><input id="hfUmbrellaScope" name="hfUmbrellaScope" type="hidden" value="Umbrella" /><input id="hfUmbrellaSiteUrl" name="hfUmbrellaSiteUrl" type="hidden" value="academic.oup.com" /><input id="hfUmbrellaSiteId" name="hfUmbrellaSiteId" type="hidden" value="191" /><input id="hfDefaultAdvancedSearchUrl" name="hfDefaultAdvancedSearchUrl" type="hidden" value="advanced-search?page=1&q=" /><input id="hfTaggedCollectionScope" name="hfTaggedCollectionScope" type="hidden" value="" /> <div class="navbar-search-advanced"><a href="/mbe/advanced-search" class="advanced-search js-advanced-search">Advanced Search</a></div> </div> <div class="navbar-search-collapsed"><a href="javascript:;" class="icon-menu_search js_expand-navsearch"><span class="screenreader-text">Search Menu</span></a></div> </div> </div> <input type="hidden" name="searchScope" id="hfSolrJournalID" value="" /> <input type="hidden" id="hfSolrJournalName" value="" /> <input type="hidden" id="hfSolrMaxAllowSearchChar" value="100" /> <input type="hidden" id="hfJournalShortName" value="" /> <input type="hidden" id="hfSearchPlaceholder" value="" /> <input type="hidden" name="hfGlobalSearchSiteURL" id="hfGlobalSearchSiteURL" value="" /> <input type="hidden" name="hfSearchSiteURL" id="hfSiteURL" value="academic.oup.com/mbe" /> <input type="hidden" name="RedirectSiteUrl" id="RedirectSiteUrl" value="httpszazjzjacademiczwoupzwcom" />
<script type="text/javascript">
  // Re-point the hidden #hfSiteURL field at the host the page is actually
  // being served from: the server-rendered host is dropped and replaced with
  // location.host, while everything from the first "/" onwards (the site
  // path, e.g. "/mbe") is kept. If the stored value has no "/", the field
  // ends up holding just location.host.
  (function () {
    var siteUrlField = document.getElementById('hfSiteURL');
    var configuredUrl = siteUrlField.value;
    // Index of the first "/", i.e. where the path part begins (-1 if none).
    var pathStart = configuredUrl.indexOf('/');
    var sitePath = pathStart >= 0 ? configuredUrl.substring(pathStart) : '';
    siteUrlField.value = location.host + sitePath;
  })();
</script>
<input id="routename" name="RouteName" type="hidden" value="mbe" /> </div> </section> <div class="widget widget-SitewideBanner widget-instance-"> </div> <div id="main" class="content-main js-main ui-base"> <section class="master-main row"> <div class="center-inner-row no-overflow"> <div id="skipNav" tabindex="-1"></div> <div class="page-column-wrap"> <div id="InfoColumn" class="page-column page-column--left js-left-nav-col">
<!-- The two left-column toggle buttons carry an explicit type="button" so they can never act as a submit button if this markup is rendered inside a form (a bare <button> defaults to type="submit"). -->
<div class="mobile-content-topbar hide"> <button type="button" class="toggle-left-col toggle-left-col__article">Article Navigation</button> </div> <div class="info-inner-wrap js-left-nav"> <button type="button" class="toggle-left-col__close btn-as-icon icon-general-close"> <span class="screenreader-text">Close mobile search navigation</span> </button> <div class="responsive-nav-title">Article Navigation</div> <div class="info-widget-wrap"> <div class="widget widget-IssueInfo widget-instance-OUP_IssueInfo_Article"> <div id="issueInfo-OUP_IssueInfo_Article" class="article-info-wrap clearfix"> <i class="icon-general-close mobile-nav-btn nav-open"></i> <a class="article-issue-link" href="/mbe/issue/38/10"> <div class="article-issue-img"> <img id="issueImage" class="fb-featured-image" src="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/Issue/38/10/2/m_molbiolevol_38_10cover.jpeg?Expires=1735516585&Signature=ZBQP3IkC1dXKTXePuBRwJNhakBZ67wLMjpoRVxR1VvO9~fzeOsVt3ccBtfspWmCUgl7gkEkab9iru1UbVwbtGCIijmxIeXc-ak4rIE5kIVB4mIGi2Brzvvml9Rjw9z578cDQfE945I3trZHJR8SJKLzGrYBz9TMxRQgTM69ATDlqBhJiaGNa6YkG0PnA-y7em22QTupLt4Qwgc9rUP~7T8j2ZFBRRMJ4D4aPqL~D4-Zi46nnEygD~cYSczHASDM4I3C9NiP6yV9c2km0Iq8U~hPGI8NyY2yBdHbcZL0eVFmiJSNGxSU3ACquJJuYLXoq2WumSBDj9GKqf~41hJTqLQ__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA" alt="Issue Cover" /> </div> <div class="article-issue-info"> <div class="volume-issue__wrap"> <div class="volume trailing-comma">Volume 38</div> <div
class="issue">Issue 10</div> </div> <div class="ii-pub-date"> October 2021 </div> </div> </a> </div> </div> <div class="content-nav"> <div class="widget widget-ArticleJumpLinks widget-instance-OUP_ArticleJumpLinks_Widget"> <h3 class="contents-title" >Article Contents</h3> <ul class="jumplink-list js-jumplink-list"> <li class="section-jump-link head-1" link-destination="304110801"> <div class="section-jump-link__link-wrap"> <a class="js-jumplink scrollTo" href="#304110801">Abstract</a> </div> </li> <li class="section-jump-link head-1" link-destination="304110805"> <div class="section-jump-link__link-wrap"> <a class="js-jumplink scrollTo" href="#304110805">New Approaches</a> </div> </li> <li class="section-jump-link head-1" link-destination="304110807"> <div class="section-jump-link__link-wrap"> <a class="js-jumplink scrollTo" href="#304110807">Results and Discussion</a> </div> </li> <li class="section-jump-link head-1" link-destination="304110832"> <div class="section-jump-link__link-wrap"> <a class="js-jumplink scrollTo" href="#304110832">Materials and Methods</a> </div> </li> <li class="section-jump-link head-1" link-destination="304110834"> <div class="section-jump-link__link-wrap"> <a class="js-jumplink scrollTo" href="#304110834">Supplementary Material</a> </div> </li> <li class="section-jump-link head-1" link-destination="304110836"> <div class="section-jump-link__link-wrap"> <a class="js-jumplink scrollTo" href="#304110836">Acknowledgments</a> </div> </li> <li class="section-jump-link head-1 backReferenceLink" link-destination="304110840"> <div class="section-jump-link__link-wrap"> <a class="js-jumplink scrollTo" href="#304110840">References</a> </div> </li> </ul> </div> </div>
<!-- Previous/next article links. The arrow glyphs in the link text are written as &lt; and &gt; so the literal angle brackets are never parsed as the start or end of a tag. -->
<div class="widget widget-ArticleNavLinks widget-instance-OUP_ArticleNavLinks_Article"> <ul class="inline-list"> <li class="prev arrow"> <a href="/mbe/article/38/10/4634/6297222">&lt; Previous</a> </li> <li class="next arrow"> <a href="/mbe/article/38/10/4655/6355927">Next &gt;</a> </li> 
</ul> </div> </div> </div> </div> <div class="sticky-toolbar js-sticky-toolbar"></div> <div id="ContentColumn" class="page-column page-column--center">
<!-- Both "Article Navigation" toggles below carry an explicit type="button", matching the author-name buttons further down, so they can never act as a submit button if this markup is rendered inside a form. -->
<div class="article-browse-top article-browse-mobile-nav js-mobile-nav"> <div class="article-browse-mobile-nav-inner js-mobile-nav-inner"> <button type="button" class="toggle-left-col toggle-left-col__article btn-as-link"> Article Navigation </button> </div> </div> <div class="article-browse-top article-browse-mobile-nav mobile-sticky-toolbar js-mobile-nav-sticky"> <div class="article-browse-mobile-nav-inner"> <button type="button" class="toggle-left-col toggle-left-col__article btn-as-link"> Article Navigation </button> </div> </div> <div class="content-inner-wrap"> <div class="widget widget-ArticleTopInfo widget-instance-OUP_ArticleTop_Info_Widget"> <div class="module-widget article-top-widget"> <div class="access-state-logos all-viewports"> <span class="journal-info__format-label">Journal Article</span> </div> <div class="widget-items"> <div class="title-wrap"> <h1 class="wi-article-title article-title-main accessible-content-title at-articleTitle"> BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes <i class='icon-availability_open' title='Open Access' ></i> </h1> </div> <div class="wi-authors at-ArticleAuthors"> <div class="al-authors-list"> <span class="al-author-name-more js-flyout-wrap"> <button type="button" class="linked-name js-linked-name-trigger btn-as-link">Mosè Manni</button><span class='delimiter'>, </span> <span class="al-author-info-wrap arrow-up"> <div class="info-card-author authorInfo_OUP_ArticleTop_Info_Widget"> <div class="name-role-wrap"> <div class="info-card-name"> Mosè Manni </div> </div> <div class="info-card-affilitation"> <div class="aff"><div class="institution">Department of Genetic Medicine and Development, University of Geneva</div>, Geneva, <div class="country">Switzerland</div></div><div class="aff"><div 
class="institution">Swiss Institute of Bioinformatics</div>, Geneva, <div class="country">Switzerland</div></div> </div> <div class="info-card-location"> <a id="contrib-orcid-0000-0002-4146-6523" href="https://orcid.org/0000-0002-4146-6523"> <img class="orchid-icon" alt="ORCID logo" aria-hidden="true" src="//oup.silverchair-cdn.com/Themes/Silver/app/img/mini-icon.png"/> https://orcid.org/0000-0002-4146-6523 </a> </div> <div class="info-card-search-label"> Search for other works by this author on: </div> <div class="info-card-search info-card-search-internal"> <a href="/mbe/search-results?f_Authors=Mos%c3%a8+Manni" rel="nofollow">Oxford Academic</a> </div> <div class="info-card-search info-card-search-pubmed"> <a href="http://www.ncbi.nlm.nih.gov/pubmed?cmd=search&term=Manni M">PubMed</a> </div> <div class="info-card-search info-card-search-google"> <a href="http://scholar.google.com/scholar?q=author:%22Manni Mosè%22">Google Scholar</a> </div> </div> </span> </span> <span class="al-author-name-more js-flyout-wrap"> <button type="button" class="linked-name js-linked-name-trigger btn-as-link">Matthew R Berkeley</button><span class='delimiter'>, </span> <span class="al-author-info-wrap arrow-up"> <div class="info-card-author authorInfo_OUP_ArticleTop_Info_Widget"> <div class="name-role-wrap"> <div class="info-card-name"> Matthew R Berkeley </div> </div> <div class="info-card-affilitation"> <div class="aff"><div class="institution">Department of Genetic Medicine and Development, University of Geneva</div>, Geneva, <div class="country">Switzerland</div></div><div class="aff"><div class="institution">Swiss Institute of Bioinformatics</div>, Geneva, <div class="country">Switzerland</div></div> </div> <div class="info-card-search-label"> Search for other works by this author on: </div> <div class="info-card-search info-card-search-internal"> <a href="/mbe/search-results?f_Authors=Matthew+R+Berkeley" rel="nofollow">Oxford Academic</a> </div> <div class="info-card-search 
info-card-search-pubmed"> <a href="http://www.ncbi.nlm.nih.gov/pubmed?cmd=search&term=Berkeley M">PubMed</a> </div> <div class="info-card-search info-card-search-google"> <a href="http://scholar.google.com/scholar?q=author:%22Berkeley Matthew R%22">Google Scholar</a> </div> </div> </span> </span> <span class="al-author-name-more js-flyout-wrap"> <button type="button" class="linked-name js-linked-name-trigger btn-as-link">Mathieu Seppey</button><span class='delimiter'>, </span> <span class="al-author-info-wrap arrow-up"> <div class="info-card-author authorInfo_OUP_ArticleTop_Info_Widget"> <div class="name-role-wrap"> <div class="info-card-name"> Mathieu Seppey </div> </div> <div class="info-card-affilitation"> <div class="aff"><div class="institution">Department of Genetic Medicine and Development, University of Geneva</div>, Geneva, <div class="country">Switzerland</div></div><div class="aff"><div class="institution">Swiss Institute of Bioinformatics</div>, Geneva, <div class="country">Switzerland</div></div> </div> <div class="info-card-search-label"> Search for other works by this author on: </div> <div class="info-card-search info-card-search-internal"> <a href="/mbe/search-results?f_Authors=Mathieu+Seppey" rel="nofollow">Oxford Academic</a> </div> <div class="info-card-search info-card-search-pubmed"> <a href="http://www.ncbi.nlm.nih.gov/pubmed?cmd=search&term=Seppey M">PubMed</a> </div> <div class="info-card-search info-card-search-google"> <a href="http://scholar.google.com/scholar?q=author:%22Seppey Mathieu%22">Google Scholar</a> </div> </div> </span> </span> <span class="al-author-name-more js-flyout-wrap"> <button type="button" class="linked-name js-linked-name-trigger btn-as-link">Felipe A Simão</button><span class='delimiter'>, </span> <span class="al-author-info-wrap arrow-up"> <div class="info-card-author authorInfo_OUP_ArticleTop_Info_Widget"> <div class="name-role-wrap"> <div class="info-card-name"> Felipe A Simão </div> </div> <div 
class="info-card-affilitation"> <div class="aff"><div class="institution">Department of Genetic Medicine and Development, University of Geneva</div>, Geneva, <div class="country">Switzerland</div></div><div class="aff"><div class="institution">Swiss Institute of Bioinformatics</div>, Geneva, <div class="country">Switzerland</div></div> </div> <div class="info-card-search-label"> Search for other works by this author on: </div> <div class="info-card-search info-card-search-internal"> <a href="/mbe/search-results?f_Authors=Felipe+A+Sim%c3%a3o" rel="nofollow">Oxford Academic</a> </div> <div class="info-card-search info-card-search-pubmed"> <a href="http://www.ncbi.nlm.nih.gov/pubmed?cmd=search&term=Simão F">PubMed</a> </div> <div class="info-card-search info-card-search-google"> <a href="http://scholar.google.com/scholar?q=author:%22Simão Felipe A%22">Google Scholar</a> </div> </div> </span> </span> <span class="al-author-name-more js-flyout-wrap"> <button type="button" class="linked-name js-linked-name-trigger btn-as-link">Evgeny M Zdobnov</button><span class='delimiter'></span> <span class="al-author-info-wrap arrow-up"> <div class="info-card-author authorInfo_OUP_ArticleTop_Info_Widget"> <div class="name-role-wrap"> <div class="info-card-name"> Evgeny M Zdobnov <span class="info-card-footnote"><span class="xrefLink" id="jumplink-msab199-cor1"></span><a href="javascript:;" reveal-id="msab199-cor1" data-open="msab199-cor1" class="link link-ref link-reveal xref-default"><!----></a></span> </div> </div> <div class="info-card-affilitation"> <div class="aff"><div class="institution">Department of Genetic Medicine and Development, University of Geneva</div>, Geneva, <div class="country">Switzerland</div></div><div class="aff"><div class="institution">Swiss Institute of Bioinformatics</div>, Geneva, <div class="country">Switzerland</div></div> </div> <div class="info-author-correspondence"> <div content-id="msab199-cor1"><strong>Corresponding author:</strong> E-mail: <a 
href="mailto:evgeny.zdobnov@unige.ch" target="_blank">evgeny.zdobnov@unige.ch</a>.</div> </div> <div class="info-card-search-label"> Search for other works by this author on: </div> <div class="info-card-search info-card-search-internal"> <a href="/mbe/search-results?f_Authors=Evgeny+M+Zdobnov" rel="nofollow">Oxford Academic</a> </div> <div class="info-card-search info-card-search-pubmed"> <a href="http://www.ncbi.nlm.nih.gov/pubmed?cmd=search&term=Zdobnov E">PubMed</a> </div> <div class="info-card-search info-card-search-google"> <a href="http://scholar.google.com/scholar?q=author:%22Zdobnov Evgeny M%22">Google Scholar</a> </div> </div> </span> </span> <div class="al-author-name al-author-footnotes"> <div class="al-author-info-wrap arrow-up"> <div class="widget widget-SingleSection widget-instance-OUP_FootnoteSection"> <div content-id="msab199-FM1" class="footnote"><span class="fn"><div class="footnote-content"><p class="footnote-compatibility">Mosè Manni, Matthew R Berkeley and Mathieu Seppey authors contributed equally to this work.</p></div></span></div> </div> </div> <a class="js-linked-footnotes" href="javascript:;">Author Notes</a> </div> </div> </div> <div class="pub-history-wrap clearfix js-history-dropdown-wrap"> <div class="pub-history-row clearfix"> <div class="ww-citation-primary"><em>Molecular Biology and Evolution</em>, Volume 38, Issue 10, October 2021, Pages 4647–4654, <a href='https://doi.org/10.1093/molbev/msab199'>https://doi.org/10.1093/molbev/msab199</a></div> </div> <div class="pub-history-row clearfix"> <div class="ww-citation-date-wrap"> <div class="citation-label">Published:</div> <div class="citation-date">28 July 2021</div> </div> </div> </div> </div> </div>
<script>
  /* Article-top widget behaviour, wired up once the DOM is ready.
     Only block comments are used here: this page's markup is whitespace-collapsed onto
     long lines, where a line comment would swallow every statement that follows it. */
  $(document).ready(function () {
    /* Expand/collapse: swap the add/minus icon inside the clicked trigger and
       toggle the "hide" class on its sibling content panel. */
    $('.article-top-widget').on('click', '.ati-toggle-trigger', function () {
      $(this).find('.icon-general-add, .icon-minus').toggleClass('icon-minus icon-general-add');
      $(this).siblings('.ati-toggle-content').toggleClass('hide');
    });

    /* In Chrome, an anchor tag with target="_blank" and a "mailto:" href opens a new
       tab/window as well as the email client. I suspect this behavior will be corrected
       in the future. Remove the target="_blank". */
    $('ul.wi-affiliationList').find('a[href^="mailto:"]').removeAttr('target');
  });
</script> </div> <div class="widget widget-ArticleLinks widget-instance-OUP_Article_Links_Widget"> </div> <div class="article-body js-content-body"> <div class="toolbar-wrap js-toolbar-wrap"> <div class="toolbar-inner-wrap"> <ul id="Toolbar" role="navigation"> <li class="toolbar-item item-pdf js-item-pdf "> <a class="al-link pdf article-pdfLink" data-article-id="6329644" href="/mbe/article-pdf/38/10/4647/40449445/msab199.pdf"> <img src=//oup.silverchair-cdn.com/UI/app/svg/pdf.svg alt="pdf" /><span class="pdf-link-text">PDF</span> </a> </li> <li class="toolbar-item item-link item-split-view"> <a href="javascript:;" class="split-view js-split-view st-split-view at-split-view" target=""> <i class="icon-menu-split"></i> Split View </a> </li> <li class="toolbar-item item-with-dropdown item-views"> <a class="at-views-dropdown drop-trigger" href="javascript:;" data-dropdown="FilterDrop" aria-haspopup="true"> <i class="icon-menu_views"></i> <div class="toolbar-label"> <div class="toolbar-text">Views</div> <i class="icon-general-arrow-filled-down arrow-icon"></i> </div> </a> <ul id="ViewsDrop" class="f-dropdown js-dropdown-content" data-dropdown-content aria-label="submenu"> <div class="arrow-up"></div> <li class="article-content-filter js-article-content-filter" data-content-filter="article-content"> <a href="javascript:;"><span>Article contents</span></a> </li> <li class="at-figures-tables article-content-filter js-article-content-filter" data-content-filter="figures-tables"> <a href="javascript:;"><span>Figures & tables</span></a> </li> <li class="article-content-filter js-article-content-filter" data-content-filter="video"> <a href="javascript:;"><span>Video</span></a>
</li> <li class="article-content-filter js-article-content-filter" data-content-filter="audio"> <a href="javascript:;"><span>Audio</span></a> </li> <li class="article-content-filter js-article-content-filter" data-content-filter="supplementary-data"> <a href="javascript:;"><span>Supplementary Data</span></a> </li> </ul> </li> <li class="toolbar-item item-cite js-item-cite"> <div class="widget widget-ToolboxGetCitation widget-instance-OUP_Get_Citation"> <a href="#" class="js-cite-button at-CiteButton" data-reveal-id="getCitation" data-reveal> <i class="icon-read-more"></i> <span>Cite</span> </a> <div id="getCitation" class="reveal-modal js-citation-modal" data-reveal> <h3 class="modal-title">Cite</h3> <div class="oxford-citation-text"> <p>Mosè Manni, Matthew R Berkeley, Mathieu Seppey, Felipe A Simão, Evgeny M Zdobnov, BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes, <em>Molecular Biology and Evolution</em>, Volume 38, Issue 10, October 2021, Pages 4647–4654, <a href="https://doi.org/10.1093/molbev/msab199">https://doi.org/10.1093/molbev/msab199</a></p> </div> <div class="citation-download-wrap"> <form action="/Citation/Download" method="get" id="citationModal"> <input type="hidden" name="resourceId" value="6329644" /> <input type="hidden" name="resourceType" value="3" /> <label for="selectFormat" class="hide js-citation-format-label">Select Format</label> <!-- The first option carries value="" so that it is the select's placeholder label option; combined with "required", the browser then refuses to submit while it is still selected. --> <select required name="citationFormat" class="citation-download-format js-citation-format" id="selectFormat"> <option value="" selected disabled >Select format</option> <option value="0" >.ris (Mendeley, Papers, Zotero)</option> <option value="1" >.enw (EndNote)</option> <option value="2" >.bibtex (BibTex)</option> <option value="3" >.txt (Medlars, RefWorks)</option> </select> <button class="btn citation-download-link disabled" type="submit">Download citation</button> </form> </div> <a class="close-reveal-modal" 
href="javascript:;"><i class="icon-general-close"></i><span class="screenreader-text">Close</span></a> </div> </div> </li> <li class="toolbar-item item-tools"> <div class="widget widget-ToolboxPermissions widget-instance-OUP_Get_Permissions"> <div class="module-widget"> <a href="https://s100.copyright.com/AppDispatchServlet?publisherName=OUP&publication=1537-1719&title=BUSCO%20Update%3A%20Novel%20and%20Streamlined%20Workflows%20along%20with%20Broader%20and%20Deeper%20Phylogenetic%20Coverage%20for%20Scoring%20of%20Eukaryotic%2C%20Prokaryotic%2C%20and%20Viral%20Genomes&publicationDate=2021-07-28&volumeNum=38&issueNum=10&author=Manni%2C%20Mos%C3%A8%3B%20Berkeley%2C%20Matthew%20R&startPage=4647&endPage=4654&contentId=10.1093%2Fmolbev%2Fmsab199&oa=CC%20BY&copyright=%C2%A9%20The%20Author%28s%29%202021.%20Published%20by%20Oxford%20University%20Press%20on%20behalf%20of%20the%20Society%20for%20Molecular%20Biology%20and%20Evolution.&orderBeanReset=True" id="PermissionsLink" class="" target="_blank"> <i class="icon-menu_permissions"> <span class="screenreader-text">Permissions Icon</span> </i> Permissions </a> </div> </div> </li> <li class="toolbar-item item-with-dropdown item-share"> <a href="javascript:;" class="drop-trigger js-toolbar-dropdown at-ShareButton" data-dropdown="ShareDrop"> <i class="icon-menu_share"><span class="screenreader-text">Share Icon</span></i> <span class="toolbar-label"> <span class="toolbar-text">Share</span> <i class="arrow-icon icon-general-arrow-filled-down js-toolbar-arrow-icon"></i> </span> </a> <ul id="ShareDrop" class="addthis_toolbox addthis_default_style addthis_20x20_style f-dropdown js-dropdown-content" data-dropdown-content> <li> <a class="st-custom-button addthis_button_facebook js-share-link" data-network="facebook" data-title="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" 
data-url="https://academic.oup.com/mbe/article/38/10/4647/6329644" data-email-subject="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" href="javascript:;"><span>Facebook</span></a> </li> <li> <a class="st-custom-button addthis_button_twitter js-share-link" data-network="twitter" data-title="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" data-url="https://academic.oup.com/mbe/article/38/10/4647/6329644" data-email-subject="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" href="javascript:;"><span>Twitter</span></a> </li> <li> <a class="st-custom-button addthis_button_linkedin js-share-link" data-network="linkedin" data-title="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" data-url="https://academic.oup.com/mbe/article/38/10/4647/6329644" data-email-subject="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" href="javascript:;"><span>LinkedIn</span></a> </li> <li> <a class="st-custom-button addthis_button_email js-share-link" data-network="email" data-title="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" data-url="https://academic.oup.com/mbe/article/38/10/4647/6329644" data-email-subject="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes" href="javascript:;"><span>Email</span></a> </li> </ul> </li> </ul> <div 
class="toolbar-search"> <div class="widget widget-SitePageHeader widget-instance-OUP_ArticleToolbarSearchBox"> <div class="dropdown-panel-wrap"> <div class="dropdown-panel mobile-search-dropdown"> <div class="mobile-search-inner-wrap"> <div class="navbar-search"> <div class="mobile-microsite-search"> <label for="OUP_ArticleToolbarSearchBox-mobile-navbar-search-filter" class="screenreader-text js-mobile-navbar-search-filter-label"> Navbar Search Filter </label> <select class="mobile-navbar-search-filter js-mobile-navbar-search-filter at-navbar-search-filter" id="OUP_ArticleToolbarSearchBox-mobile-navbar-search-filter"> <option class="navbar-search-filter-option at-navbar-search-filter-option" value="">Molecular Biology and Evolution</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Issue">This issue</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Parent">Society for Molecular Biology and Evolution Journals</option> <optgroup class="navbar-search-optgroup" label="Search across Oxford Academic"> <option class="navbar-search-filter-option at-navbar-search-filter-option" value="AcademicSubjects/SCI01130">Evolutionary Biology</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="AcademicSubjects/SCI01180">Molecular and Cell Biology</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Books">Books</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Journals">Journals</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Umbrella">Oxford Academic</option> </optgroup> </select> <label for="OUP_ArticleToolbarSearchBox-mobile-microsite-search-term" class="screenreader-text js-mobile-microsite-search-term-label"> Mobile Enter search term </label> <input class="mobile-search-input mobile-microsite-search-term js-mobile-microsite-search-term 
at-microsite-search-term" type="text" maxlength="255" placeholder="Search" id="OUP_ArticleToolbarSearchBox-mobile-microsite-search-term"> <a href="javascript:;" class="mobile-microsite-search-icon mobile-search-submit icon-menu_search"> <span class="screenreader-text">Search</span> </a> </div> </div> </div> </div> <div class="dropdown-panel mobile-nav-dropdown"> </div> </div> <div class="navbar"> <div class="center-inner-row"> <nav class="navbar-menu"> </nav> <div class="navbar-search-container js-navbar-search-container"> <a href="javascript:;" class="navbar-search-close js_close-navsearch">Close</a> <div class="navbar-search"> <div class="microsite-search"> <label for="OUP_ArticleToolbarSearchBox-navbar-search-filter" class="screenreader-text js-navbar-search-filter-label"> Navbar Search Filter </label> <select class="navbar-search-filter js-navbar-search-filter at-navbar-search-filter" id="OUP_ArticleToolbarSearchBox-navbar-search-filter"> <option class="navbar-search-filter-option at-navbar-search-filter-option" value="">Molecular Biology and Evolution</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Issue">This issue</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Parent">Society for Molecular Biology and Evolution Journals</option> <optgroup class="navbar-search-optgroup" label="Search across Oxford Academic"> <option class="navbar-search-filter-option at-navbar-search-filter-option" value="AcademicSubjects/SCI01130">Evolutionary Biology</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="AcademicSubjects/SCI01180">Molecular and Cell Biology</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Books">Books</option><option class="navbar-search-filter-option at-navbar-search-filter-option" value="Journals">Journals</option><option class="navbar-search-filter-option at-navbar-search-filter-option" 
value="Umbrella">Oxford Academic</option> </optgroup> </select> <label for="OUP_ArticleToolbarSearchBox-microsite-search-term" class="screenreader-text js-microsite-search-term-label"> Enter search term </label> <input class="navbar-search-input microsite-search-term js-microsite-search-term at-microsite-search-term" type="text" maxlength="255" placeholder="Search" id="OUP_ArticleToolbarSearchBox-microsite-search-term"> <a href="javascript:;" class="microsite-search-icon navbar-search-submit icon-menu_search"> <span class="screenreader-text">Search</span> </a> </div> </div> <div class="navbar-search-advanced"><a href="/mbe/advanced-search" class="advanced-search js-advanced-search">Advanced Search</a></div> </div> <div class="navbar-search-collapsed"><a href="javascript:;" class="icon-menu_search js_expand-navsearch"><span class="screenreader-text">Search Menu</span></a></div> </div> </div> <input id="routename" name="RouteName" type="hidden" value="mbe" /> </div> </div> </div> </div> <div id="ContentTab" class="content active"> <div class="widget widget-ArticleFulltext widget-instance-OUP_Article_FullText_Widget"> <div class="module-widget"> <div class="widget-items" data-widgetname="ArticleFulltext"> <h2 scrollto-destination=304110801 id="304110801" class="abstract-title js-splitscreen-abstract-title" >Abstract</h2> <section class="abstract"><p class="chapter-para">Methods for evaluating the quality of genomic and metagenomic data are essential to aid genome assembly procedures and to correctly interpret the results of subsequent analyses. BUSCO estimates the completeness and redundancy of processed genomic data based on universal single-copy orthologs. Here, we present new functionalities and major improvements of the BUSCO software, as well as the renewal and expansion of the underlying data sets in sync with the OrthoDB v10 release. 
Among the major novelties, BUSCO now enables phylogenetic placement of the input sequence to automatically select the most appropriate BUSCO data set for the assessment, allowing the analysis of metagenome-assembled genomes of unknown origin. A newly introduced genome workflow increases the efficiency and runtimes especially on large eukaryotic genomes. BUSCO is the only tool capable of assessing both eukaryotic and prokaryotic species, and can be applied to various data types, from genome assemblies and metagenomic bins, to transcriptomes and gene sets.</p></section> <div class="article-metadata-panel clearfix at-ArticleMetadata"></div> <div class="kwd-group"><a class="kwd-part kwd-main" href="javascript:;" data-keyword="&quot;quality assessment&quot;">quality assessment</a>, <a class="kwd-part kwd-main" href="javascript:;" data-keyword="completeness">completeness</a>, <a class="kwd-part kwd-main" href="javascript:;" data-keyword="genome">genome</a>, <a class="kwd-part kwd-main" href="javascript:;" data-keyword="transcriptome">transcriptome</a>, <a class="kwd-part kwd-main" href="javascript:;" data-keyword="prokaryotes">prokaryotes</a>, <a class="kwd-part kwd-main" href="javascript:;" data-keyword="eukaryotes">eukaryotes</a>, <a class="kwd-part kwd-main" href="javascript:;" data-keyword="viruses">viruses</a>, <a class="kwd-part kwd-main" href="javascript:;" data-keyword="microbes">microbes</a>, <a class="kwd-part kwd-main" href="javascript:;" data-keyword="metagenomes">metagenomes</a></div><p class="chapter-para">Advances in sequencing technologies are powering accumulation of genomics data at an accelerating rate, from sequencing isolates and single cells to metagenomes of entire microbial communities. In turn, computational genomics approaches are essential to digest such molecular data into our evolving understanding of genome diversity across the tree of life, from microbes to animals and plants. 
Evaluating the quality of genomic data, in terms of completeness and redundancy, is critical for subsequent analyses and for the correct interpretation of the results. Complementing technical measures like the N50 value, biologically meaningful metrics based on expected gene content have proved to be useful for estimating the quality of genomes, as exemplified by our BUSCO tool (<span class="xrefLink" id="jumplink-msab199-B17"></span><a href="javascript:;" reveal-id="msab199-B17" data-open="msab199-B17" class="link link-ref link-reveal xref-bibr">Simão et al. 2015</a>; <span class="xrefLink" id="jumplink-msab199-B21"></span><a href="javascript:;" reveal-id="msab199-B21" data-open="msab199-B21" class="link link-ref link-reveal xref-bibr">Waterhouse et al. 2018</a>), the now discontinued CEGMA (<span class="xrefLink" id="jumplink-msab199-B14"></span><a href="javascript:;" reveal-id="msab199-B14" data-open="msab199-B14" class="link link-ref link-reveal xref-bibr">Parra et al. 2007</a>), CheckM (<span class="xrefLink" id="jumplink-msab199-B13"></span><a href="javascript:;" reveal-id="msab199-B13" data-open="msab199-B13" class="link link-ref link-reveal xref-bibr">Parks et al. 2015</a>) aimed at prokaryotes, EukCC (<span class="xrefLink" id="jumplink-msab199-B16"></span><a href="javascript:;" reveal-id="msab199-B16" data-open="msab199-B16" class="link link-ref link-reveal xref-bibr">Saary et al. 2020</a>) proposed for microbial eukaryotes, and CheckV (<span class="xrefLink" id="jumplink-msab199-B11"></span><a href="javascript:;" reveal-id="msab199-B11" data-open="msab199-B11" class="link link-ref link-reveal xref-bibr">Nayfach et al. 2020</a>) for viruses. The latest BUSCO versions introduce new functionalities for assessments of eukaryotic, prokaryotic, and viral data, along with improvements in runtimes and user experience. 
The underlying data sets have been renewed and expanded in sync with the OrthoDB v10 release (<span class="xrefLink" id="jumplink-msab199-B5"></span><a href="javascript:;" reveal-id="msab199-B5" data-open="msab199-B5" class="link link-ref link-reveal xref-bibr">Kriventseva et al. 2019</a>; <span class="xrefLink" id="jumplink-msab199-B23"></span><a href="javascript:;" reveal-id="msab199-B23" data-open="msab199-B23" class="link link-ref link-reveal xref-bibr">Zdobnov et al. 2021</a>), providing coverage of many more lineages and a revised baseline with increased data sampling.</p> <h2 scrollto-destination=304110805 id="304110805" class="section-title js-splitscreen-section-title" >New Approaches</h2> <p class="chapter-para">Here, we describe the new functionalities and datasets introduced after the release of BUSCO v3. With respect to v3, the last BUSCO version, v5, features: 1) a major upgrade of the underlying data sets in sync with OrthoDB v10; 2) an updated workflow for the assessment of prokaryotic and viral genomes using the gene predictor Prodigal (<span class="xrefLink" id="jumplink-msab199-B4"></span><a href="javascript:;" reveal-id="msab199-B4" data-open="msab199-B4" class="link link-ref link-reveal xref-bibr">Hyatt et al. 2010</a>); 3) an alternative workflow for the assessment of eukaryotic genomes using the gene predictor MetaEuk (<span class="xrefLink" id="jumplink-msab199-B6"></span><a href="javascript:;" reveal-id="msab199-B6" data-open="msab199-B6" class="link link-ref link-reveal xref-bibr">Levy Karin et al. 
2020</a>); 4) a workflow to automatically select the most appropriate BUSCO data set, enabling the analysis of sequences of unknown origin; 5) an option to run batch analysis of multiple inputs to facilitate high-throughput assessments of large data sets and metagenomic bins; and 6) a major refactoring of the code, and maintenance of two distribution channels on Bioconda (<span class="xrefLink" id="jumplink-msab199-B3"></span><a href="javascript:;" reveal-id="msab199-B3" data-open="msab199-B3" class="link link-ref link-reveal xref-bibr">Grüning et al. 2018</a>) and Docker (<span class="xrefLink" id="jumplink-msab199-B8"></span><a href="javascript:;" reveal-id="msab199-B8" data-open="msab199-B8" class="link link-ref link-reveal xref-bibr">Merkel 2014</a>). These developments make BUSCO suitable for comprehensive analyses of large heterogeneous data sets, from large eukaryotic genomes to metagenome-assembled genomes of microbial eukaryotes, prokaryotes, and viruses.</p> <h2 scrollto-destination=304110807 id="304110807" class="section-title js-splitscreen-section-title" >Results and Discussion</h2> <h3 scrollto-destination=304110808 id="304110808" class="section-title js-splitscreen-section-title" >Upgrade of Data Sets</h3> <p class="chapter-para">The benchmarking data sets of single-copy orthologs were revised and expanded using the v10 release of OrthoDB (<a class="link link-uri openInAnotherWindow" href="http://www.orthodb.org" target="_blank">www.orthodb.org</a>), which provides evolutionary and functional annotations of orthologs among the most comprehensive sampling of genomic diversity. The creation of novel data sets was necessary to cover more lineages with higher resolution data sets and to revise the existing ones with increased and evenly sampled data across the phylogenetic tree. 
Following the strategy devised previously (<span class="xrefLink" id="jumplink-msab199-B17"></span><a href="javascript:;" reveal-id="msab199-B17" data-open="msab199-B17" class="link link-ref link-reveal xref-bibr">Simão et al. 2015</a>; <span class="xrefLink" id="jumplink-msab199-B21"></span><a href="javascript:;" reveal-id="msab199-B21" data-open="msab199-B21" class="link link-ref link-reveal xref-bibr">Waterhouse et al. 2018</a>) and taking advantage of the greatly increased number of representative species, we compiled 193 odb10 (OrthoDB v10) data sets (<span class="xrefLink" id="jumplink-msab199-T1"></span><a href="javascript:;" reveal-id="msab199-T1" data-open="msab199-T1" class="link link-reveal link-table xref-fig">table 1</a>), more than a 3-fold increase over odb9 sets, and comprising overall a 5-fold increase in the number of BUSCO marker genes (hereafter BUSCOs) derived from more than twice as many species as in the previous data sets version. <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary table 1</a></span> lists the available BUSCO odb10 data sets along with the number of markers and species used to construct the sets. BUSCO v5 also includes 27 viral data sets, supporting the analysis of a subset of viruses. 
We compared the estimates of completeness of BUSCO v5 with v3 for a self-validation of the major data sets on gene sets of Bacteria, Fungi, and Metazoa (<span class="xrefLink" id="jumplink-msab199-F1"></span><a href="javascript:;" data-modal-source-id="msab199-F1" class="link xref-fig">fig. 1</a> and <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 2</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). <span class="xrefLink" id="jumplink-msab199-F1"></span><a href="javascript:;" data-modal-source-id="msab199-F1" class="link xref-fig">Figure 1</a> shows a good concordance overall, especially for Metazoa. 
Slightly more conservative estimates of v5 over v3 for fungi can be explained by the higher number of markers in odb10 BUSCO data sets compared with odb9, and by a more than 6-fold increase in the number of species. <span class="xrefLink" id="jumplink-msab199-F1"></span><a href="javascript:;" data-modal-source-id="msab199-F1" class="link xref-fig">Figure 1b</a> shows a cluster of fungal genomes with BUSCO v5 scores diverging from v3. These species belong to Microsporidia, a group of early diverging fungi once thought to be protozoans (<span class="xrefLink" id="jumplink-msab199-B20"></span><a href="javascript:;" reveal-id="msab199-B20" data-open="msab199-B20" class="link link-ref link-reveal xref-bibr">Wadi and Reinke 2020</a>). Their genomes are known to have a reduced set of genes that are commonly present in fungi and other eukaryotes. The discrepancy between v3 and v5 reflects the increased number of markers for the fungi_odb10 data set which is more balanced toward the majority of fungal clades (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary fig. 
1</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). The “microsporidia_odb10” panel in <span class="xrefLink" id="jumplink-msab199-F2"></span><a href="javascript:;" data-modal-source-id="msab199-F2" class="link xref-fig">figure 2a</a> displays the assessment of microsporidian genomes with the most specific data set microsporidia_odb10, which yields a more accurate assessment of these genomes. This example highlights the importance of using the most specific BUSCO data set available for the species of interest, as large differences in terms of gene content can often occur within higher taxonomic levels. 
Nevertheless, to obviate the biased estimation when the fungi_odb10 is used on microsporidians we also added a “parasitic check” that recalculates the scores based on the list of fungal markers missing in these species (see <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary note</a></span>s, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online).</p> <a id="304110810" scrollto-destination="304110810"></a> <div data-id="msab199-f1" data-content-id="msab199-f1" class="fig fig-section js-fig-section" swap-content-for-modal="true"><div class="graphic-wrap"><img class="content-image" 
src="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f1.jpeg?Expires=1734480393&Signature=dqdxAz21etD2ti1JNCWRuOeYOV7WwEL0MlhalQAaXJOgvFWev2JaSzj0La4d3l0DgIqe8WB9m1tLLOsPog9kpG2qHpEg2odBEZfCuhgg~iEF4cun4WMZMkIAXqW9U9Kafp9VN-Mn~OtSl2lXK-dARVO~PROCZasqivNQ7IPSh9fUh3FIWUdFZE3VJmrZjTMSurchgyeJN-ObaZEpznu2mIyL8cINDbGvAUCKcYK80rDuMyGVHqxNCFsqP4h0GtjPGi~gueSZBLkhIREPcAPHrRnpZrxmULxKnerZWay1~Dp-v1lRI1qPKBWF7~zVWJO0ibvaJGDKuE1q9ADeLuV0uA__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA" alt="Comparison of the number of complete BUSCOs obtained by running BUSCO v5 and v3 with BUSCO odb_10 and odb_9 data sets on (a) bacterial, (b) fungal, and (c) metazoan gene sets." data-path-from-xml="msab199f1.tif" /><div class="graphic-bottom"><div class="label fig-label" id="label-304110810">Fig. 1</div><div class="caption fig-caption"><p class="chapter-para">Comparison of the number of complete BUSCOs obtained by running BUSCO v5 and v3 with BUSCO odb_10 and odb_9 data sets on (<em>a</em>) bacterial, (<em>b</em>) fungal, and (<em>c</em>) metazoan gene sets.</p></div><div class="ajax-articleAbstract-exclude-regex fig-orig original-slide figure-button-wrap"><a class="fig-view-orig js-view-large at-figureViewLarge openInAnotherWindow" role="button" aria-describedby="label-304110810" href="/view-large/figure/304110810/msab199f1.tif" data-path-from-xml="msab199f1.tif" target="_blank">Open in new tab</a><a class="download-slide" role="button" aria-describedby="label-304110810" data-section="304110810" 
href="/DownloadFile/DownloadImage.aspx?image=https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199f1.jpeg?Expires=1734480393&Signature=hj~sXmuEQwgsUlSL4VLowNU0TEnBcorNBuWDpbzM~ENT1AsS7OuUAncGKGhx777pt~C4cT2nHPgHBBaGLDbbIJyNBxHXwWM~W9Ca~AnYQ5SYkGS-1buI-JLjAyenuS6cu63cEtH1FtcLJM4QvkByQWkFs7kXEnYohGbyHNs3mw-YGjhAcPYr3~xz4x93BJczfiwG4Ha2lsS03I854NG5Fw6Tb8JlyaU3JXZSogDDfaZJLDA6bVOBX5~tqEKMY0MHiyzrQzQo~PUXqbvPFArtAfPaFs-1M7e5DXJDSOG~RDMNg3bTa1tWMmPUTrSH0Omoz9H6pgz~NUHvPo-oqtsizA__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA&sec=304110810&ar=6329644&xsltPath=~/UI/app/XSLT&imagename=&siteId=5325" data-path-from-xml="msab199f1.tif">Download slide</a></div></div></div></div> <a id="304110811" scrollto-destination="304110811"></a> <div data-id="msab199-f2" data-content-id="msab199-f2" class="fig fig-section js-fig-section" swap-content-for-modal="true"><div class="graphic-wrap"><img class="content-image" src="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f2.jpeg?Expires=1734480393&Signature=Wj-olhPJaD6iovshs6sV3lbRM9U4WSHequVKhPnYpAhYxL0GybZf0zochKBobLqO6czOQgCMGO3as0mpHnF96JBlXlyzdrpBllgYKtg41LieW-6asCZP5uam3dXtThFo76rDJTHWTROog0tUTVyTV9T6Rn7g7f~8IxR~kJpX6EGYiX0ySn~llss5-vYK7OEbd6XexkJHfasRkVOxk9mM3A0hyIdN7pIQQCxdUTCn8URk5CKCUTfwwh4u5~Aw~DgfXw4uYB9vJ5KEBBSggPF792hCf9VNR1pt2IRXe3ix8MJglTM7hKdPY59BE77J5dHpG5-c3HuI2aZodOtRSV4ptg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA" alt="(a) Comparisons of BUSCO scores obtained on a set of fungal genomes using the two available workflows for eukaryotic species. The percentage on the y axis corresponds to the complete BUSCOs for the BUSCO_MetaEuk (orange) and BUSCO_Augustus (white) workflows. Assessments on gene sets are also displayed for comparison (green). Genomes were assessed using the most specific available data sets, which are displayed at the top of each subpanel. 
The newly introduced BUSCO_MetaEuk workflow allows faster assessments, see supplementary figure 3a, Supplementary Material online, for the differences in runtimes. (b and c) Effect of using different MetaEuk sensitivity values on BUSCO_MetaEuk runtimes and completeness estimation for 112 arthropod genomes evaluated with their most specific BUSCO data set. The default values are set at s = 4.5 and s = 6 for the first and the second MetaEuk runs, respectively. For the analyses, the same sensitivity value displayed on the y axis was used for both MetaEuk runs. The axis corresponding to runtimes (in seconds) is log-transformed." data-path-from-xml="msab199f2.tif" /><div class="graphic-bottom"><div class="label fig-label" id="label-304110811">Fig. 2</div><div class="caption fig-caption"><p class="chapter-para">(<em>a</em>) Comparisons of BUSCO scores obtained on a set of fungal genomes using the two available workflows for eukaryotic species. The percentage on the <em>y</em> axis corresponds to the complete BUSCOs for the BUSCO_MetaEuk (orange) and BUSCO_Augustus (white) workflows. Assessments on gene sets are also displayed for comparison (green). Genomes were assessed using the most specific available data sets, which are displayed at the top of each subpanel. 
The newly introduced BUSCO_MetaEuk workflow allows faster assessments, see <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary figure 3</a></span><em>a</em>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online, for the differences in runtimes. (<em>b</em> and <em>c</em>) Effect of using different MetaEuk sensitivity values on BUSCO_MetaEuk runtimes and completeness estimation for 112 arthropod genomes evaluated with their most specific BUSCO data set. The default values are set at <em>s</em> = 4.5 and <em>s</em> = 6 for the first and the second MetaEuk runs, respectively. 
For the analyses, the same sensitivity value displayed on the <em>y</em> axis was used for both MetaEuk runs. The axis corresponding to runtimes (in seconds) is log-transformed.</p></div><div class="ajax-articleAbstract-exclude-regex fig-orig original-slide figure-button-wrap"><a class="fig-view-orig js-view-large at-figureViewLarge openInAnotherWindow" role="button" aria-describedby="label-304110811" href="/view-large/figure/304110811/msab199f2.tif" data-path-from-xml="msab199f2.tif" target="_blank">Open in new tab</a><a class="download-slide" role="button" aria-describedby="label-304110811" data-section="304110811" href="/DownloadFile/DownloadImage.aspx?image=https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199f2.jpeg?Expires=1734480393&Signature=ptaqVBiuegmId0S4G6spUman2Da8ek5GpBxj5mG2ILhOthyTREqNaV5zAV7~xbOwUCmVhketRHc6~bM0vjPwp8SNSAyt9nL2p4HASk25YhK2VQdAkt0iOdhwxU~4EK9eFq-Cl1kQXzg2GxALAqEYtp89AC6xTzH5itV47~a7lN3iQBcoR4z2n3VHz7OX7syZz2eKHHKq1zaum8aU50M28Ui3tJwPQ7PpwjA0ReiVP-KY3HAesTOKbpEVSThoomxRVZk6W7d4nfzNJyEI9JaBlZyhd54Ruv72ckXiduiM2aJRLYojn-7FLRlgPgPiYfJaQjKVhDPYhhMKEdRQ2riLJA__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA&sec=304110811&ar=6329644&xsltPath=~/UI/app/XSLT&imagename=&siteId=5325" data-path-from-xml="msab199f2.tif">Download slide</a></div></div></div></div> <a id="304110812" scrollto-destination="304110812"></a> <div content-id="msab199-T1" class="table-modal table-full-width-wrap"><div class="table-wrap table-wide standard-table"><div class="table-wrap-title" id="msab199-T1" data-id="msab199-T1"><span class="label title-label" id="label-97940">Table 1</span><div class="
 graphic-wrap table-open-button-wrap
 "><a class="fig-view-orig at-tableViewLarge openInAnotherWindow btn js-view-large" role="button" target="_blank" href="
 /view-large/304110812" aria-describedby="label-97940"> Open in new tab </a></div><div class="caption caption-id-" id="caption-97940"><p class="chapter-para">Number of odb9 and odb10 BUSCO Data Sets.</p></div> </div><div class="table-overflow"><table role="table" aria-labelledby="
 label-97940" aria-describedby="
 caption-97940"><thead><tr><th>Taxonomic Group<span aria-hidden="true" style="display: none;"> . </span></th><th>odb9 (v3)<span aria-hidden="true" style="display: none;"> . </span></th><th>odb10 (v4/5)<span aria-hidden="true" style="display: none;"> . </span></th></tr></thead><tbody><tr><td>Bacteria</td><td>16</td><td>83</td></tr><tr><td>Archaea</td><td>0</td><td>16</td></tr><tr><td>Viruses</td><td>0</td><td>27</td></tr><tr><td>Eukaryota</td><td>33</td><td>67</td></tr><tr><td> Protist</td><td>2</td><td>7</td></tr><tr><td> Fungi</td><td>10</td><td>24</td></tr><tr><td> Plants</td><td>1</td><td>9</td></tr><tr><td> Metazoa</td><td>14</td><td>26</td></tr><tr><td> Arthropoda</td><td>5</td><td>8</td></tr><tr><td> Vertebrata</td><td>7</td><td>15</td></tr><tr><td>Total</td><td>49</td><td>193</td></tr></tbody></table></div><div class="table-modal"><table><thead><tr><th>Taxonomic Group<span aria-hidden="true" style="display: none;"> . </span></th><th>odb9 (v3)<span aria-hidden="true" style="display: none;"> . </span></th><th>odb10 (v4/5)<span aria-hidden="true" style="display: none;"> . 
</span></th></tr></thead><tbody><tr><td>Bacteria</td><td>16</td><td>83</td></tr><tr><td>Archaea</td><td>0</td><td>16</td></tr><tr><td>Viruses</td><td>0</td><td>27</td></tr><tr><td>Eukaryota</td><td>33</td><td>67</td></tr><tr><td> Protist</td><td>2</td><td>7</td></tr><tr><td> Fungi</td><td>10</td><td>24</td></tr><tr><td> Plants</td><td>1</td><td>9</td></tr><tr><td> Metazoa</td><td>14</td><td>26</td></tr><tr><td> Arthropoda</td><td>5</td><td>8</td></tr><tr><td> Vertebrata</td><td>7</td><td>15</td></tr><tr><td>Total</td><td>49</td><td>193</td></tr></tbody></table></div><div class="table-wrap-foot"><span id="fn-tblfn1"></span><div content-id="tblfn1" class="footnote"><span class="fn"><p class="chapter-para"><span class="small-caps">Note</span>.—The odb10 version greatly expanded the number of benchmarking data sets.</p></span></div></div></div></div><div class="table-full-width-wrap"><div class="table-wrap table-wide standard-table"><div class="table-wrap-title" id="msab199-T1" data-id="msab199-T1"><span class="label title-label" id="label-97940">Table 1</span><div class="
 graphic-wrap table-open-button-wrap
 "><a class="fig-view-orig at-tableViewLarge openInAnotherWindow btn js-view-large" role="button" target="_blank" href="
 /view-large/304110812" aria-describedby="label-97940"> Open in new tab </a></div><div class="caption caption-id-" id="caption-97940"><p class="chapter-para">Number of odb9 and odb10 BUSCO Data Sets.</p></div> </div><div class="table-overflow"><table role="table" aria-labelledby="
 label-97940" aria-describedby="
 caption-97940"><thead><tr><th>Taxonomic Group<span aria-hidden="true" style="display: none;"> . </span></th><th>odb9 (v3)<span aria-hidden="true" style="display: none;"> . </span></th><th>odb10 (v4/5)<span aria-hidden="true" style="display: none;"> . </span></th></tr></thead><tbody><tr><td>Bacteria</td><td>16</td><td>83</td></tr><tr><td>Archaea</td><td>0</td><td>16</td></tr><tr><td>Viruses</td><td>0</td><td>27</td></tr><tr><td>Eukaryota</td><td>33</td><td>67</td></tr><tr><td> Protist</td><td>2</td><td>7</td></tr><tr><td> Fungi</td><td>10</td><td>24</td></tr><tr><td> Plants</td><td>1</td><td>9</td></tr><tr><td> Metazoa</td><td>14</td><td>26</td></tr><tr><td> Arthropoda</td><td>5</td><td>8</td></tr><tr><td> Vertebrata</td><td>7</td><td>15</td></tr><tr><td>Total</td><td>49</td><td>193</td></tr></tbody></table></div><div class="table-modal"><table><thead><tr><th>Taxonomic Group<span aria-hidden="true" style="display: none;"> . </span></th><th>odb9 (v3)<span aria-hidden="true" style="display: none;"> . </span></th><th>odb10 (v4/5)<span aria-hidden="true" style="display: none;"> . 
</span></th></tr></thead><tbody><tr><td>Bacteria</td><td>16</td><td>83</td></tr><tr><td>Archaea</td><td>0</td><td>16</td></tr><tr><td>Viruses</td><td>0</td><td>27</td></tr><tr><td>Eukaryota</td><td>33</td><td>67</td></tr><tr><td> Protist</td><td>2</td><td>7</td></tr><tr><td> Fungi</td><td>10</td><td>24</td></tr><tr><td> Plants</td><td>1</td><td>9</td></tr><tr><td> Metazoa</td><td>14</td><td>26</td></tr><tr><td> Arthropoda</td><td>5</td><td>8</td></tr><tr><td> Vertebrata</td><td>7</td><td>15</td></tr><tr><td>Total</td><td>49</td><td>193</td></tr></tbody></table></div><div class="table-wrap-foot"><span id="fn-tblfn1"></span><div content-id="tblfn1" class="footnote"><span class="fn"><p class="chapter-para"><span class="small-caps">Note</span>.—The odb10 version greatly expanded the number of benchmarking data sets.</p></span></div></div></div></div> <h3 scrollto-destination=304110813 id="304110813" class="section-title js-splitscreen-section-title" >Novel BUSCO Workflows</h3> <p class="chapter-para">The BUSCO software was revised and new functionalities introduced to enable the analysis of inputs of unknown taxonomic origin, and to improve assessments, throughput and runtimes. 
A breakdown of the features in v5 and the differences with v3 are described in the schema of <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary figure 2</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 3</a></span>, and supplementary notes, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online.</p> <h4 scrollto-destination="304110815" id="304110815" class="section-title js-splitscreen-section-title" >New Prokaryotic and Eukaryotic Workflows</h4> <p class="chapter-para">The BUSCO software was revised to integrate the gene predictor Prodigal (<span class="xrefLink" id="jumplink-msab199-B4"></span><a href="javascript:;" reveal-id="msab199-B4" data-open="msab199-B4" class="link link-ref link-reveal xref-bibr">Hyatt et al. 2010</a>) for improving the analysis of prokaryotic genomes. The use of Prodigal coupled with the expanded number of data sets now available for Bacteria and Archaea (83 more data sets with respect to v3) makes BUSCO a suitable choice when assessing prokaryotic data. A common issue when predicting genes is to select the correct genetic code (i.e. translation table) for the species under analysis. Each prokaryotic BUSCO data set now contains information on the potential genetic codes characteristic of the species within the corresponding lineage. 
BUSCO selects the most likely genetic code automatically based on which code yields the highest coding density.</p><p class="chapter-para">BUSCO v5 features a new workflow for the analysis of eukaryotic genomes that employs the gene predictor MetaEuk (<span class="xrefLink" id="jumplink-msab199-B6"></span><a href="javascript:;" reveal-id="msab199-B6" data-open="msab199-B6" class="link link-ref link-reveal xref-bibr">Levy Karin et al. 2020</a>), which relies on MMseqs2 (<span class="xrefLink" id="jumplink-msab199-B19"></span><a href="javascript:;" reveal-id="msab199-B19" data-open="msab199-B19" class="link link-ref link-reveal xref-bibr">Steinegger and Söding 2017</a>). MetaEuk was introduced to improve the assessment of large genomes for which the previous workflow was suffering from long runtimes. Two consecutive MetaEuk runs are implemented, and parameters are tuned differently for the second run to search for BUSCO genes missing after the first run. The BUSCO_MetaEuk workflow is the default option in v5, as it allows faster assessments. The Augustus gene predictor (<span class="xrefLink" id="jumplink-msab199-B18"></span><a href="javascript:;" reveal-id="msab199-B18" data-open="msab199-B18" class="link link-ref link-reveal xref-bibr">Stanke et al. 2008</a>) is still available in BUSCO and can be selected by specifying “--augustus” when running the analysis in “genome” mode. Since the two workflows use gene predictors that are based on different methods, nonidentical results are expected when assessing the same genome. Nevertheless, they produce comparable completeness estimations on genomic sequences, which at times outperform the completeness of corresponding gene sets (<span class="xrefLink" id="jumplink-msab199-F2"></span><a href="javascript:;" data-modal-source-id="msab199-F2" class="link xref-fig">fig. 
2a</a> and <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary fig. 3</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 4</a></span>, and supplementary notes, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). <span class="xrefLink" id="jumplink-msab199-F2"></span><a href="javascript:;" data-modal-source-id="msab199-F2" class="link xref-fig">Figure 2a</a> compares the results of BUSCO v5 using the two gene predictors on fungal genomes and their corresponding gene sets. Comparisons on arthropod and protist data are reported in <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary figure 3</a></span><em>b</em> and <em>c</em>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online. On a set of 139 arthropod genomes, we investigated whether there is a set of BUSCOs consistently missed by one workflow and found by the other one. There were no consistent major differences in the ability to predict specific BUSCOs on this set, apart from a couple of exceptions (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary notes</a></span> and <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary fig. 4</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online).</p><p class="chapter-para"><span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary figure 3</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online, shows the substantial improvement in runtimes (runtimes axis has a log10 scale) when using the BUSCO_MetaEuk workflow. The higher speed is especially useful when assessing large genomes. For example, BUSCO_MetaEuk runs in 8 h and 50 min (using 56 CPUs) on the 10.7-Gb genome of the wheat <em>Triticum dicoccoides</em> (accession: GCF_002162155.1) with the poales_odb10 data set (BUSCO score: C : 99.1% [S : 9.6%, D : 89.5%], F : 0.1%, M : 0.8%, n : 4896), whereas the BUSCO_Augustus workflow takes several days to complete. 
Even faster analyses can be obtained by reducing the sensitivity value (-s) of the two runs, via the “--metaeuk_parameters” and “--metaeuk_rerun_parameters” options (default values are <em>s</em> = 4.5 and <em>s</em> = 6 for the first and second run, respectively) (<span class="xrefLink" id="jumplink-msab199-F2"></span><a href="javascript:;" data-modal-source-id="msab199-F2" class="link xref-fig">fig. 2b</a>). For example, the runtime on the <em>T. dicoccoides</em> genome decreases to 2 h and 24 min using a sensitivity value of <em>s</em> = 3 (BUSCO score: C : 98.7% [S : 9.6%, D : 89.1%], F : 0.2%, M : 1.1%, n : 4896). However, changing the sensitivity values can have an impact on the estimates (<span class="xrefLink" id="jumplink-msab199-F2"></span><a href="javascript:;" data-modal-source-id="msab199-F2" class="link xref-fig">fig. 2c</a> and <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 5</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). The default values were chosen as a trade-off between accuracy and runtimes. In most settings, it is advisable to keep the default sensitivity values so that BUSCO results remain comparable. Nevertheless, having this option can be convenient when assessing very large genomes or for getting faster evaluations on preliminary assemblies. Assembling genomes is an iterative process in which multiple draft assemblies are often produced to compare the outcome of different parameters/pipelines. Using smaller sensitivity values facilitates quick draft BUSCO assessments that were not feasible before, and should speed up the overall genome assembly procedure. The results now report the workflow used for the analysis, and this should be specified along with the BUSCO data set when reporting scores in publications.</p> <h4 scrollto-destination="304110819" id="304110819" class="section-title js-splitscreen-section-title" >Auto-Lineage Workflow: An All-in-One Option for Quality Assessment of (Meta)Genomic Data</h4> <p class="chapter-para">BUSCO v5 is the only available tool that can assess genomic data from the three domains of life in a single analysis by using the new “--auto-lineage” function. 
This is achieved through the phylogenetic placement of the input sequence (genome, gene set, or transcriptome) on a set of precomputed phylogenetic trees using SEPP (<span class="xrefLink" id="jumplink-msab199-B9"></span><a href="javascript:;" reveal-id="msab199-B9" data-open="msab199-B9" class="link link-ref link-reveal xref-bibr">Mirarab et al. 2011</a>) and pplacer (<span class="xrefLink" id="jumplink-msab199-B7"></span><a href="javascript:;" reveal-id="msab199-B7" data-open="msab199-B7" class="link link-ref link-reveal xref-bibr">Matsen et al. 2010</a>). Subsequently, BUSCO automatically attempts to select the most specific (i.e. highest resolution) data set available for the species of interest. This solves a major problem when analyzing metagenomic data where the taxonomic origin of metagenome-assembled genomes is often unknown and both eukaryotic and prokaryotic genomes can be present in the sample. For ease of batch analyses, it is now possible to run BUSCO on multiple input sequences, and an additional table summarizing the scores for all inputs is returned. Additionally, BUSCO can automatically detect a subset of viruses belonging to clades of the 27 newly introduced viral data sets. 
<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary figure 5</a></span> and supplementary table 6, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online, show the assessment on RefSeq (<span class="xrefLink" id="jumplink-msab199-B1"></span><a href="javascript:;" reveal-id="msab199-B1" data-open="msab199-B1" class="link link-ref link-reveal xref-bibr">Brister et al. 2015</a>) viral genomes and gene sets using the “--auto-lineage” function. We plan to expand the virus pipeline in the future to allow assessments of a broader set of viruses. 
An overview of the auto-lineage workflow can be found in the <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary notes</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online.</p><p class="chapter-para"><span class="xrefLink" id="jumplink-msab199-F3"></span><a href="javascript:;" data-modal-source-id="msab199-F3" class="link xref-fig">Figure 3a</a> presents the performance, in terms of selecting the right data set, of the auto-lineage procedure for 436 bacterial/archaeal genomes (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a 
path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 7</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). We compared BUSCO v5 with CheckM v1.1.3 (<span class="xrefLink" id="jumplink-msab199-B13"></span><a href="javascript:;" reveal-id="msab199-B13" data-open="msab199-B13" class="link link-ref link-reveal xref-bibr">Parks et al. 2015</a>), which, while conceptually similar, is only capable of performing assessments on bacterial and archaeal data. 
<span class="xrefLink" id="jumplink-msab199-F3"></span><a href="javascript:;" data-modal-source-id="msab199-F3" class="link xref-fig">Figure 3b</a> and <em>c</em> report BUSCO and CheckM completeness and redundancy scores for the same set of 436 genomes (see also <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 8</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). BUSCO estimates appear to be more conservative for some data points. This is in part related to the higher resolution data sets (i.e. 
more markers) automatically selected for the assessment (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary fig. S6</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). Overall, on prokaryotic data, BUSCO has comparable results to CheckM. 
However, a major advantage of BUSCO is the ability to detect and assess eukaryotic microbial genomes.</p> <a id="304110822" scrollto-destination="304110822"></a> <div data-id="msab199-f3" data-content-id="msab199-f3" class="fig fig-section js-fig-section" swap-content-for-modal="true"><div class="graphic-wrap"><img class="content-image" src="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f3.jpeg?Expires=1734480393&Signature=Czrqrmr-O89u8cDjMrRnd-3U4UnuwxRY39OxT7nVr5IBMsjyCQ2KJK9PBwyHwcfwv1NWObXGcTlMQLFnezU-XSsnznmsUaaeJSU0yo3UyqA~OAt4bGLvo7yCP7Vqxc2HJtxTMBg6mD~52isyL1s8NeGNsIvKRq-wn8EFWd3ZZF-WCLH0ypVYE7tz0M0br3I3hnaFcedOY7TxSZj26ZSpKG-84Eo1JHkSuyAx~0juRUIfaFd4cNbRAnz~sj6kK5bEBji6WK1wH5Sjb8IpR89Czp7foHUv2Wu9Qjp5hxHsZaNgRLGNlVSzdT5o4JT46UD~PQ9CL2NJgXnbgOKFZDoDpg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA" alt="BUSCO assessment on microbial data and comparison with CheckM. (a) Accuracy in the choice of data set produced by the auto-lineage mode when analyzing bacterial and archaeal assemblies (n = 436). For a given assembly, there can be between one and four suitable data sets (from the more general, root data set, down to the more specific one) to choose from (x axis). The selected data set is considered as “correct” when it is the most lineage-specific available for the genome; “suboptimal” when a parent lineage is selected; and “in disagreement with the NCBI” when the selected lineage is not part of the NCBI taxonomic annotation of that genome. This might indicate an error; however, 12 out of 19 genomes in this category are annotated by NCBI as “unclassified,” while sharing a parent lineage with the BUSCO selected data set; e.g. assembly GCF_000153385.1 is an unclassified Flavobacteria and was assigned to flavobacteriales_odb10 data set (also see supplementary table 7, Supplementary Material online). When supported by a high BUSCO score, this suggests that the data set selected by BUSCO was appropriate. 
(b and c) Comparison of BUSCO and CheckM completeness (blue) and redundancy (red) scores on a set of 436 genomes. For clarity, the two scatterplots are zoomed in on the areas of highest densities. n represents the number of data points displayed in the zoomed area. (d) Memory requirements for running BUSCO with the auto-lineage workflow on a set of bacterial and fungal genomes." data-path-from-xml="msab199f3.tif" /><div class="graphic-bottom"><div class="label fig-label" id="label-304110822">Fig. 3</div><div class="caption fig-caption"><p class="chapter-para">BUSCO assessment on microbial data and comparison with CheckM. (<em>a</em>) Accuracy in the choice of data set produced by the auto-lineage mode when analyzing bacterial and archaeal assemblies (<em>n</em> = 436). For a given assembly, there can be between one and four suitable data sets (from the more general, root data set, down to the more specific one) to choose from (<em>x</em> axis). The selected data set is considered as “correct” when it is the most lineage-specific available for the genome; “suboptimal” when a parent lineage is selected; and “in disagreement with the NCBI” when the selected lineage is not part of the NCBI taxonomic annotation of that genome. This might indicate an error; however, 12 out of 19 genomes in this category are annotated by NCBI as “unclassified,” while sharing a parent lineage with the BUSCO selected data set; e.g. 
assembly GCF_000153385.1 is an unclassified Flavobacteria and was assigned to flavobacteriales_odb10 data set (also see <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 7</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). When supported by a high BUSCO score, this suggests that the data set selected by BUSCO was appropriate. (<em>b</em> and <em>c</em>) Comparison of BUSCO and CheckM completeness (blue) and redundancy (red) scores on a set of 436 genomes. For clarity, the two scatterplots are zoomed in on the areas of highest densities. <em>n</em> represents the number of data points displayed in the zoomed area. 
(<em>d</em>) Memory requirements for running BUSCO with the auto-lineage workflow on a set of bacterial and fungal genomes.</p></div><div class="ajax-articleAbstract-exclude-regex fig-orig original-slide figure-button-wrap"><a class="fig-view-orig js-view-large at-figureViewLarge openInAnotherWindow" role="button" aria-describedby="label-304110822" href="/view-large/figure/304110822/msab199f3.tif" data-path-from-xml="msab199f3.tif" target="_blank">Open in new tab</a><a class="download-slide" role="button" aria-describedby="label-304110822" data-section="304110822" href="/DownloadFile/DownloadImage.aspx?image=https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199f3.jpeg?Expires=1734480393&Signature=vAVcjA~ZCWRSR4Iq8wJZit0SM6Z7ribdWrrQtOFH7ivZ1Qbu4GrQDFLTseS84R1tJx2IPq8XrVk2gB9~RKK9NbtbAFfjXJ5uuZ5PVyCZDbnMIfaheizrUlvABiml81vm2ztilC2V8x-fAMBxY37K313AD8gVX7GAXrmxwu16PXyHGqJEmUBJOcR~kSJ9cfxQSsnTh3tf~7L8ZMNIE-JzWmg4EaSysUi-rufes9yjhJ2Q0hG1pSr5dTt-Y841P6e7VqN1xx853sT3IGSYtwWeZWs1akf~96jmvpu18rwHjgNrclZe7lDi9g-8eOlA7E1wY83By2RaNSmNEsne2dwfnA__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA&sec=304110822&ar=6329644&xsltPath=~/UI/app/XSLT&imagename=&siteId=5325" data-path-from-xml="msab199f3.tif">Download slide</a></div></div></div></div><p class="chapter-para">In terms of resources, the mean runtime per genome with BUSCO (on the 436 prokaryotic genomes, in batch mode and using the prokaryotic-specific “--auto-lineage-prok”) is less than a minute (e.g. 
35 and 48 s with 30 and eight CPUs, respectively) (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary tables 9 and 10</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). Running BUSCO through a workflow management system can considerably reduce the overall runtime. We provide an example using Snakemake (<span class="xrefLink" id="jumplink-msab199-B10"></span><a href="javascript:;" reveal-id="msab199-B10" data-open="msab199-B10" class="link link-ref link-reveal xref-bibr">Mölder et al. 
2021</a>) at <a class="link link-uri openInAnotherWindow" href="https://gitlab.com/ezlab/plugins_buscov5" target="_blank">https://gitlab.com/ezlab/plugins_buscov5</a>. With this setup and allowing a total of 30 CPUs with five CPUs per task, the overall runtime for completing the same assessment was reduced to 95 min (a mean runtime of 13 s per genome) compared with 257 min. <span class="xrefLink" id="jumplink-msab199-F3"></span><a href="javascript:;" data-modal-source-id="msab199-F3" class="link xref-fig">Figure 3d</a> shows the memory requirements for assessing a set of bacterial and fungal genomes with the BUSCO auto-lineage workflow. The memory requirements do not exceed 11 GB for bacterial genomes, so that they can be assessed on laptops with limited memory and CPU resources (e.g. the same assessment ran to completion on a MacBook Pro with 16 GB and eight cores). This is an advantage in comparison to the 70 GB of memory required by CheckM (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 9</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online).</p><p class="chapter-para">The percentage of duplicated markers reported by BUSCO can reflect technical or biological duplications (i.e. redundant markers derive from the same genome), or contamination from other species/strains. BUSCO cannot directly distinguish whether redundant BUSCOs are due to duplications or contamination. Nevertheless, the sequences detected by BUSCO as “duplicated” can be used as evidence for further investigation. In general, a high “duplication” score for prokaryotic data is more likely to be caused by contamination than by gene duplication, especially for metagenome-assembled genomes, which often require manual refinements (<span class="xrefLink" id="jumplink-msab199-B2"></span><a href="javascript:;" reveal-id="msab199-B2" data-open="msab199-B2" class="link link-ref link-reveal xref-bibr">Eren et al. 2015</a>). <span class="xrefLink" id="jumplink-msab199-F3"></span><a href="javascript:;" data-modal-source-id="msab199-F3" class="link xref-fig">Figure 3c</a> shows an overall concordance between BUSCO “duplication” and CheckM “contamination” estimates.</p><p class="chapter-para">Additionally, BUSCO v5 can highlight contamination deriving from species belonging to other domains by means of the scores obtained from assessing the input with the three “root” data sets (bacteria_odb10, archaea_odb10, eukaryota_odb10). 
These assessments are automatically performed as the first step of the “auto-lineage” workflow. As there can be a background level of cross-matches between data sets, it is expected to have BUSCOs scoring in multiple “root” data sets. For example, running the “root” data sets on a set of 2,779 bacterial genomes from RefSeq (<span class="xrefLink" id="jumplink-msab199-B12"></span><a href="javascript:;" reveal-id="msab199-B12" data-open="msab199-B12" class="link link-ref link-reveal xref-bibr">O’Leary et al. 2016</a>) results in a median complete BUSCO score of 18.5% and 4.3% for the archaea_odb10 and eukaryota_odb10 data sets, respectively (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 10</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). The frequency of matches (including those reported as “fragmented”) for each BUSCO is shown in <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary figure 7</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online. 214 (83.9%) of the eukaryota_odb10 BUSCOs are detected in 5% or fewer of the bacterial genomes, with 184 (72.2%) with no matches at all. 120 (61.9%) of the archaea_odb10 BUSCOs are detected in 5% or fewer of the bacterial genomes, with 87 (44.84%) never showing up (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary table 11</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). The percentage of complete matches from bacteria_odb10 and archaea_odb10 in eukaryotic genomes is, on average, higher, e.g. 12.1% and 21.1% in fungal genomes and 30.7% and 62.4% in arthropod gene sets, respectively (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary fig. 
8 and supplementary tables 10 and 11</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online), making it less useful to spot contaminants. Nevertheless, high completeness scores from these data sets may alert users to the potential presence of contaminant species or horizontal gene transfer events from other domains, whereas high duplication scores may indicate the presence of multiple contaminant species.</p> <h3 scrollto-destination=304110826 id="304110826" class="section-title js-splitscreen-section-title" >Benchmark of Predictions</h3> <p class="chapter-para">To assess the precision of the BUSCO estimates, we benchmarked BUSCO v5 predictions on gene sets and genomes artificially depleted of randomly selected genes. Briefly, we randomly removed 0/10/30/50% of the genes in the official gene set, generating five simulated versions for each level of depletion. The corresponding genes in the genome were masked using the coordinates from the GFF file. 
BUSCO v5 was run on the simulated gene sets and genomes (both BUSCO_Augustus and BUSCO_MetaEuk workflows) using the most specific data set and the most generic one (for more details, see <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary notes</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online). <span class="xrefLink" id="jumplink-msab199-F4"></span><a href="javascript:;" data-modal-source-id="msab199-F4" class="link xref-fig">Figure 4a</a> shows an example of the results of the benchmarks for <em>Drosophila melanogaster</em> (assembly accession: GCF_000001215.4). 
The predicted BUSCO estimates on depleted gene sets and genomes have a good overall correspondence to the expected values when using the diptera_odb10 data set, the most specific and appropriate data set. When using the more generic eukaryota_odb10 data set, the estimates are subject to more variability (<span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary fig. 9</a></span><em>a</em>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online) across the different depleted versions, which is expected and explained by the lower number of markers, and the correspondingly lower coverage of the genome/gene set. 
This further highlights the importance of using the most specific data set when possible.</p> <a id="304110828" scrollto-destination="304110828"></a> <div data-id="msab199-f4" data-content-id="msab199-f4" class="fig fig-section js-fig-section" swap-content-for-modal="true"><div class="graphic-wrap"><img class="content-image" src="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/m_msab199f4.jpeg?Expires=1734480393&Signature=enZclGlwc34HoQQNny2kG3P2ad0dMDVu46u6mv2EQkRptWbBU1amOZTk22jeopLXFCxh-kG3g8RtBeEgFxKJGZQ2ERinIad5k6y21C4PMCNVqIqvhTmRCGvN~zkoxyjjuXKYVWtRf7u3TCX1t2ZhrjRJU6fhTqr3UIV-XAVM7XyyOHXkmiJuJPDD0CtAEYgsKa8202yQvOrD1CRGOKj0cnTCf3BJ03Q-34bOvl8ed35sYvQmy9FCNgW2JNTJ5Tn4ibHHpYM5e96XLjyrP5lSHGOwyjIx-IHX4F2U6adhyxk~hEZkB6thR0qCKHyjP7lTlvwBZIHCkDCYWsWob2SBqw__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA" alt="Benchmarking BUSCO estimates on artificially depleted genomes and gene sets of Drosophila melanogaster assessed with the diptera_odb10 data set. (a) Artificial depletion was made on the full gene set. (b) Artificial depletion exclusively made on genes matching BUSCO markers. For both panels, solid red lines indicate the expected missing values. Five randomly depleted versions were used for each level of depletion. (c) Precisions of the predictions for the analyses of panel (b)." data-path-from-xml="msab199f4.tif" /><div class="graphic-bottom"><div class="label fig-label" id="label-304110828">Fig. 4</div><div class="caption fig-caption"><p class="chapter-para">Benchmarking BUSCO estimates on artificially depleted genomes and gene sets of <em>Drosophila melanogaster</em> assessed with the diptera_odb10 data set. (<em>a</em>) Artificial depletion was made on the full gene set. (<em>b</em>) Artificial depletion exclusively made on genes matching BUSCO markers. For both panels, solid red lines indicate the expected missing values. Five randomly depleted versions were used for each level of depletion. 
(<em>c</em>) Precisions of the predictions for the analyses of panel (<em>b</em>).</p></div><div class="ajax-articleAbstract-exclude-regex fig-orig original-slide figure-button-wrap"><a class="fig-view-orig js-view-large at-figureViewLarge openInAnotherWindow" role="button" aria-describedby="label-304110828" href="/view-large/figure/304110828/msab199f4.tif" data-path-from-xml="msab199f4.tif" target="_blank">Open in new tab</a><a class="download-slide" role="button" aria-describedby="label-304110828" data-section="304110828" href="/DownloadFile/DownloadImage.aspx?image=https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199f4.jpeg?Expires=1734480393&Signature=fcdzQq7O5f9mGO0vAU0AQKEA0Cy6TQE9htaog0gaVw2B3nvqPdX0K4NMPX-tjHk0ZXawyTbLR36Y6QqBYJTUCvsaBPFoXJjStM7PMi4gbHio~67~NMkWs2XYvbcbuBOyLws5W9CU3fqYsWQ1XG~GsGLomFc3cXeaO-idY7WRzqMCUHvajDa2bJyW5TnVF5K~I3RaiRRN6XDLsy~9edPcJ12F913MI~-~DyB3xXOpAnRa9gw4awDUF2sZvupHWyTtQHw2Bvdu5v4eWhwfLqr4TeoZOn1lWeQur7~H2pMnIm8~PYFV2CaV0iEzWWEboIzEUaECBSyAmLpDy4YHzCeGdg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA&sec=304110828&ar=6329644&xsltPath=~/UI/app/XSLT&imagename=&siteId=5325" data-path-from-xml="msab199f4.tif">Download slide</a></div></div></div></div><p class="chapter-para">A second slightly different type of benchmarking was used to compute the number of false positive (FP)/false negative (FN) predictions. In this case we exclusively depleted genes predicted to be BUSCO markers. We first mapped the gene set to the OrthoDB level of interest (e.g. if assessing the species with diptera_odb10, the gene set was mapped to the OrthoDB diptera level). Based on this ortholog mapping we depleted the gene set/assemblies by 0/10/30/50/100% of the predicted BUSCO genes, generating five versions for each depletion level (except for 100% depletion). BUSCO v5 was run on these simulated data and the FP/FN and precision estimates were computed using the initial OrthoDB mapping as ground truth. 
<span class="xrefLink" id="jumplink-msab199-F4"></span><a href="javascript:;" data-modal-source-id="msab199-F4" class="link xref-fig">Figure 4b</a> shows the overall congruent estimates on <em>D. melanogaster</em> data. Removing 100% of the potential markers results in a small percentage of false positives, with the newly introduced BUSCO_MetaEuk workflow having a smaller number of false positives. All three modes have similar precision (<span class="xrefLink" id="jumplink-msab199-F4"></span><a href="javascript:;" data-modal-source-id="msab199-F4" class="link xref-fig">fig. 4c</a>), with BUSCO_MetaEuk workflow showing a slightly higher precision when depletion is equal to or above 50%. <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary figure 10</a></span>, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online, shows the results of the two benchmarks on the yeast <em>Saccharomyces cerevisiae</em> (GCF_000146045.2). A detailed description of the benchmark procedures is reported in the <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary note</a></span>s, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online.</p> <h3 scrollto-destination=304110830 id="304110830" class="section-title js-splitscreen-section-title" >Other Improvements and Distribution</h3> <p class="chapter-para">Along with a major refactoring of the code, new options have been added for managing the increasing number of data sets and to facilitate the analysis procedure. In particular, we added a default option to automatically download the necessary precomputed files for phylogenetic placement, and the data sets, either by specifying “-l &lt;dataset_name&gt;” as an option on the command line when initiating a BUSCO run, or by running in auto-lineage mode. Documentation and software setup instructions are all described in detail at <a class="link link-uri openInAnotherWindow" href="https://busco.ezlab.org/busco_userguide.html" target="_blank">https://busco.ezlab.org/busco_userguide.html</a>. We now also maintain a BUSCO package on Bioconda (<a class="link link-uri openInAnotherWindow" href="https://anaconda.org/bioconda/busco" target="_blank">https://anaconda.org/bioconda/busco</a>) and a Docker container. We encourage BUSCO users to favor these two approaches to control the version of each software dependency that is used. 
In addition, the BUSCO code is still distributed on GitLab at <a class="link link-uri openInAnotherWindow" href="https://gitlab.com/ezlab/busco" target="_blank">https://gitlab.com/ezlab/busco</a>.</p> <h2 scrollto-destination=304110832 id="304110832" class="section-title js-splitscreen-section-title" >Materials and Methods</h2> <p class="chapter-para">BUSCO data sets are available at <a class="link link-uri openInAnotherWindow" href="https://busco-data.ezlab.org/v5/data/lineages/" target="_blank">https://busco-data.ezlab.org/v5/data/lineages/</a>. Each BUSCO data set contains the details on the species, orthologous groups, and genes used to construct the set. Versions and accessions of all the genome assemblies and gene sets, and the BUSCO main results analyzed as part of this study are listed in the supplementary tables, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online. 
Further details on the analyses are described in the <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">supplementary note</a></span>s, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online. 
Plots presenting the results of the analyses were made using the ggplot2 package (<span class="xrefLink" id="jumplink-msab199-B22"></span><a href="javascript:;" reveal-id="msab199-B22" data-open="msab199-B22" class="link link-ref link-reveal xref-bibr">Wickham 2009</a>) in R (<span class="xrefLink" id="jumplink-msab199-B15"></span><a href="javascript:;" reveal-id="msab199-B15" data-open="msab199-B15" class="link link-ref link-reveal xref-bibr">R Core Team 2020</a>).</p> <h2 scrollto-destination=304110834 id="304110834" class="section-title js-splitscreen-section-title" >Supplementary Material</h2> <p class="chapter-para"><span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary data</a></span> are available at <em>Molecular Biology and Evolution</em> online.</p> <h2 scrollto-destination=304110836 id="304110836" class="backacknowledgements-title js-splitscreen-backacknowledgements-title" data-legacy-id=ack1>Acknowledgments</h2> <p class="chapter-para">This work was supported by funding from the University of Geneva, Swiss National Science Foundation (Grant No. 310030_189062) and Swiss Institute of Bioinformatics SERI to E.Z. We would like to thank all current and former members of the E.Z. group, and Robert M. 
Waterhouse for continuing support of the BUSCO project and the user community.</p> <h3 scrollto-destination=304110838 id="304110838" class="section-title js-splitscreen-section-title" >Data Availability</h3> <p class="chapter-para">BUSCO is licensed and freely distributed under the MIT Licence. The BUSCO source code is available through the GitLab project, <a class="link link-uri openInAnotherWindow" href="https://gitlab.com/ezlab/busco" target="_blank">https://gitlab.com/ezlab/busco</a>, and it is also maintained on Bioconda (<a class="link link-uri openInAnotherWindow" href="https://anaconda.org/bioconda/busco" target="_blank">https://anaconda.org/bioconda/busco</a>) and as a Docker container. BUSCO data sets are available at <a class="link link-uri openInAnotherWindow" href="https://busco-data.ezlab.org/v5/data/lineages/" target="_blank">https://busco-data.ezlab.org/v5/data/lineages/</a>. Each BUSCO data set contains the details on the species, orthologous groups, and genes used to construct the set. Further information can be accessed by mapping through the OrthoDB website. We also provide a single text file at <a class="link link-uri openInAnotherWindow" href="https://busco-data.ezlab.org/v5/data/" target="_blank">https://busco-data.ezlab.org/v5/data/</a> reporting the IDs of all proteins used to build the data sets with all the mappings to relevant information (e.g. data set, Orthologous Group, species name, assemblyID). 
Versions and accessions of all the genome assemblies and gene sets analyzed in this study, along with their corresponding species name are listed in the supplementary tables, <span class="link link-data-supplement" data-supplement-target="sup1"></span><span class="content-section supplementary-material"><a path-from-xml="sup1" href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1734480393&Signature=zD5powbs78CcdNvJHLo-SE6wM3G7NLeSPRUVpeHIIJlChLl18DbeOT5Go53fYKnc7SPVIt2LPXzWAAm-5WZh6Y8SK-jEGjwiwtY5VJur9RoSr0f6bXOPyA8v8QpZ3NhrIH9PRz27WksRJRxK3cfhLcplJjwgVpF4v~hvsMWGR5D1pIo8Is43NFLbDLJiV453oiYqUgWn2GnMjtaSE4t5L0ukMy6Oqd04SAkhHip~h1SyvHA0qa1UIr-Z~sBxdiSmkGXQYgqZFCYFq~KFBKcIpHzI-9sls12BlEWwzCP83MCZ~PQdY9mwENSouy2Br4LBDikKGGv37-SF334393wcPg__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA">Supplementary Material</a></span> online, and are accessible through the NCBI database. The simulated data and the intermediate outputs underlying the benchmark of predictions are available on Zenodo, at <a class="link link-uri openInAnotherWindow" href="https://www.doi.org/10.5281/zenodo.4972052" target="_blank">https://www.doi.org/10.5281/zenodo.4972052</a>.</p> <h2 scrollto-destination=304110840 id="304110840" class="backreferences-title js-splitscreen-backreferences-title" data-legacy-id=ref1>References</h2> <div class="ref-list js-splitview-ref-list"><div content-id="msab199-B1" class="js-splitview-ref-item" data-legacy-id="msab199-B1"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B1" href="javascript:;" aria-label="jumplink-msab199-B1" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B1" class="ref-content " data-id="msab199-B1"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Brister</div> <div class="given-names">JR</div></span>, <span 
class="name string-name"><div class="surname">Ako-adjei</div> <div class="given-names">D</div></span>, <span class="name string-name"><div class="surname">Bao</div> <div class="given-names">Y</div></span>, <span class="name string-name"><div class="surname">Blinkova</div> <div class="given-names">O.</div></span></span> <div class="year">2015</div>. <div class="article-title">NCBI viral genomes resource</div>. <div class="source ">Nucleic Acids Res</div>. <div class="volume">43</div>(<div class="issue">Database issue</div>):<div class="fpage">D571</div>–<div class="lpage">D577</div>.</p><!--citationLinks: case 2--><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=NCBI%20viral%20genomes%20resource&author=JR%20Brister&author=D%20Ako-adjei&author=Y%20Bao&author=O.%20Blinkova&publication_year=2015&journal=Nucleic%20Acids%20Res&volume=43&pages=D571-D577" target="_blank">Google Scholar</a></span></p><div class="xslopenurl empty-target"><span class="js-inst-open-url-holders-nodoi"><a class="js-open-url-link" data-href-template="{targetURL}?sid=oup:orr&genre=article&atitle=NCBI+viral+genomes+resource&aulast=Brister&title=Nucleic+Acids+Res&date=2015&spage=D571&epage=D577&volume=43&issue=Database+issue" href="javascript:;"><span class="screenreader-text">OpenURL Placeholder Text</span></a></span></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:NCBI%20viral%20genomes%20resource&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B2" class="js-splitview-ref-item" data-legacy-id="msab199-B2"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B2" href="javascript:;" aria-label="jumplink-msab199-B2" 
data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B2" class="ref-content " data-id="msab199-B2"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Eren</div> <div class="given-names">AM</div></span>, <span class="name string-name"><div class="surname">Esen</div> <div class="given-names">ÖC</div></span>, <span class="name string-name"><div class="surname">Quince</div> <div class="given-names">C</div></span>, <span class="name string-name"><div class="surname">Vineis</div> <div class="given-names">JH</div></span>, <span class="name string-name"><div class="surname">Morrison</div> <div class="given-names">HG</div></span>, <span class="name string-name"><div class="surname">Sogin</div> <div class="given-names">ML</div></span>, <span class="name string-name"><div class="surname">Delmont</div> <div class="given-names">TO.</div></span></span> <div class="year">2015</div>. <div class="article-title">Anvi’o: an advanced analysis and visualization platform for ‘omics data</div>. 
<div class="source ">PeerJ</div> <div class="volume">3</div>:<div class="fpage">e1319</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Anvi%E2%80%99o%3A%20an%20advanced%20analysis%20and%20visualization%20platform%20for%20%E2%80%98omics%20data&author=AM%20Eren&author=%C3%96C%20Esen&author=C%20Quince&author=JH%20Vineis&author=HG%20Morrison&author=ML%20Sogin&author=TO.%20Delmont&publication_year=2015&journal=PeerJ&volume=3&pages=e1319" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.7717/peerj.1319" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.7717%2Fpeerj.1319" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.7717%2Fpeerj.1319"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/26500826" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:Anvi%E2%80%99o%3A%20an%20advanced%20analysis%20and%20visualization%20platform%20for%20%E2%80%98omics%20data&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B3" class="js-splitview-ref-item" data-legacy-id="msab199-B3"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B3" href="javascript:;" aria-label="jumplink-msab199-B3" data-id=""></a></span></div><div class="ref false"><div 
id="ref-auto-msab199-B3" class="ref-content " data-id="msab199-B3"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Grüning</div> <div class="given-names">B</div></span>, <span class="name string-name"><div class="surname">Dale</div> <div class="given-names">R</div></span>, <span class="name string-name"><div class="surname">Sjödin</div> <div class="given-names">A</div></span>, <span class="name string-name"><div class="surname">Chapman</div> <div class="given-names">BA</div></span>, <span class="name string-name"><div class="surname">Rowe</div> <div class="given-names">J</div></span>, <span class="name string-name"><div class="surname">Tomkins-Tinch</div> <div class="given-names">CH</div></span>, <span class="name string-name"><div class="surname">Valieris</div> <div class="given-names">R</div></span>, <span class="name string-name"><div class="surname">Köster</div> <div class="given-names">J</div></span></span>, Bioconda Team. <div class="year">2018</div>. <div class="article-title">Bioconda: sustainable and comprehensive software distribution for the life sciences</div>. <div class="source ">Nat Methods</div>. 
<div class="volume">15</div>(<div class="issue">7</div>):<div class="fpage">475</div>–<div class="lpage">476</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Bioconda%3A%20sustainable%20and%20comprehensive%20software%20distribution%20for%20the%20life%20sciences&author=B%20Gr%C3%BCning&author=R%20Dale&author=A%20Sj%C3%B6din&author=BA%20Chapman&author=J%20Rowe&author=CH%20Tomkins-Tinch&author=R%20Valieris&author=J%20K%C3%B6ster&publication_year=2018&journal=Nat%20Methods&volume=15&pages=475-476" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1038/s41592-018-0046-7" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1038%2Fs41592-018-0046-7" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1038%2Fs41592-018-0046-7"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/29967506" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:Bioconda%3A%20sustainable%20and%20comprehensive%20software%20distribution%20for%20the%20life%20sciences&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B4" class="js-splitview-ref-item" data-legacy-id="msab199-B4"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B4" href="javascript:;" 
aria-label="jumplink-msab199-B4" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B4" class="ref-content " data-id="msab199-B4"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Hyatt</div> <div class="given-names">D</div></span>, <span class="name string-name"><div class="surname">Chen</div> <div class="given-names">G-L</div></span>, <span class="name string-name"><div class="surname">LoCascio</div> <div class="given-names">PF</div></span>, <span class="name string-name"><div class="surname">Land</div> <div class="given-names">ML</div></span>, <span class="name string-name"><div class="surname">Larimer</div> <div class="given-names">FW</div></span>, <span class="name string-name"><div class="surname">Hauser</div> <div class="given-names">LJ.</div></span></span> <div class="year">2010</div>. <div class="article-title">Prodigal: prokaryotic gene recognition and translation initiation site identification</div>. 
<div class="source ">BMC Bioinformatics</div> <div class="volume">11</div>:<div class="fpage">119</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Prodigal%3A%20prokaryotic%20gene%20recognition%20and%20translation%20initiation%20site%20identification&author=D%20Hyatt&author=G-L%20Chen&author=PF%20LoCascio&author=ML%20Land&author=FW%20Larimer&author=LJ.%20Hauser&publication_year=2010&journal=BMC%20Bioinformatics&volume=11&pages=119" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1186/1471-2105-11-119" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1186%2F1471-2105-11-119" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1186%2F1471-2105-11-119"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/20211023" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:Prodigal%3A%20prokaryotic%20gene%20recognition%20and%20translation%20initiation%20site%20identification&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B5" class="js-splitview-ref-item" data-legacy-id="msab199-B5"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B5" href="javascript:;" aria-label="jumplink-msab199-B5" data-id=""></a></span></div><div class="ref false"><div 
id="ref-auto-msab199-B5" class="ref-content " data-id="msab199-B5"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Kriventseva</div> <div class="given-names">EV</div></span>, <span class="name string-name"><div class="surname">Kuznetsov</div> <div class="given-names">D</div></span>, <span class="name string-name"><div class="surname">Tegenfeldt</div> <div class="given-names">F</div></span>, <span class="name string-name"><div class="surname">Manni</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Dias</div> <div class="given-names">R</div></span>, <span class="name string-name"><div class="surname">Simão</div> <div class="given-names">FA</div></span>, <span class="name string-name"><div class="surname">Zdobnov</div> <div class="given-names">EM.</div></span></span> <div class="year">2019</div>. <div class="article-title">OrthoDB v10: sampling the diversity of animal, plant, fungal, protist, bacterial and viral genomes for evolutionary and functional annotations of orthologs</div>. <div class="source ">Nucleic Acids Res</div>. 
<div class="volume">47</div>(<div class="issue">D1</div>):<div class="fpage">D807</div>–<div class="lpage">D811</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=OrthoDB%20v10%3A%20sampling%20the%20diversity%20of%20animal%2C%20plant%2C%20fungal%2C%20protist%2C%20bacterial%20and%20viral%20genomes%20for%20evolutionary%20and%20functional%20annotations%20of%20orthologs&author=EV%20Kriventseva&author=D%20Kuznetsov&author=F%20Tegenfeldt&author=M%20Manni&author=R%20Dias&author=FA%20Sim%C3%A3o&author=EM.%20Zdobnov&publication_year=2019&journal=Nucleic%20Acids%20Res&volume=47&pages=D807-D811" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1093/nar/gky1053" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1093%2Fnar%2Fgky1053" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1093%2Fnar%2Fgky1053"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/30395283" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:OrthoDB%20v10%3A%20sampling%20the%20diversity%20of%20animal%2C%20plant%2C%20fungal%2C%20protist%2C%20bacterial%20and%20viral%20genomes%20for%20evolutionary%20and%20functional%20annotations%20of%20orthologs&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B6" 
class="js-splitview-ref-item" data-legacy-id="msab199-B6"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B6" href="javascript:;" aria-label="jumplink-msab199-B6" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B6" class="ref-content " data-id="msab199-B6"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Levy Karin</div> <div class="given-names">E</div></span>, <span class="name string-name"><div class="surname">Mirdita</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Söding</div> <div class="given-names">J.</div></span></span> <div class="year">2020</div>. <div class="article-title">MetaEuk—sensitive, high-throughput gene discovery, and annotation for large-scale eukaryotic metagenomics</div>. <div class="source ">Microbiome</div> <div class="volume">8</div>(<div class="issue">1</div>):<div class="fpage">48</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=MetaEuk%E2%80%94sensitive%2C%20high-throughput%20gene%20discovery%2C%20and%20annotation%20for%20large-scale%20eukaryotic%20metagenomics&author=E%20Levy%20Karin&author=M%20Mirdita&author=J.%20S%C3%B6ding&publication_year=2020&journal=Microbiome&volume=8&pages=48" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1186/s40168-020-00808-x" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1186%2Fs40168-020-00808-x" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span 
class="inst-open-url-holders" data-targetId="10.1186%2Fs40168-020-00808-x"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/32245390" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:MetaEuk%E2%80%94sensitive%2C%20high-throughput%20gene%20discovery%2C%20and%20annotation%20for%20large-scale%20eukaryotic%20metagenomics&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B7" class="js-splitview-ref-item" data-legacy-id="msab199-B7"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B7" href="javascript:;" aria-label="jumplink-msab199-B7" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B7" class="ref-content " data-id="msab199-B7"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Matsen</div> <div class="given-names">FA</div></span>, <span class="name string-name"><div class="surname">Kodner</div> <div class="given-names">RB</div></span>, <span class="name string-name"><div class="surname">Armbrust</div> <div class="given-names">EV.</div></span></span> <div class="year">2010</div>. <div class="article-title">pplacer: linear time maximum-likelihood and Bayesian phylogenetic placement of sequences onto a fixed reference tree</div>. 
<div class="source ">BMC Bioinformatics</div> <div class="volume">11</div>:<div class="fpage">538</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=pplacer%3A%20linear%20time%20maximum-likelihood%20and%20Bayesian%20phylogenetic%20placement%20of%20sequences%20onto%20a%20fixed%20reference%20tree&author=FA%20Matsen&author=RB%20Kodner&author=EV.%20Armbrust&publication_year=2010&journal=BMC%20Bioinformatics&volume=11&pages=538" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1186/1471-2105-11-538" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1186%2F1471-2105-11-538" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1186%2F1471-2105-11-538"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/21034504" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:pplacer%3A%20linear%20time%20maximum-likelihood%20and%20Bayesian%20phylogenetic%20placement%20of%20sequences%20onto%20a%20fixed%20reference%20tree&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B8" class="js-splitview-ref-item" data-legacy-id="msab199-B8"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B8" href="javascript:;" aria-label="jumplink-msab199-B8" 
data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B8" class="ref-content " data-id="msab199-B8"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Merkel</div> <div class="given-names">D.</div></span></span> <div class="year">2014</div>. <div class="article-title">Docker: lightweight Linux containers for consistent development and deployment</div>. <div class="source ">Linux J</div>. <div class="volume">2</div>:<div class="fpage">2</div>.</p><!--citationLinks: case 2--><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Docker%3A%20lightweight%20Linux%20containers%20for%20consistent%20development%20and%20deployment&author=D.%20Merkel&publication_year=2014&journal=Linux%20J&volume=2&pages=2" target="_blank">Google Scholar</a></span></p><div class="xslopenurl empty-target"><span class="js-inst-open-url-holders-nodoi"><a class="js-open-url-link" data-href-template="{targetURL}?sid=oup:orr&genre=article&atitle=Docker%3a+lightweight+Linux+containers+for+consistent+development+and+deployment&aulast=Merkel&title=Linux+J&date=2014&spage=2&volume=2" href="javascript:;"><span class="screenreader-text">OpenURL Placeholder Text</span></a></span></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:Docker%3A%20lightweight%20Linux%20containers%20for%20consistent%20development%20and%20deployment&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B9" class="js-splitview-ref-item" data-legacy-id="msab199-B9"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B9" 
href="javascript:;" aria-label="jumplink-msab199-B9" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B9" class="ref-content " data-id="msab199-B9"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Mirarab</div> <div class="given-names">S</div></span>, <span class="name string-name"><div class="surname">Nguyen</div> <div class="given-names">N</div></span>, <span class="name string-name"><div class="surname">Warnow</div> <div class="given-names">T.</div></span></span> <div class="year">2011</div>. <div class="source ">SEPP: SATé-enabled phylogenetic placement</div>. <div class="publisher-loc">Kohala Coast (HI)</div>: <div class="publisher-name">World Scientific</div>. p. <div class="fpage">247</div>–<div class="lpage">258</div>.</p><!--citationLinks: case 2--><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=SEPP%3A%20SAT%C3%A9-enabled%20phylogenetic%20placement&author=S%20Mirarab&author=N%20Nguyen&author=T.%20Warnow&publication_year=2011&book=SEPP%3A%20SAT%C3%A9-enabled%20phylogenetic%20placement" target="_blank">Google Scholar</a></span></p><p class="citation-links-compatibility"><span class="google-preview-ref-link js-google-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.google.com/search?q=SEPP%3A%20SAT%C3%A9-enabled%20phylogenetic%20placement&btnG=Search+Books&tbm=bks&tbo=1" target="_blank">Google Preview</a></span></p><div class="xslopenurl empty-target"><span class="js-inst-open-url-holders-nodoi"><a class="js-open-url-link" data-href-template="{targetURL}?sid=oup:orr&genre=book&title=SEPP%3a+SAT%c3%a9-enabled+phylogenetic+placement&aulast=Mirarab&date=2011&spage=247&epage=258" href="javascript:;"><span class="screenreader-text">OpenURL Placeholder
Text</span></a></span></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:SEPP%3A%20SAT%C3%A9-enabled%20phylogenetic%20placement&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p><div class="copac-reference-ref-link js-copac-preview-ref-link" style="display:none" data-pubtype="book"><span class="inst-copac"><a class="openInAnotherWindow" target="_blank" href="http://copac.ac.uk/search?ti=SEPP%3A%20SAT%C3%A9-enabled%20phylogenetic%20placement">COPAC</a></span></div> </div></div></div></div></div><div content-id="msab199-B10" class="js-splitview-ref-item" data-legacy-id="msab199-B10"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B10" href="javascript:;" aria-label="jumplink-msab199-B10" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B10" class="ref-content " data-id="msab199-B10"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Mölder</div> <div class="given-names">F</div></span>, <span class="name string-name"><div class="surname">Jablonski</div> <div class="given-names">KP</div></span>, <span class="name string-name"><div class="surname">Letcher</div> <div class="given-names">B</div></span>, <span class="name string-name"><div class="surname">Hall</div> <div class="given-names">MB</div></span>, <span class="name string-name"><div class="surname">Tomkins-Tinch</div> <div class="given-names">CH</div></span>, <span class="name string-name"><div class="surname">Sochat</div> <div class="given-names">V</div></span>, <span class="name string-name"><div class="surname">Forster</div> <div class="given-names">J</div></span>, <span class="name string-name"><div class="surname">Lee</div> <div class="given-names">S</div></span>, <span 
class="name string-name"><div class="surname">Twardziok</div> <div class="given-names">SO</div></span>, <span class="name string-name"><div class="surname">Kanitz</div> <div class="given-names">A</div></span></span>, et al. <div class="year">2021</div>. <div class="article-title">Sustainable data analysis with Snakemake</div>. <div class="source ">F1000Res</div>. <div class="volume">10</div>:<div class="fpage">33</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Sustainable%20data%20analysis%20with%20Snakemake&author=F%20M%C3%B6lder&author=KP%20Jablonski&author=B%20Letcher&author=MB%20Hall&author=CH%20Tomkins-Tinch&author=V%20Sochat&author=J%20Forster&author=S%20Lee&author=SO%20Twardziok&author=A%20Kanitz&publication_year=2021&journal=F1000Res&volume=10&pages=33" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.12688/f1000research.29032.2" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.12688%2Ff1000research.29032.2" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.12688%2Ff1000research.29032.2"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/34035898" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:Sustainable%20data%20analysis%20with%20Snakemake&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p>
</div></div></div></div></div><div content-id="msab199-B11" class="js-splitview-ref-item" data-legacy-id="msab199-B11"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B11" href="javascript:;" aria-label="jumplink-msab199-B11" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B11" class="ref-content " data-id="msab199-B11"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Nayfach</div> <div class="given-names">S</div></span>, <span class="name string-name"><div class="surname">Camargo</div> <div class="given-names">AP</div></span>, <span class="name string-name"><div class="surname">Schulz</div> <div class="given-names">F</div></span>, <span class="name string-name"><div class="surname">Eloe-Fadrosh</div> <div class="given-names">E</div></span>, <span class="name string-name"><div class="surname">Roux</div> <div class="given-names">S</div></span>, <span class="name string-name"><div class="surname">Kyrpides</div> <div class="given-names">NC.</div></span></span> <div class="year">2021</div>. <div class="article-title">CheckV assesses the quality and completeness of metagenome-assembled viral genomes</div>. <div class="source ">Nat Biotechnol</div>. 
<div class="volume">39</div>:<div class="fpage">578</div>–<div class="lpage">585</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=CheckV%20assesses%20the%20quality%20and%20completeness%20of%20metagenome-assembled%20viral%20genomes&author=S%20Nayfach&author=AP%20Camargo&author=F%20Schulz&author=E%20Eloe-Fadrosh&author=S%20Roux&author=NC.%20Kyrpides&publication_year=2021&journal=Nat%20Biotechnol&volume=39&pages=578-585" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1038/s41587-020-00774-7" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1038%2Fs41587-020-00774-7" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1038%2Fs41587-020-00774-7"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/33349699" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:CheckV%20assesses%20the%20quality%20and%20completeness%20of%20metagenome-assembled%20viral%20genomes&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B12" class="js-splitview-ref-item" data-legacy-id="msab199-B12"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B12" href="javascript:;" aria-label="jumplink-msab199-B12" data-id=""></a></span></div><div class="ref false"><div 
id="ref-auto-msab199-B12" class="ref-content " data-id="msab199-B12"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">O’Leary</div> <div class="given-names">NA</div></span>, <span class="name string-name"><div class="surname">Wright</div> <div class="given-names">MW</div></span>, <span class="name string-name"><div class="surname">Brister</div> <div class="given-names">JR</div></span>, <span class="name string-name"><div class="surname">Ciufo</div> <div class="given-names">S</div></span>, <span class="name string-name"><div class="surname">Haddad</div> <div class="given-names">D</div></span>, <span class="name string-name"><div class="surname">McVeigh</div> <div class="given-names">R</div></span>, <span class="name string-name"><div class="surname">Rajput</div> <div class="given-names">B</div></span>, <span class="name string-name"><div class="surname">Robbertse</div> <div class="given-names">B</div></span>, <span class="name string-name"><div class="surname">Smith-White</div> <div class="given-names">B</div></span>, <span class="name string-name"><div class="surname">Ako-Adjei</div> <div class="given-names">D</div></span></span>, et al. <div class="year">2016</div>. <div class="article-title">Reference sequence (RefSeq) database at NCBI: current status, taxonomic expansion, and functional annotation</div>. <div class="source ">Nucleic Acids Res</div>. 
<div class="volume">44</div>(<div class="issue">D1</div>):<div class="fpage">D733</div>–<div class="lpage">D745</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Reference%20sequence%20%28RefSeq%29%20database%20at%20NCBI%3A%20current%20status%2C%20taxonomic%20expansion%2C%20and%20functional%20annotation&author=NA%20O%E2%80%99Leary&author=MW%20Wright&author=JR%20Brister&author=S%20Ciufo&author=D%20Haddad&author=R%20McVeigh&author=B%20Rajput&author=B%20Robbertse&author=B%20Smith-White&author=D%20Ako-Adjei&publication_year=2016&journal=Nucleic%20Acids%20Res&volume=44&pages=D733-D745" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1093/nar/gkv1189" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1093%2Fnar%2Fgkv1189" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1093%2Fnar%2Fgkv1189"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/26553804" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:Reference%20sequence%20%28RefSeq%29%20database%20at%20NCBI%3A%20current%20status%2C%20taxonomic%20expansion%2C%20and%20functional%20annotation&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B13" class="js-splitview-ref-item" data-legacy-id="msab199-B13"><div 
class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B13" href="javascript:;" aria-label="jumplink-msab199-B13" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B13" class="ref-content " data-id="msab199-B13"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Parks</div> <div class="given-names">DH</div></span>, <span class="name string-name"><div class="surname">Imelfort</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Skennerton</div> <div class="given-names">CT</div></span>, <span class="name string-name"><div class="surname">Hugenholtz</div> <div class="given-names">P</div></span>, <span class="name string-name"><div class="surname">Tyson</div> <div class="given-names">GW.</div></span></span> <div class="year">2015</div>. <div class="article-title">CheckM: assessing the quality of microbial genomes recovered from isolates, single cells, and metagenomes</div>. <div class="source ">Genome Res</div>. 
<div class="volume">25</div>(<div class="issue">7</div>):<div class="fpage">1043</div>–<div class="lpage">1055</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=CheckM%3A%20assessing%20the%20quality%20of%20microbial%20genomes%20recovered%20from%20isolates%2C%20single%20cells%2C%20and%20metagenomes&author=DH%20Parks&author=M%20Imelfort&author=CT%20Skennerton&author=P%20Hugenholtz&author=GW.%20Tyson&publication_year=2015&journal=Genome%20Res&volume=25&pages=1043-1055" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1101/gr.186072.114" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1101%2Fgr.186072.114" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1101%2Fgr.186072.114"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/25977477" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:CheckM%3A%20assessing%20the%20quality%20of%20microbial%20genomes%20recovered%20from%20isolates%2C%20single%20cells%2C%20and%20metagenomes&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B14" class="js-splitview-ref-item" data-legacy-id="msab199-B14"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B14" href="javascript:;" 
aria-label="jumplink-msab199-B14" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B14" class="ref-content " data-id="msab199-B14"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Parra</div> <div class="given-names">G</div></span>, <span class="name string-name"><div class="surname">Bradnam</div> <div class="given-names">K</div></span>, <span class="name string-name"><div class="surname">Korf</div> <div class="given-names">I.</div></span></span> <div class="year">2007</div>. <div class="article-title">CEGMA: a pipeline to accurately annotate core genes in eukaryotic genomes</div>. <div class="source ">Bioinformatics</div> <div class="volume">23</div>(<div class="issue">9</div>):<div class="fpage">1061</div>–<div class="lpage">1067</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=CEGMA%3A%20a%20pipeline%20to%20accurately%20annotate%20core%20genes%20in%20eukaryotic%20genomes&author=G%20Parra&author=K%20Bradnam&author=I.%20Korf&publication_year=2007&journal=Bioinformatics&volume=23&pages=1061-1067" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1093/bioinformatics/btm071" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1093%2Fbioinformatics%2Fbtm071" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1093%2Fbioinformatics%2Fbtm071"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/17332020" class="link link-pub-id 
openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:CEGMA%3A%20a%20pipeline%20to%20accurately%20annotate%20core%20genes%20in%20eukaryotic%20genomes&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B15" class="js-splitview-ref-item" data-legacy-id="msab199-B15"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B15" href="javascript:;" aria-label="jumplink-msab199-B15" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B15" class="ref-content " data-id="msab199-B15"><div class="mixed-citation citation"><p class="mixed-citation-compatibility">R Core Team. <div class="year">2020</div>. <div class="source ">R: a language and environment for statistical computing</div>. <div class="publisher-loc">Vienna (Austria)</div>: <div class="publisher-name">R Foundation for Statistical Computing</div>.
Accessed March 22, 2021.</p><!--citationLinks: case 3--><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=R%3A%20a%20language%20and%20environment%20for%20statistical%20computing&publication_year=2020&book=R%3A%20a%20language%20and%20environment%20for%20statistical%20computing" target="_blank">Google Scholar</a></span></p><p class="citation-links-compatibility"><span class="google-preview-ref-link js-google-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.google.com/search?q=R%3A%20a%20language%20and%20environment%20for%20statistical%20computing&btnG=Search+Books&tbm=bks&tbo=1" target="_blank">Google Preview</a></span></p><div class="xslopenurl empty-target"><span class="js-inst-open-url-holders-nodoi"><a class="js-open-url-link" data-href-template="{targetURL}?sid=oup:orr&genre=book&title=R%3a+a+language+and+environment+for+statistical+computing&date=2020" href="javascript:;"><span class="screenreader-text">OpenURL Placeholder Text</span></a></span></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:R%3A%20a%20language%20and%20environment%20for%20statistical%20computing&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p><div class="copac-reference-ref-link js-copac-preview-ref-link" style="display:none" data-pubtype="book"><span class="inst-copac"><a class="openInAnotherWindow" target="_blank" href="http://copac.ac.uk/search?ti=R%3A%20a%20language%20and%20environment%20for%20statistical%20computing">COPAC</a></span></div></div></div></div></div></div><div content-id="msab199-B16" class="js-splitview-ref-item" data-legacy-id="msab199-B16"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B16" 
href="javascript:;" aria-label="jumplink-msab199-B16" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B16" class="ref-content " data-id="msab199-B16"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Saary</div> <div class="given-names">P</div></span>, <span class="name string-name"><div class="surname">Mitchell</div> <div class="given-names">AL</div></span>, <span class="name string-name"><div class="surname">Finn</div> <div class="given-names">RD.</div></span></span> <div class="year">2020</div>. <div class="article-title">Estimating the quality of eukaryotic genomes recovered from metagenomic analysis with EukCC</div>. <div class="source ">Genome Biol</div>. <div class="volume">21</div>(<div class="issue">1</div>):<div class="fpage">244</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Estimating%20the%20quality%20of%20eukaryotic%20genomes%20recovered%20from%20metagenomic%20analysis%20with%20EukCC&author=P%20Saary&author=AL%20Mitchell&author=RD.%20Finn&publication_year=2020&journal=Genome%20Biol&volume=21&pages=244" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1186/s13059-020-02155-4" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1186%2Fs13059-020-02155-4" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1186%2Fs13059-020-02155-4"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/32912302" class="link 
link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:Estimating%20the%20quality%20of%20eukaryotic%20genomes%20recovered%20from%20metagenomic%20analysis%20with%20EukCC&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B17" class="js-splitview-ref-item" data-legacy-id="msab199-B17"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B17" href="javascript:;" aria-label="jumplink-msab199-B17" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B17" class="ref-content " data-id="msab199-B17"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Simão</div> <div class="given-names">FA</div></span>, <span class="name string-name"><div class="surname">Waterhouse</div> <div class="given-names">RM</div></span>, <span class="name string-name"><div class="surname">Ioannidis</div> <div class="given-names">P</div></span>, <span class="name string-name"><div class="surname">Kriventseva</div> <div class="given-names">EV</div></span>, <span class="name string-name"><div class="surname">Zdobnov</div> <div class="given-names">EM.</div></span></span> <div class="year">2015</div>. <div class="article-title">BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs</div>. 
<div class="source ">Bioinformatics</div> <div class="volume">31</div>(<div class="issue">19</div>):<div class="fpage">3210</div>–<div class="lpage">3212</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=BUSCO%3A%20assessing%20genome%20assembly%20and%20annotation%20completeness%20with%20single-copy%20orthologs&author=FA%20Sim%C3%A3o&author=RM%20Waterhouse&author=P%20Ioannidis&author=EV%20Kriventseva&author=EM.%20Zdobnov&publication_year=2015&journal=Bioinformatics&volume=31&pages=3210-3212" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1093/bioinformatics/btv351" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1093%2Fbioinformatics%2Fbtv351" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1093%2Fbioinformatics%2Fbtv351"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/26059717" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:BUSCO%3A%20assessing%20genome%20assembly%20and%20annotation%20completeness%20with%20single-copy%20orthologs&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B18" class="js-splitview-ref-item" data-legacy-id="msab199-B18"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B18" href="javascript:;" 
aria-label="jumplink-msab199-B18" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B18" class="ref-content " data-id="msab199-B18"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Stanke</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Diekhans</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Baertsch</div> <div class="given-names">R</div></span>, <span class="name string-name"><div class="surname">Haussler</div> <div class="given-names">D.</div></span></span> <div class="year">2008</div>. <div class="article-title">Using native and syntenically mapped cDNA alignments to improve de novo gene finding</div>. <div class="source ">Bioinformatics</div> <div class="volume">24</div>(<div class="issue">5</div>):<div class="fpage">637</div>–<div class="lpage">644</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Using%20native%20and%20syntenically%20mapped%20cDNA%20alignments%20to%20improve%20de%20novo%20gene%20finding&author=M%20Stanke&author=M%20Diekhans&author=R%20Baertsch&author=D.%20Haussler&publication_year=2008&journal=Bioinformatics&volume=24&pages=637-644" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1093/bioinformatics/btn013" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1093%2Fbioinformatics%2Fbtn013" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" 
data-targetId="10.1093%2Fbioinformatics%2Fbtn013"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/18218656" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:Using%20native%20and%20syntenically%20mapped%20cDNA%20alignments%20to%20improve%20de%20novo%20gene%20finding&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B19" class="js-splitview-ref-item" data-legacy-id="msab199-B19"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B19" href="javascript:;" aria-label="jumplink-msab199-B19" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B19" class="ref-content " data-id="msab199-B19"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Steinegger</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Söding</div> <div class="given-names">J.</div></span></span> <div class="year">2017</div>. <div class="article-title">MMseqs2 enables sensitive protein sequence searching for the analysis of massive data sets</div>. <div class="source ">Nat Biotechnol</div>. 
<div class="volume">35</div>(<div class="issue">11</div>):<div class="fpage">1026</div>–<div class="lpage">1028</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=MMseqs2%20enables%20sensitive%20protein%20sequence%20searching%20for%20the%20analysis%20of%20massive%20data%20sets&author=M%20Steinegger&author=J.%20S%C3%B6ding&publication_year=2017&journal=Nat%20Biotechnol&volume=35&pages=1026-1028" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1038/nbt.3988" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1038%2Fnbt.3988" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1038%2Fnbt.3988"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/29035372" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:MMseqs2%20enables%20sensitive%20protein%20sequence%20searching%20for%20the%20analysis%20of%20massive%20data%20sets&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B20" class="js-splitview-ref-item" data-legacy-id="msab199-B20"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B20" href="javascript:;" aria-label="jumplink-msab199-B20" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B20" class="ref-content " 
data-id="msab199-B20"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Wadi</div> <div class="given-names">L</div></span>, <span class="name string-name"><div class="surname">Reinke</div> <div class="given-names">AW.</div></span></span> <div class="year">2020</div>. <div class="article-title">Evolution of microsporidia: an extremely successful group of eukaryotic intracellular parasites</div>. <div class="source ">PLoS Pathog</div>. <div class="volume">16</div>(<div class="issue">2</div>):<div class="fpage">e1008276</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=Evolution%20of%20microsporidia%3A%20an%20extremely%20successful%20group%20of%20eukaryotic%20intracellular%20parasites&author=L%20Wadi&author=AW.%20Reinke&publication_year=2020&journal=PLoS%20Pathog&volume=16&pages=e1008276" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1371/journal.ppat.1008276" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1371%2Fjournal.ppat.1008276" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1371%2Fjournal.ppat.1008276"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/32053705" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" 
href="https://www.worldcat.org/search?q=ti:Evolution%20of%20microsporidia%3A%20an%20extremely%20successful%20group%20of%20eukaryotic%20intracellular%20parasites&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B21" class="js-splitview-ref-item" data-legacy-id="msab199-B21"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B21" href="javascript:;" aria-label="jumplink-msab199-B21" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B21" class="ref-content " data-id="msab199-B21"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Waterhouse</div> <div class="given-names">RM</div></span>, <span class="name string-name"><div class="surname">Seppey</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Simão</div> <div class="given-names">FA</div></span>, <span class="name string-name"><div class="surname">Manni</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Ioannidis</div> <div class="given-names">P</div></span>, <span class="name string-name"><div class="surname">Klioutchnikov</div> <div class="given-names">G</div></span>, <span class="name string-name"><div class="surname">Kriventseva</div> <div class="given-names">EV</div></span>, <span class="name string-name"><div class="surname">Zdobnov</div> <div class="given-names">EM.</div></span></span> <div class="year">2018</div>. <div class="article-title">BUSCO applications from quality assessments to gene prediction and phylogenomics</div>. <div class="source ">Mol Biol Evol</div>. 
<div class="volume">35</div>(<div class="issue">3</div>):<div class="fpage">543</div>–<div class="lpage">548</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=BUSCO%20applications%20from%20quality%20assessments%20to%20gene%20prediction%20and%20phylogenomics&author=RM%20Waterhouse&author=M%20Seppey&author=FA%20Sim%C3%A3o&author=M%20Manni&author=P%20Ioannidis&author=G%20Klioutchnikov&author=EV%20Kriventseva&author=EM.%20Zdobnov&publication_year=2018&journal=Mol%20Biol%20Evol&volume=35&pages=543-548" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1093/molbev/msx319" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1093%2Fmolbev%2Fmsx319" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1093%2Fmolbev%2Fmsx319"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/29220515" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:BUSCO%20applications%20from%20quality%20assessments%20to%20gene%20prediction%20and%20phylogenomics&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div><div content-id="msab199-B22" class="js-splitview-ref-item" data-legacy-id="msab199-B22"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B22" href="javascript:;" 
aria-label="jumplink-msab199-B22" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B22" class="ref-content " data-id="msab199-B22"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Wickham</div> <div class="given-names">H.</div></span></span> <div class="year">2009</div>. <div class="source ">ggplot2: elegant graphics for data analysis</div>. <div class="publisher-loc">New York</div>: <div class="publisher-name">Springer-Verlag</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=ggplot2%3A%20elegant%20graphics%20for%20data%20analysis&author=H.%20Wickham&publication_year=2009&book=ggplot2%3A%20elegant%20graphics%20for%20data%20analysis" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1007/978-0-387-98141-3" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1007%2F978-0-387-98141-3" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1007%2F978-0-387-98141-3"> </span></div><p class="citation-links-compatibility"><span class="google-preview-ref-link js-google-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.google.com/search?q=ggplot2%3A%20elegant%20graphics%20for%20data%20analysis&btnG=Search+Books&tbm=bks&tbo=1" target="_blank">Google Preview</a></span></p><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a 
class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:ggplot2%3A%20elegant%20graphics%20for%20data%20analysis&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p><div class="copac-reference-ref-link js-copac-preview-ref-link" style="display:none" data-pubtype="book"><span class="inst-copac"><a class="openInAnotherWindow" target="_blank" href="http://copac.ac.uk/search?ti=ggplot2%3A%20elegant%20graphics%20for%20data%20analysis">COPAC</a></span></div> </div></div></div></div></div><div content-id="msab199-B23" class="js-splitview-ref-item" data-legacy-id="msab199-B23"><div class="refLink-parent"><span class="refLink"><a name="jumplink-msab199-B23" href="javascript:;" aria-label="jumplink-msab199-B23" data-id=""></a></span></div><div class="ref false"><div id="ref-auto-msab199-B23" class="ref-content " data-id="msab199-B23"><div class="mixed-citation citation"><p class="mixed-citation-compatibility"><span class="person-group"><span class="name string-name"><div class="surname">Zdobnov</div> <div class="given-names">EM</div></span>, <span class="name string-name"><div class="surname">Kuznetsov</div> <div class="given-names">D</div></span>, <span class="name string-name"><div class="surname">Tegenfeldt</div> <div class="given-names">F</div></span>, <span class="name string-name"><div class="surname">Manni</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Berkeley</div> <div class="given-names">M</div></span>, <span class="name string-name"><div class="surname">Kriventseva</div> <div class="given-names">EV.</div></span></span> <div class="year">2021</div>. <div class="article-title">OrthoDB in 2020: evolutionary and functional annotations of orthologs</div>. <div class="source ">Nucleic Acids Res</div>. 
<div class="volume">49</div>(<div class="issue">D1</div>):<div class="fpage">D389</div>–<div class="lpage">D393</div>.</p><!--citationLinks: case 1--><div class="citation-links"></div><div class="citation-links"><p class="citation-links-compatibility"><span class="google-scholar-ref-link"><a class="openInAnotherWindow" href="https://scholar.google.com/scholar_lookup?title=OrthoDB%20in%202020%3A%20evolutionary%20and%20functional%20annotations%20of%20orthologs&author=EM%20Zdobnov&author=D%20Kuznetsov&author=F%20Tegenfeldt&author=M%20Manni&author=M%20Berkeley&author=EV.%20Kriventseva&publication_year=2021&journal=Nucleic%20Acids%20Res&volume=49&pages=D389-D393" target="_blank">Google Scholar</a></span></p><div class="crossref-doi js-ref-link"><a class="openInAnotherWindow" href="http://dx.doi.org/10.1093/nar/gkaa1009" target="_blank">Crossref</a></div><div class="adsDoiReference hide"><a class="openInAnotherWindow" href="http://adsabs.harvard.edu/cgi-bin/basic_connect?qsearch=10.1093%2Fnar%2Fgkaa1009" target="_blank">Search ADS</a></div><div class="xslopenurl empty-target"><span class="inst-open-url-holders" data-targetId="10.1093%2Fnar%2Fgkaa1009"> </span></div><div class="pub-id"><a href="http://www.ncbi.nlm.nih.gov/pubmed/33196836" class="link link-pub-id openInAnotherWindow" target="_blank">PubMed</a></div><p class="citation-links-compatibility"><span class="worldcat-reference-ref-link js-worldcat-preview-ref-link" style="display:none"><a class="openInAnotherWindow" href="https://www.worldcat.org/search?q=ti:OrthoDB%20in%202020%3A%20evolutionary%20and%20functional%20annotations%20of%20orthologs&qt=advanced&dblist=638" target="_blank">WorldCat</a></span></p> </div></div></div></div></div></div> <!-- /foreach in Model.Sections --> <div class="widget widget-ArticlePubStateInfo widget-instance-OUP_ArticlePubStateInfo"> </div> <div class="article-metadata-standalone-panel clearfix"></div> <h2 class="authorNotes-section-title" id="authorNotesSectionTitle" 
scrollto-destination="authorNotesSectionTitle">Author notes</h2> <div content-id="msab199-FM1" class="footnote"><span class="fn"><div class="footnote-content"><p class="footnote-compatibility">Mosè Manni, Matthew R Berkeley and Mathieu Seppey contributed equally to this work.</p></div></span></div><div class="copyright copyright-statement">© The Author(s) 2021. Published by Oxford University Press on behalf of the Society for Molecular Biology and Evolution.</div><div class="license"><div class="license-p">This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<a class="link link-uri openInAnotherWindow" href="https://creativecommons.org/licenses/by/4.0/" target="_blank">https://creativecommons.org/licenses/by/4.0/</a>), which permits unrestricted reuse, distribution, and reproduction in any medium, provided the original work is properly cited.</div></div><!-- /foreach --> <span id="UserHasAccess" data-userHasAccess="True"></span> </div><!-- /.widget-items --> </div><!-- /.module-widget --> </div> <div class="widget widget-SolrResourceMetadata widget-instance-OUP_Article_ResourceMetadata_Widget"> <div class="article-metadata-panel solr-resource-metadata js-metadata-panel at-ContentMetadata"> <div class="article-metadata-tocSections"> <div class="article-metadata-tocSections-title">Issue Section:</div> <a href="/mbe/search-results?f_TocHeadingTitleList=Resources">Resources</a> </div> </div> </div> <div class="widget widget-EditorInformation widget-instance-OUP_Article_EditorInformation_Widget"> <div class="wi-editors"> <div class="al-authors-list"> <div class="editor-tag-label"> <span class="editor-role-name">Associate Editor:</span> <span class="al-author-name js-flyout-wrap"> <a class="linked-name js-linked-name stats-author-info-trigger" href="javascript:;">Joanna Kelley</a><span class='delimiter'></span> <span id="info-28817203" class="al-author-info-wrap arrow-up stats-author-info-panel"> <div 
class="info-card-author authorInfo_OUP_Article_EditorInformation_Widget"> <div class="name-role-wrap"> <div class="info-card-name"> Joanna Kelley </div> <div class="info-card-role"> Associate Editor </div> </div> <div class="info-card-search-label"> Search for other works by this author on: </div> <div class="info-card-search info-card-search-internal"> <a href="/mbe/search-results?f_Authors=Joanna+Kelley" rel="nofollow">Oxford Academic</a> </div> <!-- External author searches: spaces in the query strings are percent-encoded so each href is a valid URL --> <div class="info-card-search info-card-search-pubmed"> <a href="http://www.ncbi.nlm.nih.gov/pubmed?cmd=search&term=Kelley%20J">PubMed</a> </div> <div class="info-card-search info-card-search-google"> <a href="http://scholar.google.com/scholar?q=author:%22Kelley%20Joanna%22">Google Scholar</a> </div> </div> </span> </span> <br/> </div> </div> </div> </div> <div id="ContentTabFilteredView"></div> <div class="downloadImagesppt js-download-images-ppt st-download-images-ppt"> <a id="lnkDownloadAllImages" class="js-download-all-images-link btn" href="/DownloadFile/DownloadImage.aspx?image=&PPTtype=SlideSet&ar=6329644&xsltPath=~/UI/app/XSLT&siteId=5325">Download all slides</a> </div> <div class="widget widget-ArticleDataSupplements widget-instance-OUP_Data_Supplements_Tab"> <a name="SupplementalTab" id="SupplementalTab"></a> <li class="section-jump-link head-1 dataSupplements-jumplink"> <div class="section-jump-link__link-wrap"> <a class="jumplink js-jumplink scrollTo" href="#supplementary-data">Supplementary data</a> </div> </li> <h2 scrollto-destination="supplementary-data" id="supplementary-data" class="section-title">Supplementary data</h2> <div class="dataSuppLink"><a 
href="https://oup.silverchair-cdn.com/oup/backfile/Content_public/Journal/mbe/38/10/10.1093_molbev_msab199/1/msab199_supplementary_data.zip?Expires=1735509136&Signature=EQOl7PjcboegfU9mk-udbkLe44JG7cf8Ka-JxBrz-eS9xTNvvrWO94IPmOGH8s5Kju0fbNuHqrhxwNg39cz860BV53Mp48agZHpvQdMuBgDXY8iccjwShdIGFS7i6abDi67GlhVOjjJRlH9EmdvW6cTawpDqE7C~dUuHWsEamAzYRsOkcb16TJPGA9tsXaLxMFlW1nc0Rd0mL2ljKRZZcnYevpok-VYMxJ0TMwZz2aB598N7z9VdSFzUa1VVmdW7eyAoGUBjus5YYgOmdS1YodPM1oRtuldGBb7q2sKF7WY1bpagM7Ha9lbCvICD4gb8HV9rqcqkYtpHLmnaXT2p2g__&Key-Pair-Id=APKAIE5G5CRDK6RD3PGA"><span class="label title-label">msab199_Supplementary_Data</span></a> - zip file</div> </div> <div class="widget widget-ArticleDataRepositories widget-instance-Article_DryadLink"> </div> <div class="comments"> <div class="widget widget-UserCommentBody widget-instance-UserCommentBody_Article"> </div> <div class="widget widget-UserComment widget-instance-OUP_UserComment_Article"> </div> </div> </div> </div> </div> </div> <div id="Sidebar" class="page-column page-column--right"> <div class="widget widget-AdBlock widget-instance-ArticlePageTopSidebar"> <div class="js-adBlock-parent-wrap adblock-parent-wrap"> <div class="adBlockMainBodyTop-wrap js-adBlockMainBodyTop hide"> <div id="adBlockMainBodyTop" class="js-adblock at-adblock" data-lazy-load-margin="150"> <script> googletag.cmd.push(function () { googletag.display('adBlockMainBodyTop'); }); </script> </div> <div class="advertisement-text at-adblock js-adblock-advertisement-text hide">Advertisement</div> </div> </div> </div> <div class="widget widget-dynamic " data-count="1"> <div class="widget-dynamic-inner-wrap"> <div class="widget widget-dynamic " data-count="9"> <div class="widget-dynamic-inner-wrap"> <div class="widget widget-ArticleLevelMetrics widget-instance-Article_RightRailB0Article_RightRail_ArticleLevelMetrics"> <div class="artmet-wrapper horizontal-artmet"> <div class="contentmet-border"> <div class="contentmet-wrapper horizontal-contentmet"> <div 
class="contentmet-citations contentmet-badges-wrap js-contentmet-citations hide"> <h3 class="contentmet-text">Citations</h3> <div class="contentmet-item contentmet-dimensions"> <div class="widget widget-DimensionsBadge widget-instance-ArticleLevelMetrics_DimensionsBadge"> <span class="__dimensions_badge_embed__" data-doi="10.1093/molbev/msab199" data-legend="never" data-style="small_circle" data-hide-zero-citations="false"></span> <script async src="https://badge.dimensions.ai/badge.js" charset="utf-8"></script> </div> </div> </div> <div class="contentmet-views contentmet-badges-wrap js-contentmet-views"> <h3 class="contentmet-text">Views</h3> <div class="contentmet-item circle-text circle-text-views"> <div class="contentmet-number">41,068</div> </div> </div> <div class="contentmet-item contentmet-badges-wrap"> <h3 class="contentmet-text">Altmetric</h3> <div class="contentmet-item contentmet-altmetric"> <div class="widget widget-AltmetricLink widget-instance-ArticleLevelMetrics_AltmetricLinkSummary"> <!-- Altmetrics --> <div id="altmetricEmbedId" runat="server" class='altmetric-embed' data-badge-type="donut" data-hide-no-mentions="false" data-doi="10.1093/molbev/msab199" ></div> <script type='text/javascript' src='https://d1bxh8uas1mnw7.cloudfront.net/assets/embed.js'></script> </div> </div> </div> <div class="contentmet-modal-trigger-wrap clearfix"> <a href="javascript:;" class="artmet-modal-trigger js-artmet-modal-trigger at-alm-metrics-modal-trigger" data-resource-id="6329644" data-resource-type="3"> <img class="contentmet-info-icon" src="//oup.silverchair-cdn.com/UI/app/svg/i.svg" alt="Information"> <span class="contentmet-more-info">More metrics information</span> </a> </div> </div> </div> <div class="artmet-modal js-artmet-modal" id="MetricsModal"> <div class="artmet-modal-contents js-metric-modal-contents at-alm-modal-contents"> <div class="artmet-full-wrap clearfix js-metric-full-wrap hide"> <div class="widget-title-1 artmet-widget-title-1">Metrics</div> 
<div class="artmet-item artmet-views-wrap"> <div class="artmet-views clearfix"> <div class="artmet-total-views"> <span class="artmet-text">Total Views</span> <span class="artmet-number">41,068</span> </div> <div class="artmet-breakdown-views-wrap"> <div class="artmet-breakdown-view breakdown-border"> <span class="artmet-number">32,843</span> <span class="artmet-text">Pageviews</span> </div> <div class="artmet-breakdown-view"> <span class="artmet-number">8,225</span> <span class="artmet-text">PDF Downloads</span> </div> </div> </div> <div class="artmet-views-since">Since 7/1/2021</div> </div> <script> var ChartistData = ChartistData || {}; ChartistData.data = { labels: ['Jul 2021', 'Aug 2021', 'Sep 2021', 'Oct 2021', 'Nov 2021', 'Dec 2021', 'Jan 2022', 'Feb 2022', 'Mar 2022', 'Apr 2022', 'May 2022', 'Jun 2022', 'Jul 2022', 'Aug 2022', 'Sep 2022', 'Oct 2022', 'Nov 2022', 'Dec 2022', 'Jan 2023', 'Feb 2023', 'Mar 2023', 'Apr 2023', 'May 2023', 'Jun 2023', 'Jul 2023', 'Aug 2023', 'Sep 2023', 'Oct 2023', 'Nov 2023', 'Dec 2023', 'Jan 2024', 'Feb 2024', 'Mar 2024', 'Apr 2024', 'May 2024', 'Jun 2024', 'Jul 2024', 'Aug 2024', 'Sep 2024', 'Oct 2024', 'Nov 2024'], series: [[115, 714, 712, 916, 944, 788, 760, 872, 1022, 828, 870, 750, 806, 861, 861, 1013, 972, 731, 946, 1136, 1170, 999, 1025, 999, 1090, 1093, 941, 1160, 1097, 1022, 1306, 1443, 1612, 1297, 1256, 1278, 1194, 1110, 1164, 1322, 873]] }; </script> <div class="artmet-item artmet-chart"> <div class="ct-chart ct-octave js-ct-chart"></div> <div class="artmet-table"> <table> <thead> <tr> <th>Month:</th> <th>Total Views:</th> </tr> </thead> <tbody> <tr> <td>July 2021</td> <td>115</td> </tr> <tr> <td>August 2021</td> <td>714</td> </tr> <tr> <td>September 2021</td> <td>712</td> </tr> <tr> <td>October 2021</td> <td>916</td> </tr> <tr> <td>November 2021</td> <td>944</td> </tr> <tr> <td>December 2021</td> <td>788</td> </tr> <tr> <td>January 2022</td> <td>760</td> </tr> <tr> <td>February 2022</td> <td>872</td> </tr> <tr> 
<td>March 2022</td> <td>1,022</td> </tr> <tr> <td>April 2022</td> <td>828</td> </tr> <tr> <td>May 2022</td> <td>870</td> </tr> <tr> <td>June 2022</td> <td>750</td> </tr> <tr> <td>July 2022</td> <td>806</td> </tr> <tr> <td>August 2022</td> <td>861</td> </tr> <tr> <td>September 2022</td> <td>861</td> </tr> <tr> <td>October 2022</td> <td>1,013</td> </tr> <tr> <td>November 2022</td> <td>972</td> </tr> <tr> <td>December 2022</td> <td>731</td> </tr> <tr> <td>January 2023</td> <td>946</td> </tr> <tr> <td>February 2023</td> <td>1,136</td> </tr> <tr> <td>March 2023</td> <td>1,170</td> </tr> <tr> <td>April 2023</td> <td>999</td> </tr> <tr> <td>May 2023</td> <td>1,025</td> </tr> <tr> <td>June 2023</td> <td>999</td> </tr> <tr> <td>July 2023</td> <td>1,090</td> </tr> <tr> <td>August 2023</td> <td>1,093</td> </tr> <tr> <td>September 2023</td> <td>941</td> </tr> <tr> <td>October 2023</td> <td>1,160</td> </tr> <tr> <td>November 2023</td> <td>1,097</td> </tr> <tr> <td>December 2023</td> <td>1,022</td> </tr> <tr> <td>January 2024</td> <td>1,306</td> </tr> <tr> <td>February 2024</td> <td>1,443</td> </tr> <tr> <td>March 2024</td> <td>1,612</td> </tr> <tr> <td>April 2024</td> <td>1,297</td> </tr> <tr> <td>May 2024</td> <td>1,256</td> </tr> <tr> <td>June 2024</td> <td>1,278</td> </tr> <tr> <td>July 2024</td> <td>1,194</td> </tr> <tr> <td>August 2024</td> <td>1,110</td> </tr> <tr> <td>September 2024</td> <td>1,164</td> </tr> <tr> <td>October 2024</td> <td>1,322</td> </tr> <tr> <td>November 2024</td> <td>873</td> </tr> </tbody> </table> </div> </div> <div class="artmet-stats-wrap clearfix"> <div class="artmet-item artmet-citations hide"> <div class="widget-title-2 artmet-widget-title-2">Citations</div> <div class="artmet-badges-wrap artmet-dimensions"> <div class="widget widget-DimensionsBadge widget-instance-ArticleLevelMetrics_DimensionsBadgeDetails"> <span class="__dimensions_badge_embed__" data-doi="10.1093/molbev/msab199" data-legend="always" data-style="" 
data-hide-zero-citations="false"></span> <script async src="https://badge.dimensions.ai/badge.js" charset="utf-8"></script> </div> <span class="artmet-dimensions-text">Powered by Dimensions</span> </div> <div class="artmet-wos"> <span class="artmet-number"> <a href="https://www.webofscience.com/api/gateway?GWVersion=2&SrcApp=silverchair&SrcAuth=WosAPI&KeyUT=WOS:000715359700041&DestLinkType=CitingArticles&DestApp=WOS_CPL" target="_blank">1,390</a> </span> <span class="artmet-text">Web of Science</span> </div> </div> <div class="artmet-item artmet-altmetric js-show-if-unknown"> <div class="widget-title-2 artmet-widget-title-2">Altmetrics</div> <div class="artmet-badges-wrap js-artmet-badges"> <div class="widget widget-AltmetricLink widget-instance-ArticleLevelMetrics_AltmetricLinkDetails"> <!-- Altmetrics --> <div id="altmetricEmbedId" runat="server" class='altmetric-embed' data-badge-type="donut" data-hide-no-mentions="false" data-doi="10.1093/molbev/msab199" data-badge-details = "right" ></div> <script type='text/javascript' src='https://d1bxh8uas1mnw7.cloudfront.net/assets/embed.js'></script> </div> </div> </div> </div> </div> <a class="artmet-close-modal js-artmet-close-modal">×</a> </div> </div> </div> </div> <!-- Email alerts widget: each trigger link carries exactly one href (a repeated attribute is a parse error and the later copy is ignored) --> <div class="widget widget-Alerts widget-instance-Article_RightRailB0Article_RightRail_Alerts"> <div class="alertsWidget"> <h3>Email alerts</h3> <div class="userAlert alertType-1"> <a href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-alertType="1">Article activity alert</a> </div> <div class="userAlert alertType-3"> <a href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-alertType="3">Advance article alerts</a> </div> <div class="userAlert alertType-5"> <a href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-alertType="5">New issue alert</a> </div> <div class="userAlert alertType-30"> <a 
href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-alertType="30">In progress issue alert</a> </div> <div class="userAlert alertType-MarketingLink"> <a href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-additionalUrl="/my-account/communication-preferences">Receive exclusive offers and updates from Oxford Academic</a> </div> <div class="userAlertSignUpModal reveal-modal small" data-reveal> <div class="userAlertSignUp at-userAlertSignUp"></div> <a href="javascript:;" role="button" aria-label="Close" class="close-reveal-modal"> <i class="icon-general-close"></i> </a> </div> </div> </div> <!-- Secondary email alerts widget: same trigger links as the primary one, minus the article activity alert; one href per link --> <div class="widget widget-Alerts widget-instance-Article_RightRailB0Secondary_RightRail_Alerts"> <div class="alertsWidget"> <h3>Email alerts</h3> <div class="userAlert alertType-3"> <a href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-alertType="3">Advance article alerts</a> </div> <div class="userAlert alertType-5"> <a href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-alertType="5">New issue alert</a> </div> <div class="userAlert alertType-30"> <a href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-alertType="30">In progress issue alert</a> </div> <div class="userAlert alertType-MarketingLink"> <a href="javascript:;" class="js-user-alert" role="button" data-userLoggedIn="False" data-additionalUrl="/my-account/communication-preferences">Receive exclusive offers and updates from Oxford Academic</a> </div> <div class="userAlertSignUpModal reveal-modal small" data-reveal> <div class="userAlertSignUp at-userAlertSignUp"></div> <a href="javascript:;" role="button" aria-label="Close" class="close-reveal-modal"> <i class="icon-general-close"></i> </a> 
</div> </div> </div> <!-- TrendMD container: #trendmd-suggestions is the element named in the TrendMD script configuration in <head> --> <div class="widget widget-TrendMD widget-instance-Article_RightRailB0trendmd"> <div id="trendmd-suggestions"></div> <div class="options" data-suppress-if-hum-is-present="True"></div> </div> <!-- "Citing articles via": external citation lookups, opened in a new tab with rel="noopener" --> <div class="widget widget-ArticleCitedBy widget-instance-Article_RightRailB0Article_RightRail_ArticleCitedBy"> <div class="rail-widget_wrap vt-articles-cited-by"> <h3 class="article-cited-title">Citing articles via</h3> <div class="widget-links_wrap"> <div class="article-cited-link-wrap web-of-science"> <a href="https://www.webofscience.com/api/gateway?GWVersion=2&amp;SrcApp=silverchair&amp;SrcAuth=WosAPI&amp;KeyUT=WOS:000715359700041&amp;DestLinkType=CitingArticles&amp;DestApp=WOS_CPL" target="_blank" rel="noopener">Web of Science (1390)</a> </div> <div class="article-cited-link-wrap google-scholar-url"> <a href="https://scholar.google.com/scholar?q=link:https%3A%2F%2Facademic.oup.com%2Fmbe%2Farticle%2F38%2F10%2F4647%2F6329644" target="_blank" rel="noopener">Google Scholar</a> </div> </div> </div> </div> <!-- Latest / Most Read / Most Cited tabs; data-mode names the pane each tab selects --> <div class="widget widget-ArticleListNewAndPopular widget-instance-Article_RightRailB0Article_RightRail_ArticleNewPopularCombined"> <ul class="articleListNewAndPopularCombinedView"> <li> <h3> <a href="javascript:;" class="articleListNewAndPopular-mode active" data-mode="MostRecent">Latest</a> </h3> </li> <li> <h3> <a href="javascript:;" class="articleListNewAndPopular-mode " data-mode="MostRead">Most Read</a> </h3> </li> <li> <h3> <a href="javascript:;" class="articleListNewAndPopular-mode " data-mode="MostCited">Most Cited</a> </h3> </li> </ul> <section class="articleListNewPopContent articleListNewAndPopular-ContentView-MostRecent hasContent"> <div id="newPopularList-Article_RightRailB0Article_RightRail_ArticleNewPopularCombined" class="fb"> <div class="widget-layout widget-layout--vert "> <div class="widget-columns widget-col-1"> <div class="col"> <div class="widget-dynamic-entry journalArticleItem at-widget-entry-SCL"> <span class="hfDoi" data-attribute="10.1093/molbev/msae243"
aria-hidden="true"></span> <a class="journal-link" href="/mbe/advance-article/doi/10.1093/molbev/msae243/7906539?searchresult=1"> <div class="widget-dynamic-journal-title"> Remarkable evolutionary rate variations among lineages and among genome compartments in malaria parasites of mammals </div> </a> <div class="widget-dynamic-journal-image-synopsis"> <div class="widget-dynamic-journal-synopsis"> </div> </div> </div> <!-- Every entry in this list follows one pattern: a DOI holder span (data-attribute), a title link, and an empty synopsis wrapper --> <div class="widget-dynamic-entry journalArticleItem at-widget-entry-SCL"> <span class="hfDoi" data-attribute="10.1093/molbev/msae242" aria-hidden="true"></span> <a class="journal-link" href="/mbe/advance-article/doi/10.1093/molbev/msae242/7905441?searchresult=1"> <div class="widget-dynamic-journal-title"> Digital image processing to detect adaptive evolution </div> </a> <div class="widget-dynamic-journal-image-synopsis"> <div class="widget-dynamic-journal-synopsis"> </div> </div> </div> <div class="widget-dynamic-entry journalArticleItem at-widget-entry-SCL"> <span class="hfDoi" data-attribute="10.1093/molbev/msae241" aria-hidden="true"></span> <a class="journal-link" href="/mbe/advance-article/doi/10.1093/molbev/msae241/7902053?searchresult=1"> <div class="widget-dynamic-journal-title"> Accurate Inference of the Polyploid Continuum using Forward-time Simulations </div> </a> <div class="widget-dynamic-journal-image-synopsis"> <div class="widget-dynamic-journal-synopsis"> </div> </div> </div> <div class="widget-dynamic-entry journalArticleItem at-widget-entry-SCL"> <span class="hfDoi" data-attribute="10.1093/molbev/msae240" aria-hidden="true"></span> <a class="journal-link" href="/mbe/advance-article/doi/10.1093/molbev/msae240/7896299?searchresult=1"> <div class="widget-dynamic-journal-title"> Diversity of transcriptional regulatory adaptation in <em>E. 
coli</em> </div> </a> <div class="widget-dynamic-journal-image-synopsis"> <div class="widget-dynamic-journal-synopsis"> </div> </div> </div> <div class="widget-dynamic-entry journalArticleItem at-widget-entry-SCL"> <span class="hfDoi" data-attribute="10.1093/molbev/msae208" aria-hidden="true"></span> <a class="journal-link" href="/mbe/advance-article/doi/10.1093/molbev/msae208/7893330?searchresult=1"> <div class="widget-dynamic-journal-title"> Comparative genomics provides insights into adaptive evolution and demographics of bats </div> </a> <div class="widget-dynamic-journal-image-synopsis"> <div class="widget-dynamic-journal-synopsis"> </div> </div> </div> </div> </div> </div></div> </section> <!-- The Most Read and Most Cited panes are emitted empty with class "hide"; presumably filled by script when their tab is chosen (TODO confirm) --> <section class="articleListNewPopContent articleListNewAndPopular-ContentView-MostRead hide"> </section> <section class="articleListNewPopContent articleListNewAndPopular-ContentView-MostCited hide"> </section> </div> <!-- "More from Oxford Academic": subject-taxonomy search links followed by format links --> <div class="widget widget-RelatedTaxonomies widget-instance-Article_RightRailB0Article_RightRail_RelatedTaxonomies"> <div class="widget-related-taxonomies-wrap vt-related-taxonomies"> <div class="widget-related-taxonomies_title">More from Oxford Academic</div> <div class="widget-related-taxonomies"> <a id="more-from-oa-AcademicSubjects_SCI00960" class="related-taxonomies-link" href="/search-results?tax=AcademicSubjects/SCI00960">Biological Sciences</a> </div> <div class="widget-related-taxonomies"> <a id="more-from-oa-AcademicSubjects_SCI01130" class="related-taxonomies-link" href="/search-results?tax=AcademicSubjects/SCI01130">Evolutionary Biology</a> </div> <div class="widget-related-taxonomies"> <a id="more-from-oa-AcademicSubjects_SCI01180" class="related-taxonomies-link" href="/search-results?tax=AcademicSubjects/SCI01180">Molecular and Cell Biology</a> </div> <div class="widget-related-taxonomies"> <a id="more-from-oa-AcademicSubjects_SCI00010" class="related-taxonomies-link" href="/search-results?tax=AcademicSubjects/SCI00010">Science and 
Mathematics</a> </div> <div class="widget-related-taxonomies"> <a id="more-from-oa-format-Books" class="related-taxonomies-link" href="/books">Books</a> </div> <div class="widget-related-taxonomies"> <a id="more-from-oa-format-Journals" class="related-taxonomies-link" href="/journals">Journals</a> </div> </div> </div> </div> </div> </div> </div> <!-- Ad slot: the inline script queues googletag.display() for the div whose id it names; the wrapper is emitted with class "hide" --> <div class="widget widget-AdBlock widget-instance-ArticlePageTopMainBodyBottom"> <div class="js-adBlock-parent-wrap adblock-parent-wrap"> <div class="adBlockMainBodyBottom-wrap js-adBlockMainBodyBottom hide"> <div id="adBlockMainBodyBottom" class="js-adblock at-adblock js-adblock-lazy-loading" data-lazy-load-margin="150"> <script> googletag.cmd.push(function () { googletag.display('adBlockMainBodyBottom'); }); </script> </div> <div class="advertisement-text at-adblock js-adblock-advertisement-text hide">Advertisement</div> </div> </div> </div> </div> </div> <!-- Hidden fields carrying the page title and a left-nav sticky offset value; their consumers are not visible in this part of the file --> <input id="hfArticleTitle" name="hfArticleTitle" type="hidden" value="BUSCO Update: Novel and Streamlined Workflows along with Broader and Deeper Phylogenetic Coverage for Scoring of Eukaryotic, Prokaryotic, and Viral Genomes | Molecular Biology and Evolution | Oxford Academic" /> <input id="hfLeftNavStickyOffset" name="hfLeftNavStickyOffset" type="hidden" value="29" /> </div><!-- /.center-inner-row no-overflow --> </section> </div> <div class="mobile-mask"> </div> <!-- Site footer: begins with the sticky footer ad slot, which has its own close button --> <section class="footer_wrap vt-site-footer"> <div class="ad-banner-footer sticky-footer-ad js-sticky-footer-ad"> <div class="widget widget-AdBlock widget-instance-StickyFooterAd"> <div class="js-adBlock-parent-wrap adblock-parent-wrap"> <div class="adBlockStickyFooter-wrap js-adBlockStickyFooter hide"> <div id="adBlockStickyFooter" class="js-adblock at-adblock" data-lazy-load-margin="150"> <script> googletag.cmd.push(function () { googletag.display('adBlockStickyFooter'); }); </script> </div> <div class="advertisement-text at-adblock js-adblock-advertisement-text hide">Advertisement</div> <button type="button" 
class="close-footer-ad js-close-footer-ad"> <span class="screenreader-text">close advertisement</span> </button> </div> </div> </div> </div> <div class="widget widget-SitePageFooter widget-instance-SitePageFooter"> <!-- Footer ad slot: the inline script queues googletag.display() for #adBlockFooter --> <div class="ad-banner ad-banner-footer"> <div class="widget widget-AdBlock widget-instance-FooterAd"> <div class="js-adBlock-parent-wrap adblock-parent-wrap"> <div class="adBlockFooter-wrap js-adBlockFooter hide"> <div id="adBlockFooter" class="js-adblock at-adblock js-adblock-lazy-loading" data-lazy-load-margin="150"> <script> googletag.cmd.push(function () { googletag.display('adBlockFooter'); }); </script> </div> <div class="advertisement-text at-adblock js-adblock-advertisement-text hide">Advertisement</div> </div> </div> </div> </div> <!-- Journal-level footer: two link lists, then the journal logo linking to the journal home page --> <div class="journal-footer journal-bg"> <div class="center-inner-row"> <div class="journal-footer-menu"> <ul> <li class="link-1"> <a href="/mbe/pages/About">About Molecular Biology and Evolution</a> </li> <li class="link-2"> <a href="/mbe/pages/Editorial_Board">Editorial Board</a> </li> <li class="link-3"> <a href="/mbe/pages/General_Instructions">Author Guidelines</a> </li> <li class="link-4"> <a href="https://www.smbe.org/smbe/">Contact Us</a> </li> <li class="link-5"> <a href="https://www.facebook.com/OUPAcademic">Facebook</a> </li> </ul><ul><li class="link-1"> <a href="https://twitter.com/MolBioEvol">X (formerly Twitter)</a> </li> <li class="link-2"> <a href="https://academic.oup.com/advertising-and-corporate-services/pages/mbe-media-kit">Advertising and Corporate Services</a> </li> <li class="link-3"> <a href="http://medicine-and-health-careernetwork.oxfordjournals.org">Journals Career Network</a> </li> </ul> </div><!-- /.journal-footer-menu --> <div class="journal-footer-affiliations"> <!-- <h3>Affiliations</h3> --> <a href="https://academic.oup.com/mbe"> <img id="footer-logo-MolecularBiologyandEvolution" class="journal-footer-affiliations-logo"
src="//oup.silverchair-cdn.com/data/SiteBuilderAssets/Live/Images/mbe/mbe_f1-1542169774.svg" alt="Molecular Biology and Evolution" /> </a> </div><!-- /.journal-footer-affiliations --> <!-- Colophon: online ISSN and society copyright line --> <div class="journal-footer-colophon"> <ul> <li>Online ISSN 1537-1719</li> <li>Copyright © 2024 Society for Molecular Biology and Evolution</li> </ul> </div><!-- /.journal-footer-colophon --> </div><!-- /.center-inner-row --> </div><!-- /.journal-footer --> </div> <!-- Oxford Academic umbrella footer: a self-serve content widget (identified by the two hidden inputs) holding the link columns --> <div class="oup-footer"> <div class="center-inner-row"> <div class="widget widget-SelfServeContent widget-instance-OupUmbrellaFooterSelfServe"> <input type="hidden" class="SelfServeContentId" value="GlobalFooter_Links" /> <input type="hidden" class="SelfServeVersionId" value="0" /> <div class="oup-footer-row journal-links"> <div class="global-footer selfservelinks"> <ul> <li><a href="/pages/about-oxford-academic">About Oxford Academic</a></li> <li><a href="/pages/about-oxford-academic/publish-journals-with-us">Publish journals with us</a></li> <li><a href="/pages/about-oxford-academic/our-university-press-partners">University press partners</a></li> <li><a href="/pages/what-we-publish">What we publish</a></li> <li><a href="/pages/new-features">New features</a> </li> </ul> </div> <div class="global-footer selfservelinks"> <ul> <li><a href="/pages/authoring">Authoring</a></li> <li><a href="/pages/open-research/open-access">Open access</a></li> <li><a href="/pages/purchasing">Purchasing</a></li> <li><a href="/pages/institutional-account-management">Institutional account management</a></li> <li><a href="https://academic.oup.com/pages/purchasing/rights-and-permissions">Rights and permissions</a></li> </ul> </div> <div class="global-footer selfservelinks"> <ul> <li><a href="/pages/get-help-with-access">Get help with access</a></li> <li><a href="/pages/about-oxford-academic/accessibility">Accessibility</a></li> <li><a href="/pages/contact-us">Contact us</a></li> <li><a href="/pages/advertising">Advertising</a></li> <li><a 
href="/pages/media-enquiries">Media enquiries</a></li> </ul> </div> <div class="global-footer selfservelinks global-footer-external"> <ul> <li><a href="https://global.oup.com/">Oxford University Press</a></li> <li><a href="https://www.mynewsdesk.com/uk/oxford-university-press">News</a></li> <li><a href="https://languages.oup.com/">Oxford Languages</a></li> <li><a href="https://www.ox.ac.uk/">University of Oxford</a></li> </ul> </div> <!-- Mission statement and OUP logo --> <div class="OUP-mission"> <p>Oxford University Press is a department of the University of Oxford. It furthers the University's objective of excellence in research, scholarship, and education by publishing worldwide.</p> <img class="journal-footer-logo" src="//oup.silverchair-cdn.com/UI/app/svg/umbrella/oup-logo.svg" alt="Oxford University Press" width="150" height="42" /> </div> </div> <!-- Legal row: the "Cookie settings" button dispatches a 'changeConsent' event on the top-level document --> <div class="oup-footer-row"> <div class="oup-footer-row-links"> <ul> <li>Copyright © 2024 Oxford University Press</li> <li><button id="Change-Preferences" type="button" onclick="window.top.document.dispatchEvent(new Event('changeConsent'))">Cookie settings</button></li> <li><a href="https://global.oup.com/cookiepolicy">Cookie policy</a></li> <li><a href="https://global.oup.com/privacy">Privacy policy</a></li> <li><a href="/pages/legal-and-policy/legal-notice">Legal notice</a></li> </ul> </div> </div> <style type="text/css"> /* Issue right column fix for tablet/mobile */ @media (max-width: 1200px) { .pg_issue .widget-instance-OUP_Issue { width: 100%; } } .sf-facet-list .sf-facet label, .sf-facet-list .taxonomy-label-wrap label { font-size: 0.9375rem; } .issue-pagination-wrap .pagination-container { float: right; } </style> </div> </div> </div> <div class="ss-ui-only"> </div> </section> </div> <!-- Site-wide modal containers --> <div class="widget widget-SiteWideModals widget-instance-SiteWideModals"> <div id="revealModal" class="reveal-modal" data-reveal> <div id="revealContent"></div> <a class="close-reveal-modal" href="javascript:;"><i class="icon-general-close"></i><span
class="screenreader-text">Close</span></a> </div> <div id="globalModalContainer" class="modal-global-container"> <div id="globalModalContent"> <div class="js-globalModalPlaceholder"></div> </div> <a class="close-modal js-close-modal" href="javascript:;"><i class="icon-general-close"><span class="screenreader-text">Close</span></i></a> </div> <div id="globalModalOverlay" class="modal-overlay js-modal-overlay"></div> <!-- Subscriber-only feature prompt; the register link returns to this article via returnUrl --> <div id="NeedSubscription" class="reveal-modal small" data-reveal> <div class="subscription-needed"> <h5>This Feature Is Available To Subscribers Only</h5> <p><a href="/sign-in">Sign In</a> or <a href="/my-account/register?siteId=5325&amp;returnUrl=%2fmbe%2farticle%2f38%2f10%2f4647%2f6329644">Create an Account</a></p> </div> <a class="close-reveal-modal" href="javascript:;"><i class="icon-general-close"></i><span class="screenreader-text">Close</span></a> </div> <!-- Subscriber-only PDF prompt --> <div id="noAccessReveal" class="reveal-modal tiny" data-reveal> <p>This PDF is available to Subscribers Only</p> <a class="hide-for-article-page" id="articleLinkToPurchase" data-reveal><span>View Article Abstract &amp; Purchase Options</span></a> <div class="issue-purchase-modal"> <p>For full access to this PDF, sign in to an existing account, or purchase an annual subscription.</p> </div> <a class="close-reveal-modal" href="javascript:;"><i class="icon-general-close"></i><span class="screenreader-text">Close</span></a> </div> </div> <!-- MathJax configuration: inline math is delimited by |$ ... $| or \( ... \); it must be defined before the MathJax script below --> <script type="text/javascript"> MathJax = { tex: { inlineMath: [['|$', '$|'], ['\\(', '\\)']] } }; </script> <script id="MathJax-script" async src="https://cdn.jsdelivr.net/npm/mathjax@3/es5/tex-mml-chtml.js"></script> <!-- CookiePro Default Categories --> <!-- When the Cookie Compliance code loads, if cookies for the associated group have consent... it will dynamically change the tag to: script type=text/JavaScript... the code inside the tags will then be recognized and run as normal. 
--> <!-- Page-level extra parameters (event type, disciplines, taxonomy, DOI) exposed as the global NTPT_PGEXTRA; presumably read by the page-tag script loaded below (TODO confirm) --> <script> var NTPT_PGEXTRA = 'event_type=full-text\u0026discipline_ot_level_1=Science and Mathematics\u0026discipline_ot_level_2=Biological Sciences\u0026supplier_tag=SC_Journals\u0026object_type=Article\u0026taxonomy=taxId%3a39%7ctaxLabel%3aAcademicSubjects%7cnodeId%3aSCI01180%7cnodeLabel%3aMolecular+and+Cell+Biology%7cnodeLevel%3a3%3btaxId%3a39%7ctaxLabel%3aAcademicSubjects%7cnodeId%3aSCI01130%7cnodeLabel%3aEvolutionary+Biology%7cnodeLevel%3a3\u0026siteid=molbev\u0026authzrequired=false\u0026doi=10.1093/molbev/msab199'; </script> <!-- Copyright 2001-2010, IBM Corporation All rights reserved. --> <script type="text/javascript" src="//ouptag.scholarlyiq.com/ntpagetag.js" class="optanon-category-C0002"></script> <!-- No-script fallback: 1x1 tracking pixel; alt is empty because the image conveys no content --> <noscript> <img src="//ouptag.scholarlyiq.com/ntpagetag.gif?js=0" height="1" width="1" alt="" /> </noscript> <script type="text/javascript" src="//oup.silverchair-cdn.com/Themes/Client/app/jsdist/v-638669719712896271/site.min.js"></script> <!-- NOTE(review): "latest" is an unpinned third-party build loaded without Subresource Integrity; pin a version and add integrity/crossorigin once the intended version is confirmed --> <script type="text/javascript" src="https://cdn.jsdelivr.net/chartist.js/latest/chartist.min.js"></script> <script type="text/javascript" src="//oup.silverchair-cdn.com/Themes/Client/app/jsdist/v-638669719629345371/article-page.min.js"></script> <div class="ad-banner js-ad-riser ad-banner-riser"> <div class="widget widget-AdBlock widget-instance-RiserAd"> </div> </div> <script src="//oup.silverchair-cdn.com/oup/scm.proxylogging.js"></script> <div class="end-of-page-js"></div> </body> </html>