CINXE.COM

Sequence-based Clustering

<!DOCTYPE html><html lang="en"><head><script src="https://www.googletagmanager.com/gtag/js?id=G-5JMGYPWJRR" async></script><script>//- global rcsb-config object var RC = { googleAnalyticsTrackingId: 'UA-3923365-3' , instance: 'production' , isProductionServer: true , dataUrl: 'https://data.rcsb.org/' , searchUrl: 'https://search.rcsb.org/rcsbsearch/v2/' , alignmentHost: 'https://alignment.rcsb.org' , alignmentUrl: 'https://alignment.rcsb.org/api/v1/' , fileStorageUrl: 'https://user-upload.rcsb.org/v1/' , fileStoragePutEndpoint: 'putMultipart' , fileStorageGetEndpoint: 'download' , sequenceCoordinatesUrl: 'https://1d-coordinates.rcsb.org/' , internalAnalyticsOriginHeaderKey: 'Rcsb-Analytics-Traffic-Origin' , internalAnalyticsOriginHeaderValue: 'internal' , internalAnalyticsStageHeaderKey: 'Rcsb-Analytics-Traffic-Stage' , internalAnalyticsStageHeaderValue: 'production' , MOLSTAR_IMG_URL: 'https://cdn.rcsb.org/images/structures/' }; </script><script src="/search/search-data?ts=5774754"></script><script src="/js/search/react-search.js?ts=5774754"></script><script>!function(){if("performance"in window==0&&(window.performance={}),Date.now=Date.now||function(){return(new Date).getTime()},"now"in window.performance==0){var n=Date.now();performance.timing&&performance.timing.navigationStart&&(n=performance.timing.navigationStart),window.performance.now=function(){return Date.now()-n}}}();(function(){var h="undefined"!=typeof window&&window===this?this:"undefined"!=typeof global&&null!=global?global:this,k="function"==typeof Object.defineProperties?Object.defineProperty:function(a,b,c){a!=Array.prototype&&a!=Object.prototype&&(a[b]=c.value)};function l(){l=function(){};h.Symbol||(h.Symbol=m)}var n=0;function m(a){return"jscomp_symbol_"+(a||"")+n++} function p(){l();var a=h.Symbol.iterator;a||(a=h.Symbol.iterator=h.Symbol("iterator"));"function"!=typeof Array.prototype[a]&&k(Array.prototype,a,{configurable:!0,writable:!0,value:function(){return q(this)}});p=function(){}}function q(a){var b=0;return r(function(){return b<a.length?{done:!1,value:a[b++]}:{done:!0}})}function r(a){p();a={next:a};a[h.Symbol.iterator]=function(){return this};return a}function t(a){p();var b=a[Symbol.iterator];return b?b.call(a):q(a)} function u(a){if(!(a instanceof Array)){a=t(a);for(var b,c=[];!(b=a.next()).done;)c.push(b.value);a=c}return a}var v=0;function w(a,b){var c=XMLHttpRequest.prototype.send,d=v++;XMLHttpRequest.prototype.send=function(f){for(var e=[],g=0;g<arguments.length;++g)e[g-0]=arguments[g];var E=this;a(d);this.addEventListener("readystatechange",function(){4===E.readyState&&b(d)});return c.apply(this,e)}} function x(a,b){var c=fetch;fetch=function(d){for(var f=[],e=0;e<arguments.length;++e)f[e-0]=arguments[e];return new Promise(function(d,e){var g=v++;a(g);c.apply(null,[].concat(u(f))).then(function(a){b(g);d(a)},function(a){b(a);e(a)})})}}var y="img script iframe link audio video source".split(" ");function z(a,b){a=t(a);for(var c=a.next();!c.done;c=a.next())if(c=c.value,b.includes(c.nodeName.toLowerCase())||z(c.children,b))return!0;return!1} function A(a){var b=new MutationObserver(function(c){c=t(c);for(var b=c.next();!b.done;b=c.next())b=b.value,"childList"==b.type&&z(b.addedNodes,y)?a(b):"attributes"==b.type&&y.includes(b.target.tagName.toLowerCase())&&a(b)});b.observe(document,{attributes:!0,childList:!0,subtree:!0,attributeFilter:["href","src"]});return b} function B(a,b){if(2<a.length)return performance.now();var c=[];b=t(b);for(var d=b.next();!d.done;d=b.next())d=d.value,c.push({timestamp:d.start,type:"requestStart"}),c.push({timestamp:d.end,type:"requestEnd"});b=t(a);for(d=b.next();!d.done;d=b.next())c.push({timestamp:d.value,type:"requestStart"});c.sort(function(a,b){return a.timestamp-b.timestamp});a=a.length;for(b=c.length-1;0<=b;b--)switch(d=c[b],d.type){case "requestStart":a--;break;case "requestEnd":a++;if(2<a)return d.timestamp;break;default:throw Error("Internal Error: This should never happen"); }return 0}function C(a){a=a?a:{};this.w=!!a.useMutationObserver;this.u=a.minValue||null;a=window.__tti&&window.__tti.e;var b=window.__tti&&window.__tti.o;this.a=a?a.map(function(a){return{start:a.startTime,end:a.startTime+a.duration}}):[];b&&b.disconnect();this.b=[];this.f=new Map;this.j=null;this.v=-Infinity;this.i=!1;this.h=this.c=this.s=null;w(this.m.bind(this),this.l.bind(this));x(this.m.bind(this),this.l.bind(this));D(this);this.w&&(this.h=A(this.B.bind(this)))} C.prototype.getFirstConsistentlyInteractive=function(){var a=this;return new Promise(function(b){a.s=b;"complete"==document.readyState?F(a):window.addEventListener("load",function(){F(a)})})};function F(a){a.i=!0;var b=0<a.a.length?a.a[a.a.length-1].end:0,c=B(a.g,a.b);G(a,Math.max(c+5E3,b))} function G(a,b){!a.i||a.v>b||(clearTimeout(a.j),a.j=setTimeout(function(){var b=performance.timing.navigationStart,d=B(a.g,a.b),b=(window.a&&window.a.A?1E3*window.a.A().C-b:0)||performance.timing.domContentLoadedEventEnd-b;if(a.u)var f=a.u;else performance.timing.domContentLoadedEventEnd?(f=performance.timing,f=f.domContentLoadedEventEnd-f.navigationStart):f=null;var e=performance.now();null===f&&G(a,Math.max(d+5E3,e+1E3));var g=a.a;5E3>e-d?d=null:(d=g.length?g[g.length-1].end:b,d=5E3>e-d?null:Math.max(d, f));d&&(a.s(d),clearTimeout(a.j),a.i=!1,a.c&&a.c.disconnect(),a.h&&a.h.disconnect());G(a,performance.now()+1E3)},b-performance.now()),a.v=b)} function D(a){a.c=new PerformanceObserver(function(b){b=t(b.getEntries());for(var c=b.next();!c.done;c=b.next())if(c=c.value,"resource"===c.entryType&&(a.b.push({start:c.fetchStart,end:c.responseEnd}),G(a,B(a.g,a.b)+5E3)),"longtask"===c.entryType){var d=c.startTime+c.duration;a.a.push({start:c.startTime,end:d});G(a,d+5E3)}});a.c.observe({entryTypes:["longtask","resource"]})}C.prototype.m=function(a){this.f.set(a,performance.now())};C.prototype.l=function(a){this.f.delete(a)}; C.prototype.B=function(){G(this,performance.now()+5E3)};h.Object.defineProperties(C.prototype,{g:{configurable:!0,enumerable:!0,get:function(){return[].concat(u(this.f.values()))}}});var H={getFirstConsistentlyInteractive:function(a){a=a?a:{};return"PerformanceLongTaskTiming"in window?(new C(a)).getFirstConsistentlyInteractive():Promise.resolve(null)}}; "undefined"!=typeof module&&module.exports?module.exports=H:"function"===typeof define&&define.amd?define("ttiPolyfill",[],function(){return H}):window.ttiPolyfill=H;})();function gtag(){dataLayer.push(arguments)}var logger=function(){"use strict";function n(n){if(n=JSON.stringify(n),"sendBeacon"in navigator)navigator.sendBeacon(t,n);else{var e=new XMLHttpRequest;e.open("POST",t,!1),e.setRequestHeader("Content-Type","text/plain;charset=UTF-8"),e.send(n)}}function e(e,t,i){if(!RC.isProductionServer)switch(e){case"error":case"warn":case"info":i?console[e](t,i):console[e](t);break;default:console.log(t,i)}"error"!==e&&"warn"!==e||(r.push({level:e,msg:t||"",info:Object.assign({},i,{path:window.location.pathname,userAgent:navigator.userAgent})}),r.length>=o&&n(r.splice(0,o)))}var t="/analytics",o=10,r=[];return window.addEventListener("unload",function(){n(r)},!1),{stack:Function.prototype.bind.call(function(n){n&&e("error",n.name+': "'+n.message+'"',{type:n.name,description:n.message,trace:n.stack})}),error:Function.prototype.bind.call(function(n,t){e("error",n,t)}),warn:Function.prototype.bind.call(function(n,t){e("warn",n,t)}),info:Function.prototype.bind.call(function(n,t){e("info",n,t)}),verbose:Function.prototype.bind.call(function(n,t){e("verbose",n,t)}),debug:Function.prototype.bind.call(function(n,t){e("debug",n,t)}),silly:Function.prototype.bind.call(function(n,t){e("silly",n,t)})}}();window.dataLayer=window.dataLayer||[],gtag("js",new Date),gtag("config","G-5JMGYPWJRR"),window.addEventListener("error",function(n){logger.stack(n.error)}),window.addEventListener("unhandledrejection",function(n){n&&n.reason&&logger.error('Unhandled promise rejection: "'+n.reason.message+'"',{type:"PromiseRejection",description:n.reason.message,trace:n.reason.stack})});var gtagFirstMeaningfulPaint=function(){var n=!1;return function(){n?logger.warn('Timing for "firstMeaningfulPaint" already sent'):(console.log("firstMeaningfulPaint",Math.round(performance.now())),n=!0)}}();!function(){"use strict";var n=0;if("PerformanceObserver"in window&&"PerformancePaintTiming"in window){new PerformanceObserver(function(e){e.getEntries().forEach(function(e){if(0===n){e.startTime,e.duration}})}).observe({entryTypes:["paint"]});var e=window.__tti={e:[]};e.o=new PerformanceObserver(function(n){e.e=e.e.concat(n.getEntries())}),e.o.observe({entryTypes:["longtask"]}),ttiPolyfill.getFirstConsistentlyInteractive({}).then(function(n){});new PerformanceObserver(function(n){n.getEntries().forEach(function(n){var e=n.attribution[0]||{},t={containerType:e.containerType,containerName:e.containerName,containerId:e.containerId,containerSrc:e.containerSrc,frameOrigin:n.name,durationMs:n.duration,startTimeMs:n.startTime};n.duration>500&&logger.warn("Long running task, duration "+n.duration.toFixed(2)+"ms.",t)})}).observe({entryTypes:["longtask"]})}var t=performance.now();window.addEventListener("visibilitychange",function(){document.hidden?t=performance.now():n+=performance.now()-t}),window.addEventListener("load",function(){performance.now()}),window.addEventListener("DOMContentLoaded",function(){performance.now()})}();</script><title>Sequence-based Clustering</title><meta http-equiv="Content-Type" content="text/html; charset=UTF-8"><meta property="og:title" content="Sequence-based Clustering"><meta property="og:description" content="As a member of the wwPDB, the RCSB PDB curates and annotates PDB data according to agreed upon standards. The RCSB PDB also provides a variety of tools and resources. Users can perform simple and advanced searches based on annotations relating to sequence, structure and function. These molecules are visualized, downloaded, and analyzed by users who range from students to specialized scientists."><meta property="og:image" content="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/rcsb_logo2.png"><meta name="twitter:card" content="summary_large_image"><meta name="twitter:title" content="Sequence-based Clustering"><meta name="twitter:description" content="As a member of the wwPDB, the RCSB PDB curates and annotates PDB data according to agreed upon standards. The RCSB PDB also provides a variety of tools and resources. Users can perform simple and advanced searches based on annotations relating to sequence, structure and function. These molecules are visualized, downloaded, and analyzed by users who range from students to specialized scientists."><meta name="twitter:image" content="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/rcsb_logo2.png"><meta name="description" content="As a member of the wwPDB, the RCSB PDB curates and annotates PDB data according to agreed upon standards. The RCSB PDB also provides a variety of tools and resources. Users can perform simple and advanced searches based on annotations relating to sequence, structure and function. These molecules are visualized, downloaded, and analyzed by users who range from students to specialized scientists."><meta name="author" content="RCSB Protein Data Bank"><meta name="email" content="info@rcsb.org"><meta name="Charset" content="UTF-8"><meta name="Distribution" content="Global"><meta name="Rating" content="General"><meta http-equiv="content-language" content="en-US"><meta name="viewport" content="width=device-width, initial-scale=1"><meta name="theme-color" content="#5e94c3"><meta class="elastic" name="release_date" content="release.date:undef"><link rel="manifest" href="/manifest.json"><link rel="apple-touch-icon" href="/img/rcsb-apple-touch-icon.jpg"><link rel="stylesheet" href="https://cdn.rcsb.org/javascript/bootstrap/latest/css/bootstrap.min.css"><link rel="stylesheet" href="https://cdn.rcsb.org/javascript/fontawesome/latest/css/font-awesome.min.css"><link rel="stylesheet" href="/build/css/main.css"><link rel="stylesheet" href="/css/search.css?ts=5774754"><script>window.addEventListener('load', function () { // load the JIRA feedback button only after everything else has been loaded var script = document.createElement("script"); script.src = "/js/jira-fdbck.js"; script.type = "text/javascript"; document.getElementsByTagName("head")[0].appendChild(script); var link = document.createElement("link"); link.rel = "stylesheet"; link.href = "https://cdn.rcsb.org/jira-feedback/css/jira-fdbck.css"; document.getElementsByTagName("head")[0].appendChild(link); // load the ekko-lightbox css only after everything else has been loaded var link = document.createElement("link"); link.rel = "stylesheet"; link.href = "/css/ekko-lightbox.css"; document.getElementsByTagName("head")[0].appendChild(link); }); </script><script src="https://cdn.rcsb.org/javascript/jquery/jquery-3.3.1.min.js"></script><script src="https://cdn.rcsb.org/javascript/bootstrap/latest/js/bootstrap.min.js"></script><script src="/js/ekko-lightbox.min.js" defer></script><script>$(document).delegate('*[data-toggle="lightbox"]',"click",function(t){t.preventDefault(),$(this).ekkoLightbox()});$(function(){$(".nav>.dropdown").on("mouseenter",function(o){$(this).addClass("open")}),$(".nav>.dropdown").on("mouseleave",function(o){$(".dropdown").removeClass("open")}),$('[data-toggle="tooltip"]').tooltip()});</script></head><body><div data-elastic-exclude><div data-elastic-exclude><nav class="navbar navbar-inverse navbar-fixed-top hidden-print" id="nav" role="navigation"><div class="hide hidden-print" id="UnsupportedBrowser" style="width: 100%; border-bottom: 2px solid #FFA500; background-color: #FFFFFF; color: #000000; display: inline-block; font-size: .9em; line-height: 2em; text-align: center; font-weight: bold; font-style: italic;"><span class="label label-warning" style="font-size: 100%;">Warning</span> You are using a web browser that we do not support. Our website will not work properly. Please update to a newer version or download a new web browser, such as Chrome or Firefox.</div><div class="container"><div class="row pull-right"><div class="col-sm-12"><div class="input-group"> <a class="button btn btn-sm basic navbar-buttons" href="/help">Help</a><div class="button btn btn-sm basic jira-fdbck-btn navbar-buttons" id="feedbackLink-ContactUs">Contact us</div><div class="navbar-buttons hidden-xs mypdb-style" id="mypdb-menu-container"></div></div></div></div><!-- Brand and toggle get grouped for better mobile display--><div class="navbar-header"><button class="navbar-toggle pull-left" type="button" data-toggle="collapse" data-target="#navbar-collapse-RCSB"><span class="sr-only">Toggle navigation</span><span class="icon-bar"></span><span class="icon-bar"></span><span class="icon-bar"></span></button><a class="navbar-brand" href="/">RCSB PDB</a></div><div class="collapse navbar-collapse" id="navbar-collapse-RCSB" style="max-height: 420px;"><ul class="nav navbar-nav pull-left"><li class="dropdown" id="headnav_deposit"><a class="dropdown-toggle" href="#" data-toggle="dropdown" aria-expanded="false">Deposit&nbsp;<b class="caret"></b></a><div class="dropdown-menu multi-column" id="DepositDropdownNav"><div class="row"><div class="col-xs-12 col-sm-2 col-md-2"><ul class="dropdown-menu" id="head-deposit_prepare"><h4>Prepare Data</h4><li> <a href="https://www.wwpdb.org/deposition/preparing-pdbx-mmcif-files" rel="noopener" target="_blank">PDBx/mmCIF file</a></li><li> <a href="https://pdb-extract.wwpdb.org/" rel="noopener" target="_blank">pdb_extract</a></li><li> <a href="http://sf-tool.wwpdb.org/" rel="noopener" target="_blank">SF-Tool</a></li><li> <a href="http://ligand-expo.rcsb.org/" rel="noopener" target="_blank">Ligand Expo</a></li><li> <a href="https://sw-tools.rcsb.org/apps/MAXIT/index.html" rel="noopener" target="_blank">MAXIT</a></li></ul></div><div class="col-xs-12 col-sm-3 col-md-3"><ul class="dropdown-menu" id="head-deposit_validate"><h4>Validate Data</h4><li> <a href="https://validate-rcsb.wwpdb.org" rel="noopener" target="_blank">Validation Server</a></li><li> <a href="http://www.wwpdb.org/validation/onedep-validation-web-service-interface" rel="noopener" target="_blank">Validation API</a></li><li> <a href="http://www.wwpdb.org/documentation/journals" rel="noopener" target="_blank">Information for Journals</a></li><li> <a href="http://www.wwpdb.org/task/validation-task-forces.php" rel="noopener" target="_blank">Validation Task Forces</a></li></ul></div><div class="col-xs-12 col-sm-3 col-md-3"><ul class="dropdown-menu" id="head-deposit_deposit-data"><h4>Deposit Data</h4><li style="word-break: normal"> <a href="https://deposit.wwpdb.org/deposition/" rel="noopener" target="_blank" style="word-break: normal">wwPDB OneDep System</a></li><li style="word-break: normal"> <a href="https://pdb-dev.wwpdb.org/" rel="noopener" target="_blank" style="word-break: normal">PDB-Dev</a></li></ul></div><div class="col-xs-12 col-sm-2 col-md-3"><ul class="dropdown-menu" id="head-deposit_deposit-help"><h4>Help and Resources</h4><li> <a href="http://www.wwpdb.org/deposition/faq" rel="noopener" target="_blank">Deposit FAQ</a></li><li> <a href="http://www.wwpdb.org/validation/2017/FAQs" rel="noopener" target="_blank">Validation FAQ</a></li><li> <a href="http://www.wwpdb.org/deposition/tutorial" rel="noopener" target="_blank">Tutorials</a></li><li> <a href="http://www.wwpdb.org/documentation/policy" rel="noopener" target="_blank">Annotation Policies</a></li><li> <a href="http://www.wwpdb.org/documentation/procedure" rel="noopener" target="_blank">Processing Procedures</a></li><li> <a href="https://mmcif.wwpdb.org/" rel="noopener" target="_blank">PDBx/mmCIF Dictionary</a></li><li> <a href="https://mmcif.wwpdb.org/docs/user-guide/guide.html" rel="noopener" target="_blank">PDBx/mmCIF User Guide</a></li><li> <a href="https://www.wwpdb.org/data/ccd" rel="noopener" target="_blank">Chemical Component Dictionary</a></li><li> <a href="https://www.wwpdb.org/data/bird" rel="noopener" target="_blank">Biologically Interesting Molecule Reference Dictionary (BIRD)</a></li><li> <a href="https://biosync.sbkb.org/" rel="noopener" target="_blank">BioSync/Beamlines/Facilities</a></li><li> <a href="https://sw-tools.rcsb.org/" rel="noopener" target="_blank">Related Tools</a></li></ul></div></div></div></li><li class="dropdown" id="headnav_search"><a class="dropdown-toggle" href="#" data-toggle="dropdown">Search&nbsp;<b class="caret"></b></a><ul class="dropdown-menu"><li><a href="/search/advanced" rel="noopener">Advanced Search</a></li><li><a href="/search/advanced/sequence" rel="noopener">Sequence Similarity Search</a></li><li><a href="/search/advanced/structure" rel="noopener">Structure Similarity Search</a></li><li><a href="/search/advanced/chemical" rel="noopener">Chemical Similarity Search</a></li><li><a href="/chemical-sketch" rel="noopener">Chemical Sketch Tool</a></li><li><a href="/search/browse/atc" rel="noopener">Browse by Annotations</a></li><li><a href="/search?query=%7B%22parameters%22%3A%7B%22attribute%22%3A%22rcsb_accession_info.initial_release_date%22%2C%22operator%22%3A%22range%22%2C%22value%22%3A%7B%22from%22%3A%22now-1w%22%2C%22include_lower%22%3Afalse%2C%22to%22%3A%22now%22%2C%22include_upper%22%3Atrue%7D%7D%7D" rel="noopener">New Entries</a></li><li><a href="/pages/unreleased" rel="noopener">Unreleased Entries</a></li><li><a href="/stats" rel="noopener">PDB Statistics</a></li></ul></li><li class="dropdown" id="headnav_visualize"><a class="dropdown-toggle" href="#" data-toggle="dropdown">Visualize&nbsp;<b class="caret"></b></a><ul class="dropdown-menu"> <li><a href="/3d-view" rel="noopener">Mol* (MolStar)</a></li><li><a href="/docs/sequence-viewers/sequence-annotations-viewer" rel="noopener">Sequence Annotations Viewer</a></li><li><a href="/docs/sequence-viewers/genome-view" rel="noopener">Genome View</a></li></ul></li><li class="dropdown" id="headnav_analyze"><a class="dropdown-toggle" href="#" data-toggle="dropdown">Analyze&nbsp;<b class="caret"></b></a><ul class="dropdown-menu"><li><a href="/alignment" rel="noopener">Pairwise Structure Alignment</a></li><li><a href="/docs/general-help/symmetry-resources-in-the-pdb" rel="noopener">Symmetry Resources in the PDB</a></li><li><a href="https://www.wwpdb.org/validation/validation-reports" rel="noopener" target="_blank">Structure Quality </a></li><li><a href="/docs/grouping-structures/overview-grouping-structures" rel="noopener">Grouping Structures</a></li><li><a href="https://cdn.rcsb.org/rcsb-pdb/pdb50mesh/index.html" rel="noopener" target="_blank">PDB Citation MeSH Network Explorer </a></li><li><a href="/stats" rel="noopener">PDB Statistics</a></li><li><a href="https://www.eppic-web.org" rel="noopener" target="_blank">EPPIC Biological Assemblies </a></li><li class="extraList">External Data and Resources </li><li class="extraMargin"><a href="/docs/general-help/data-from-external-resources-integrated-into-rcsb-pdb" rel="noopener">Integrated Resources </a></li><li class="extraMargin"><a href="/docs/additional-resources/databases-and-knowledgebases" rel="noopener">Additional Resources </a></li></ul></li><li class="dropdown hidden-xs hidden-sm" id="headnav_download"><a class="dropdown-toggle" href="#" data-toggle="dropdown">Download&nbsp;<b class="caret"></b></a><ul class="dropdown-menu"> <li><a href="/downloads" rel="noopener">Coordinates and Experimental Data</a></li><li><a href="/downloads/fasta" rel="noopener">Sequences</a></li><li><a href="/downloads/ligands" rel="noopener">Ligands</a></li><li><a href="/docs/programmatic-access/file-download-services" rel="noopener">File Download Services</a></li><li><a href="/docs/programmatic-access/web-apis-overview" rel="noopener">Web APIs</a></li></ul></li><li class="dropdown" id="headnav_learn"><a class="dropdown-toggle" href="#" data-toggle="dropdown">Learn&nbsp;<b class="caret"></b></a><ul class="dropdown-menu"><h4><a href="http://pdb101.rcsb.org" target="_blank" rel="noopener"><img class="image_submenu" src="https://cdn.rcsb.org/rcsb-pdb/v2/home/images/menuImgs/pdb101Logo.png"></a></h4><li><a href="https://pdb101.rcsb.org/train/training-events" rel="noopener" target="_blank">Training Courses </a></li><li><a href="https://pdb101.rcsb.org/learn/guide-to-understanding-pdb-data/introduction" rel="noopener" target="_blank">Guide to PDB Data </a></li><li><a href="https://pdb101.rcsb.org/motm/motm-by-date" rel="noopener" target="_blank">Molecule of the Month </a></li><li><a href="https://pdb101.rcsb.org/learn/paper-models" rel="noopener" target="_blank">Educational Resources </a></li><li><a href="https://pdb101.rcsb.org/teach/overview" rel="noopener" target="_blank">Curricula </a></li><li><a href="https://pdb101.rcsb.org/browse" rel="noopener" target="_blank">Browse </a></li><li><a href="https://pdb101.rcsb.org/news/2023" rel="noopener" target="_blank">News </a></li><li class="extraList">SciArt Galleries </li><li class="extraMargin"><a href="https://pdb101.rcsb.org/sci-art/geis-archive/gallery-by-name" rel="noopener" target="blank">Irving Geis </a></li><li class="extraMargin"><a href="https://pdb101.rcsb.org/sci-art/goodsell-gallery" rel="noopener" target="blank">David Goodsell </a></li></ul></li><li class="dropdown" id="headnav_more"><a class="dropdown-toggle" href="#" data-toggle="dropdown">About&nbsp;<b class="caret"></b></a><ul class="dropdown-menu"><li><a href="/pages/contactus" rel="noopener">Contact Us</a></li><li><a href="/pages/about-us/index" rel="noopener">About RCSB PDB</a></li><li><a href="/pages/about-us/mission" rel="noopener">Vision and Mission</a></li><li><a href="/pages/policies" rel="noopener">Citation, Usage, Privacy Policies, Logo</a></li><li><a href="/pages/news" rel="noopener">News</a></li><li><a href="/pages/about-us/history" rel="noopener">PDB History</a></li><li><a href="/pages/pdb50" rel="noopener">PDB50</a></li><li><a href="/pages/about-us/pdb-user-community" rel="noopener">User Community</a></li><li><a href="/pages/publications" rel="noopener">Publications</a></li><li><a href="/pages/advisory-committee" rel="noopener">RCSB PDB Advisory Committee</a></li><li><a href="/pages/team" rel="noopener">Team Members</a></li><li><a href="/pages/about-us/deia" rel="noopener">Diversity, Equity, Inclusion, and Access</a></li><li><a href="https://status.rcsb.org/" rel="noopener" target="_blank">Service Status </a></li></ul></li><li class="nodropdown"><a class="dropdown-toggle" href="/pages/jobs">Careers</a></li><li class="nodropdown"><a class="dropdown-toggle" href="/news/feature/5e74d55d2d410731e9944f52">COVID-19</a></li><li class="dropdown visible-xs"><div id="socialmedia_section_mobile"><ul class="fa-ul hidden-print"><li><a href="https://www.facebook.com/RCSBPDB" target="_blank" rel="noopener" title="Facebook" data-placement="top" data-toggle="tooltip"><i class="fa fa-facebook-square fa-lg"></i></a></li><li><a href="https://twitter.com/buildmodels" target="_blank" rel="noopener" title="Twitter" data-placement="top" data-toggle="tooltip"><i class="fa fa-twitter fa-lg"></i></a></li><li><a href="https://www.youtube.com/user/RCSBProteinDataBank" target="_blank" rel="noopener" title="YouTube" data-placement="top" data-toggle="tooltip"><i class="fa fa-youtube-play fa-lg"></i></a></li><li><a href="https://github.com/rcsb" target="_blank" rel="noopener" title="Github" data-placement="top" data-toggle="tooltip"><i class="fa fa-github fa-lg"></i></a></li><li><a href="https://www.linkedin.com/company/rcsb-protein-data-bank" target="_blank" rel="noopener" title="LinkedIn" data-placement="top" data-toggle="tooltip"><i class="fa fa-linkedin fa-lg"></i></a></li></ul></div></li></ul></div></div></nav></div><style>#PDBmembers li {margin-right: 15px; } </style><div data-elastic-exclude><div id="header"><div class="container"><div class="row" style="margin-bottom: 0px;"><div class="col-md-6 col-lg-5 hidden-sm hidden-xs" id="logo_container" style="padding-bottom: 15px;"><table class="header-left"><tr><td><a href="/"><img id="rcsblogo" src="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/rcsb_logo.png" alt="RCSB PDB"></a></td><td><table id="header-counts"><tr><td><div class="results-content-type-sm experimental"><span class="fa fa-flask" data-toggle="tooltip" data-placement="right" data-original-title="Experimental PDB Structure"></span></div></td><td><a href="/search?request=%7B%22query%22%3A%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22terminal%22%2C%22service%22%3A%22text%22%2C%22parameters%22%3A%7B%22attribute%22%3A%22rcsb_entry_info.structure_determination_methodology%22%2C%22operator%22%3A%22exact_match%22%2C%22value%22%3A%22experimental%22%7D%7D%5D%2C%22logical_operator%22%3A%22and%22%7D%5D%2C%22logical_operator%22%3A%22and%22%2C%22label%22%3A%22text%22%7D%5D%2C%22logical_operator%22%3A%22and%22%7D%2C%22return_type%22%3A%22entry%22%2C%22request_options%22%3A%7B%22scoring_strategy%22%3A%22combined%22%2C%22results_content_type%22%3A%5B%22experimental%22%5D%7D%7D" style="font-weight: bold; font-size: 110%">227,561</a><span>&nbsp;Structures from the PDB</span></td></tr><tr><td><div class="results-content-type-sm computational"><span class="fa fa-desktop" data-toggle="tooltip" data-placement="right" data-original-title="Computed Structure Model"></span></div></td><td><a href="/search?request=%7B%22query%22%3A%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22terminal%22%2C%22service%22%3A%22text%22%2C%22parameters%22%3A%7B%22attribute%22%3A%22rcsb_entry_info.structure_determination_methodology%22%2C%22operator%22%3A%22exact_match%22%2C%22value%22%3A%22computational%22%7D%7D%5D%2C%22logical_operator%22%3A%22and%22%7D%5D%2C%22logical_operator%22%3A%22and%22%2C%22label%22%3A%22text%22%7D%5D%2C%22logical_operator%22%3A%22and%22%7D%2C%22return_type%22%3A%22entry%22%2C%22request_options%22%3A%7B%22scoring_strategy%22%3A%22combined%22%2C%22results_content_type%22%3A%5B%22computational%22%5D%7D%7D" style="font-weight: bold; font-size: 110%">1,068,577</a><span>&nbsp;Computed Structure Models (CSM)</span></td></tr></table></td></tr></table></div><div class="col-sm-12 col-md-6 col-lg-7 hidden-print" id="search-bar-container"></div></div></div><div class="logos_bcg"><div class="container"><ul class="hidden-xs hidden-print" id="PDBmembers"><li><span data-toggle="tooltip" data-placement="right" data-original-title="PDB-101: Training and outreach portal of RCSB PDB"><a href="https://pdb101.rcsb.org/"><img id="pdb101logo" src="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/pdb101-truncated.png" alt="PDB-101"></a></span></li><li><span data-toggle="tooltip" data-placement="right" data-original-title="wwPDB: Worldwide Protein Data Bank"><a href="https://www.wwpdb.org/" target="_blank" rel="noopener"><img id="wwpdblogo" src="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/wwpdb-truncated.png" alt="wwPDB"></a></span></li><li><span data-toggle="tooltip" data-placement="right" data-original-title="EMDataResource: 3DEM resources"><a href="https://www.emdataresource.org" target="_blank" rel="noopener"><img id="emdatabanklogo" src="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/emdb-truncated.png" alt="EMDataResource"></a></span></li><li><span data-toggle="tooltip" data-placement="right" data-original-title="NAKB: Nucleic Acid Knowledgebase"><a href="https://nakb.org/" target="_blank" rel="noopener"><img id="nakblogo" src="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/nakb-logo.png" alt="NAKB: Nucleic Acid Knowledgebase"></a></span></li><li><span data-toggle="tooltip" data-placement="right" data-original-title="wwPDB Foundation: Donate to support wwPDB outreach activities"><a href="https://foundation.wwpdb.org/" target="_blank" rel="noopener"><img id="wwpdbfoundationlogo" src="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/foundation-truncated.png" alt="wwPDB Foundation"></a></span></li><li><span data-toggle="tooltip" data-placement="right" data-original-title="PDB-Dev: Prototype Archiving System for Integrative Structures"><a href="https://pdb-dev.wwpdb.org/" target="_blank" rel="noopener"><img id="pdbdevlogo" src="https://cdn.rcsb.org/rcsb-pdb/v2/common/images/pdb-dev-logo.png" alt="PDB-Dev Logo"></a></span></li></ul><div id="socialmedia_section"><ul class="fa-ul hidden-print"><li><a href="https://www.facebook.com/RCSBPDB" target="_blank" rel="noopener" title="Facebook" data-placement="top" data-toggle="tooltip"><i class="fa fa-facebook-square fa-lg"></i></a></li><li><a href="https://twitter.com/buildmodels" target="_blank" rel="noopener" title="Twitter" data-placement="top" data-toggle="tooltip"><i class="fa fa-twitter fa-lg"></i></a></li><li><a href="https://www.youtube.com/user/RCSBProteinDataBank" target="_blank" rel="noopener" title="YouTube" data-placement="top" data-toggle="tooltip"><i class="fa fa-youtube-play fa-lg"></i></a></li><li><a href="https://github.com/rcsb" target="_blank" rel="noopener" title="Github" data-placement="top" data-toggle="tooltip"><i class="fa fa-github fa-lg"></i></a></li><li><a href="https://www.linkedin.com/company/rcsb-protein-data-bank" target="_blank" rel="noopener" title="LinkedIn" data-placement="top" data-toggle="tooltip"><i class="fa fa-linkedin fa-lg"></i></a></li></ul></div></div></div></div></div><div class="container" id="maincontentcontainer"><style>p {font-size: 16px} ul li {font-size: 16px} div#docs-container { margin: 0; } span.glyphicon-new-window { font-size: 10px; } div .main-heading h1{ margin-top: 0; } div#helpmenu .small-menu { text-align: right; white-space: nowrap; /* Prevent text wrapping */ } div#helpmenu .small-menu p{ font-size: 15px; } div#helpmenu .small-menu a{ color: #325880; } div#helpmenu .divider { color: #5E5D5D; padding: 0 8px; } /* menu */ div#menu { border-bottom: 1px solid #ddd; } div#menu a { text-decoration: none; } div#menu-header { border-top: 1px solid #ddd; padding: 4px; } div.group { background-color: #f9f9f9; cursor: pointer; border-top: 1px solid #ddd; padding: 4px 0; } div.group table, div.group td:first-child, div.item table, div.item td:first-child { width: 100%; } div.item td { color: #337ab7; border-top: 1px solid #ddd; padding: 4px; } span.glyphicon-triangle-top, span.glyphicon-triangle-bottom { font-size: 8px; color: #666; } span.glyphicon-chevron-right { font-size: 10px; color: #337ab7; } /* add media query for mobile view */ @media (max-width: 768px) { /* optionally hide toggle icons on mobile */ span.glyphicon-triangle-top, span.glyphicon-triangle-bottom { display: none; } } /* item */ h5.menu-path { color: #666; } /* note: css defined here needs to be in sync with CMS Editor - TODO create a shared file on the CDN? */ a.content-anchor { display: block; position: relative; visibility: hidden; top: -60px; } table.content-resources { width: 100%; border-collapse: collapse; } table.content-resources td { border: 1px solid #ddd; vertical-align: top; padding: 5px; } td.content-img-caption { font-size: 16px; font-style: italic; padding: 5px 0; } img.content-img-border { border: 1px solid #ccc; } div.item-info { font-style: italic; font-size: 16px; color: #888; } div.ekko-lightbox div.modal-dialog { width: auto; max-width: 1170px; } </style><script>// groupMap passed from routes/docs.js var groupMap = {"5fca9f91eb210c2c564f0d7c":{"_id":"5fca9f91eb210c2c564f0d7c","depth":0,"name":"General Help","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["5fc537b03fb4b83beba83b23","5fc51a863fb4b83beb6e959f","63002035b05c2fccc1804d67","62d9b56b35ec5bb4ddb19a42","6003401bcff89d5fc8f8a3f3","6140b307ef055f03d1f222d2","60b686d701b8e50720f2ca63","6018251aecb9a74be53123a7","5fce4e38eb210c2c56790636","5fce5135eb210c2c567d7ab2","600756cec5ab5836659ab2e5","60ebb04e0882a5597783cc03","6080bf66ec901916050494bd","6005be80cff89d5fc8f8a3f5","5ff90b5af32c497fd6f7bf62","67224602e095838a1ce7d99f"],"show":true},"5fbe8e183fb4b83beb4d0e39":{"_id":"5fbe8e183fb4b83beb4d0e39","depth":0,"name":"Search and Browse","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["60006df7ae9f8477226a6c82","5ffde6ee3a38a923c3516cf2","60083954244a4309df45ad46","602c55d11a359e6e2d4a6ea7","6000bab4d3c1ff0cf1f44f48"],"show":true},"60083954244a4309df45ad46":{"_id":"60083954244a4309df45ad46","depth":1,"name":"Advanced Search","parent_id":"5fbe8e183fb4b83beb4d0e39","type":"group","_ids":["5ffde93f3a38a923c3516cf3","5fbecb613fb4b83bebb5e353","600b08bec5ab5836659ab2e9","5ffde9d03a38a923c3516cf5","5ffdeaf53a38a923c3516cf6","5ffe9c743a38a923c3516cfb","600b3277c5ab5836659ab2ea","5ffe9da13a38a923c3516cfc","602c2b653fed9e549afd7917","600061f0ae9f8477226a6c81"]},"602c55d11a359e6e2d4a6ea7":{"_id":"602c55d11a359e6e2d4a6ea7","depth":1,"name":"Browse Options","parent_id":"5fbe8e183fb4b83beb4d0e39","type":"group","_ids":["602c53f43fed9e549afd7918","602c56893fed9e549afd791a","602c56b23fed9e549afd791b","646f8b661d621d75127a7a53","602c57773fed9e549afd791f","602c59ab3fed9e549afd7922","65d93e6f72841524659883e1","61410115ef055f03d1f222d3","602c59da3fed9e549afd7923","602c59f53fed9e549afd7924","602c57cf3fed9e549afd7921","6080adaaec901916050494bc","602c57ae3fed9e549afd7920","602c5a1e3fed9e549afd7925","602c57133fed9e549afd791d","602c57603fed9e549afd791e","6141014def055f03d1f222d4","602c56f13fed9e549afd791c"]},"618271c92a7d828464a7d146":{"_id":"618271c92a7d828464a7d146","depth":0,"name":"Exploring a 3D Structure","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["618274c904fb9835c6ae189a","618271f904fb9835c6ae1892","6182729704fb9835c6ae1893","618272c004fb9835c6ae1894","618272e004fb9835c6ae1895","618272fb04fb9835c6ae1896","6182730904fb9835c6ae1897","6182731a04fb9835c6ae1898","6182732a04fb9835c6ae1899"],"show":true},"6256b2b3b4396e45e97bf3de":{"_id":"6256b2b3b4396e45e97bf3de","depth":0,"name":"Grouping Structures","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["62fbafaf3b6e49562fa5c055","6081c10aec901916050494be","6256b3269c3931864b07285b","6256b35e9c3931864b07285c","6364336066d6046810db7f11"],"show":true,"open":true},"5fd3e3a6eb210c2c5632d098":{"_id":"5fd3e3a6eb210c2c5632d098","depth":0,"name":"3D Viewers","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["5f98cc9614cc37a34de620ea","60075352c5ab5836659ab2e3","65a4b499c76ca3abcc925d0d"],"show":true},"5f98cc9614cc37a34de620ea":{"_id":"5f98cc9614cc37a34de620ea","depth":1,"name":"Mol*","parent_id":"5fd3e3a6eb210c2c5632d098","type":"group","_ids":["5ee0fc4d25aa7b208a9fe39e","5ee107b225aa7b208a9fe3a1","5ee10ad725aa7b208a9fe3a2","5ee1046625aa7b208a9fe3a0","5ee1192f25aa7b208a9fe3a3","5ee13ac17f50f44e6aa4fb1f","5ee231607f50f44e6aa4fb20","5ee253237f50f44e6aa4fb22"]},"5fd3e3f4eb210c2c56332c65":{"_id":"5fd3e3f4eb210c2c56332c65","depth":0,"name":"Sequence Viewers","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["60103d1ab1afe64903398251","60342ff52087e87def0d0b09","5fc7f2843fb4b83beb6a7a3d","60182dc1ecb9a74be53123aa"],"show":true},"60132e62aeeea33d3f095fa8":{"_id":"60132e62aeeea33d3f095fa8","depth":0,"name":"Tools","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["60132e6a610d04019e01d4c2"],"show":true},"601024f3244a4309df5d6630":{"_id":"601024f3244a4309df5d6630","depth":0,"name":"Additional Resources","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["6010260ee244795fc6dcb836","6010260ee244795fc6dcb839","6010260ee244795fc6dcb838","63ee50cac031758bf1c30ff4","60135c8f236b8b22a9824a4a","6010260ee244795fc6dcb83a","6010260ee244795fc6dcb83d","6010260ee244795fc6dcb83c","6168521eef055f03d1f2231b","60102b1ab1afe6490339824f","6010260ee244795fc6dcb83e","6317770e831916e52206a1ea","63dc03c2c031758bf1c30ff0","6010260ee244795fc6dcb837"],"show":true},"600217ee5b6ad53203751b79":{"_id":"600217ee5b6ad53203751b79","depth":0,"name":"Programmatic Access","parent_id":"5fd18dfceb210c2c5634aead","type":"group","_ids":["602d94713fed9e549afd7926","60398336fec59804432bfc37","60183326ecb9a74be53123ab","610337d7ef055f03d1f222b9","60033e6ccff89d5fc8f8a3f2"],"show":true}} //log(groupMap, 'groupMap') // open/close group function toggle(_id) { var group = groupMap[_id] , _ids = group._ids // list of child _ids of this group , open = (group.open) ? true : false if (open) { closeGroup(group) // close group and all descendants } else { for (var i = 0, n = _ids.length; i < n; i++) $('#' + _ids[i]).removeClass('hidden').addClass('show') group.open = true $('#glyph' + _id).removeClass('glyphicon-triangle-bottom').addClass('glyphicon-triangle-top') } } // recursive function to close all descendants of a group function closeGroup(group) { if (group.open) { var _ids = group._ids // list of child _ids of this group for (var i = 0, n = _ids.length; i < n; i++) { var _id = _ids[i] $('#' + _id).removeClass('show').addClass('hidden') if (groupMap[_id]) closeGroup(groupMap[_id]) // recursive call } group.open = false $('#glyph' + group._id).removeClass('glyphicon-triangle-top').addClass('glyphicon-triangle-bottom') } } // log obj or primitive function log(o, s) { if (!s) s = typeof s if (typeof o === 'object') console.log(s + '=' + JSON.stringify(o, null, 2)) else console.log(s + '=' + o) } // function to close all open groups for mobile view function closeAllGroups() { for (var id in groupMap) { var group = groupMap[id]; if (group.open) { closeGroup(group); // Close the group if it's open } } } // function to check the screen size and close groups on mobile function handleResize() { var isMobileView = window.innerWidth <= 768; // mobile view threshold if (isMobileView) { closeAllGroups(); // close all groups if in mobile view } } // call handleResize on initial load and on window resize window.onload = handleResize; window.onresize = handleResize; </script><div id="docs-container"><div class="row"><div class="col-sm-9 main-heading"><h1>RCSB PDB Help</h1></div><div id="helpmenu"><div class="col-sm-3 small-menu"><p><i class="fa fa-home" aria-hidden="true"></i>&nbsp<a href="/help">Help Topics</a><span class="divider">| </span><i class="fa fa-question-circle" aria-hidden="true"></i>&nbsp<a href="/docs/general-help/website-faq">FAQs</a><span class="divider">| </span><i class="fa fa-book" aria-hidden="true"></i>&nbsp<a href="/docs/general-help/glossary">Glossary</a></p></div></div></div><div class="row"><div class="col-lg-3 col-md-4 col-sm-12 hidden-print"><div data-elastic-exclude><div id="menu"><div id="menu-header">Documentation</div><div class="group show" id="5fca9f91eb210c2c564f0d7c" onclick="toggle(&quot;5fca9f91eb210c2c564f0d7c&quot;)"><table><tr><td style="padding-left: 4px">General Help</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph5fca9f91eb210c2c564f0d7c"></span></td></tr></table></div><div class="item hidden" id="5fc537b03fb4b83beba83b23"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/organization-of-3d-structures-in-the-protein-data-bank">Organization of 3D Structures in the Protein Data Bank</a></td></tr></table></div><div class="item hidden" id="5fc51a863fb4b83beb6e959f"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/identifiers-in-pdb">Identifiers in PDB</a></td></tr></table></div><div class="item hidden" id="63002035b05c2fccc1804d67"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/assessing-the-quality-of-3d-structures">Assessing the Quality of 3D Structures</a></td></tr></table></div><div class="item hidden" id="62d9b56b35ec5bb4ddb19a42"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/computed-structure-models-and-rcsborg">Computed Structure Models and RCSB.org</a></td></tr></table></div><div class="item hidden" id="6003401bcff89d5fc8f8a3f3"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/data-from-external-resources-integrated-into-rcsb-pdb">Data From External Resources Integrated Into RCSB PDB</a></td></tr></table></div><div class="item hidden" id="6140b307ef055f03d1f222d2"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/symmetry-resources-in-the-pdb">Symmetry Resources in the PDB</a></td></tr></table></div><div class="item hidden" id="60b686d701b8e50720f2ca63"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/ligand-structure-quality-in-pdb-structures">Ligand Structure Quality in PDB Structures</a></td></tr></table></div><div class="item hidden" id="6018251aecb9a74be53123a7"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/web-services-overview">Web Services Overview</a></td></tr></table></div><div class="item hidden" id="5fce4e38eb210c2c56790636"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/x-ray-electron-density-maps">X-ray Electron Density Maps</a></td></tr></table></div><div class="item hidden" id="5fce5135eb210c2c567d7ab2"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/structures-without-legacy-pdb-format-files">Structures Without Legacy PDB Format Files</a></td></tr></table></div><div class="item hidden" id="600756cec5ab5836659ab2e5"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/deposition-resources">Deposition Resources</a></td></tr></table></div><div class="item hidden" id="60ebb04e0882a5597783cc03"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/software-supporters">Software Supporters</a></td></tr></table></div><div class="item hidden" id="6080bf66ec901916050494bd"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/membrane-protein-resources">Membrane Protein Resources</a></td></tr></table></div><div class="item hidden" id="6005be80cff89d5fc8f8a3f5"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/website-faq">Website FAQ</a></td></tr></table></div><div class="item hidden" id="5ff90b5af32c497fd6f7bf62"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/glossary">Glossary</a></td></tr></table></div><div class="item hidden" id="67224602e095838a1ce7d99f"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/general-help/help-topics-home">Help Topics Home</a></td></tr></table></div><div class="group show" id="5fbe8e183fb4b83beb4d0e39" onclick="toggle(&quot;5fbe8e183fb4b83beb4d0e39&quot;)"><table><tr><td style="padding-left: 4px">Search and Browse</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph5fbe8e183fb4b83beb4d0e39"></span></td></tr></table></div><div class="item hidden" id="60006df7ae9f8477226a6c82"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/search-and-browse/overview-search-and-browse">Overview: Search and Browse</a></td></tr></table></div><div class="item hidden" id="5ffde6ee3a38a923c3516cf2"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/search-and-browse/basic-search">Basic Search</a></td></tr></table></div><div class="group hidden" id="60083954244a4309df45ad46" onclick="toggle(&quot;60083954244a4309df45ad46&quot;)"><table><tr><td style="padding-left: 24px">Advanced Search</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph60083954244a4309df45ad46"></span></td></tr></table></div><div class="item hidden" id="5ffde93f3a38a923c3516cf3"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/overview-advanced-search">Overview: Advanced Search</a></td></tr></table></div><div class="item hidden" id="5fbecb613fb4b83bebb5e353"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/attribute-search">Attribute Search</a></td></tr></table></div><div class="item hidden" id="600b08bec5ab5836659ab2e9"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/attribute-details">Attribute Details</a></td></tr></table></div><div class="item hidden" id="5ffde9d03a38a923c3516cf5"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/sequence-similarity-search">Sequence Similarity Search</a></td></tr></table></div><div class="item hidden" id="5ffdeaf53a38a923c3516cf6"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/sequence-motif-search">Sequence Motif Search</a></td></tr></table></div><div class="item hidden" id="5ffe9c743a38a923c3516cfb"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/structure-similarity-search">Structure Similarity Search</a></td></tr></table></div><div class="item hidden" id="600b3277c5ab5836659ab2ea"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/structure-motif-search">Structure Motif Search</a></td></tr></table></div><div class="item hidden" id="5ffe9da13a38a923c3516cfc"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/chemical-similarity-search">Chemical Similarity Search</a></td></tr></table></div><div class="item hidden" id="602c2b653fed9e549afd7917"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/chemical-sketch-tool">Chemical Sketch Tool</a></td></tr></table></div><div class="item hidden" id="600061f0ae9f8477226a6c81"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/advanced-search/search-examples">Search Examples</a></td></tr></table></div><div class="group hidden" id="602c55d11a359e6e2d4a6ea7" onclick="toggle(&quot;602c55d11a359e6e2d4a6ea7&quot;)"><table><tr><td style="padding-left: 24px">Browse Options</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph602c55d11a359e6e2d4a6ea7"></span></td></tr></table></div><div class="item hidden" id="602c53f43fed9e549afd7918"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/overview-browse">Overview: Browse</a></td></tr></table></div><div class="item hidden" id="602c56893fed9e549afd791a"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/atc">ATC</a></td></tr></table></div><div class="item hidden" id="602c56b23fed9e549afd791b"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/biological-process">Biological Process</a></td></tr></table></div><div class="item hidden" id="646f8b661d621d75127a7a53"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/card">CARD</a></td></tr></table></div><div class="item hidden" id="602c57773fed9e549afd791f"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/cath">CATH</a></td></tr></table></div><div class="item hidden" id="602c59ab3fed9e549afd7922"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/cellular-component">Cellular Component</a></td></tr></table></div><div class="item hidden" id="65d93e6f72841524659883e1"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/disease-ontology">Disease Ontology</a></td></tr></table></div><div class="item hidden" id="61410115ef055f03d1f222d3"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/ecod">ECOD</a></td></tr></table></div><div class="item hidden" id="602c59da3fed9e549afd7923"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/enzyme-classification">Enzyme Classification</a></td></tr></table></div><div class="item hidden" id="602c59f53fed9e549afd7924"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/genome-location">Genome Location</a></td></tr></table></div><div class="item hidden" id="602c57cf3fed9e549afd7921"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/mesh">MeSH</a></td></tr></table></div><div class="item hidden" id="6080adaaec901916050494bc"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/membrane-protein-opm">Membrane Protein (OPM)</a></td></tr></table></div><div class="item hidden" id="602c57ae3fed9e549afd7920"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/molecular-function">Molecular Function</a></td></tr></table></div><div class="item hidden" id="602c5a1e3fed9e549afd7925"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/membrane-protein-mpstruc">Membrane Protein (mpstruc)</a></td></tr></table></div><div class="item hidden" id="602c57133fed9e549afd791d"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/protein-symmetry">Protein Symmetry</a></td></tr></table></div><div class="item hidden" id="602c57603fed9e549afd791e"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/scop-e">SCOP-e</a></td></tr></table></div><div class="item hidden" id="6141014def055f03d1f222d4"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/scop2">SCOP2</a></td></tr></table></div><div class="item hidden" id="602c56f13fed9e549afd791c"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/search-and-browse/browse-options/source-organism">Source Organism</a></td></tr></table></div><div class="item hidden" id="6000bab4d3c1ff0cf1f44f48"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/search-and-browse/mypdb">MyPDB</a></td></tr></table></div><div class="group show" id="618271c92a7d828464a7d146" onclick="toggle(&quot;618271c92a7d828464a7d146&quot;)"><table><tr><td style="padding-left: 4px">Exploring a 3D Structure</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph618271c92a7d828464a7d146"></span></td></tr></table></div><div class="item hidden" id="618274c904fb9835c6ae189a"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/overview">Overview</a></td></tr></table></div><div class="item hidden" id="618271f904fb9835c6ae1892"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/structure-summary-page">Structure Summary Page</a></td></tr></table></div><div class="item hidden" id="6182729704fb9835c6ae1893"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/structure">Structure</a></td></tr></table></div><div class="item hidden" id="618272c004fb9835c6ae1894"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/annotations">Annotations</a></td></tr></table></div><div class="item hidden" id="618272e004fb9835c6ae1895"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/experiment">Experiment</a></td></tr></table></div><div class="item hidden" id="618272fb04fb9835c6ae1896"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/sequence">Sequence</a></td></tr></table></div><div class="item hidden" id="6182730904fb9835c6ae1897"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/genome">Genome</a></td></tr></table></div><div class="item hidden" id="6182731a04fb9835c6ae1898"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/ligands">Ligands</a></td></tr></table></div><div class="item hidden" id="6182732a04fb9835c6ae1899"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/exploring-a-3d-structure/versions">Versions</a></td></tr></table></div><div class="group show" id="6256b2b3b4396e45e97bf3de" onclick="toggle(&quot;6256b2b3b4396e45e97bf3de&quot;)"><table><tr><td style="padding-left: 4px">Grouping Structures</td><td><span class="glyphicon glyphicon-triangle-top" id="glyph6256b2b3b4396e45e97bf3de"></span></td></tr></table></div><div class="item show" id="62fbafaf3b6e49562fa5c055"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/grouping-structures/overview-grouping-structures">Overview: Grouping Structures</a></td></tr></table></div><div class="item show" id="6081c10aec901916050494be"><table><tr><td class="title" style="padding-left: 24px"><a class="docs-index-link" href="/docs/grouping-structures/sequence-based-clustering">Sequence-based Clustering</a></td><td><span class="glyphicon glyphicon-chevron-right"></span></td></tr></table></div><div class="item show" id="6256b3269c3931864b07285b"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/grouping-structures/grouping-search-results">Grouping Search Results</a></td></tr></table></div><div class="item show" id="6256b35e9c3931864b07285c"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/grouping-structures/group-summary-pages">Group Summary Pages</a></td></tr></table></div><div class="item show" id="6364336066d6046810db7f11"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/grouping-structures/explore-sequence-alignments-in-3d">Explore Sequence Alignments in 3D</a></td></tr></table></div><div class="group show" id="5fd3e3a6eb210c2c5632d098" onclick="toggle(&quot;5fd3e3a6eb210c2c5632d098&quot;)"><table><tr><td style="padding-left: 4px">3D Viewers</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph5fd3e3a6eb210c2c5632d098"></span></td></tr></table></div><div class="group hidden" id="5f98cc9614cc37a34de620ea" onclick="toggle(&quot;5f98cc9614cc37a34de620ea&quot;)"><table><tr><td style="padding-left: 24px">Mol*</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph5f98cc9614cc37a34de620ea"></span></td></tr></table></div><div class="item hidden" id="5ee0fc4d25aa7b208a9fe39e"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/3d-viewers/mol*/getting-started">Getting Started</a></td></tr></table></div><div class="item hidden" id="5ee107b225aa7b208a9fe3a1"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/3d-viewers/mol*/maneuvering-in-mol*">Maneuvering in Mol*</a></td></tr></table></div><div class="item hidden" id="5ee10ad725aa7b208a9fe3a2"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/3d-viewers/mol*/making-selections">Making Selections</a></td></tr></table></div><div class="item hidden" id="5ee1046625aa7b208a9fe3a0"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/3d-viewers/mol*/navigating-by-sequence">Navigating by Sequence</a></td></tr></table></div><div class="item hidden" id="5ee1192f25aa7b208a9fe3a3"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/3d-viewers/mol*/managing-the-display">Managing the Display</a></td></tr></table></div><div class="item hidden" id="5ee13ac17f50f44e6aa4fb1f"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/3d-viewers/mol*/common-actions">Common Actions</a></td></tr></table></div><div class="item hidden" id="5ee231607f50f44e6aa4fb20"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/3d-viewers/mol*/faqs-scenarios">FAQs/Scenarios</a></td></tr></table></div><div class="item hidden" id="5ee253237f50f44e6aa4fb22"><table><tr><td class="title" style="padding-left: 44px"><a href="/docs/3d-viewers/mol*/mol*-cheat-sheet">Mol* Cheat Sheet</a></td></tr></table></div><div class="item hidden" id="60075352c5ab5836659ab2e3"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/3d-viewers/jmol">Jmol</a></td></tr></table></div><div class="item hidden" id="65a4b499c76ca3abcc925d0d"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/3d-viewers/ngl-to-mol*-ui-migration-guide">NGL to Mol* UI Migration Guide</a></td></tr></table></div><div class="group show" id="5fd3e3f4eb210c2c56332c65" onclick="toggle(&quot;5fd3e3f4eb210c2c56332c65&quot;)"><table><tr><td style="padding-left: 4px">Sequence Viewers</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph5fd3e3f4eb210c2c56332c65"></span></td></tr></table></div><div class="item hidden" id="60103d1ab1afe64903398251"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/sequence-viewers/sequence-annotations-viewer">Sequence Annotations Viewer</a></td></tr></table></div><div class="item hidden" id="60342ff52087e87def0d0b09"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/sequence-viewers/sequence-annotations-in-3d">Sequence Annotations in 3D</a></td></tr></table></div><div class="item hidden" id="5fc7f2843fb4b83beb6a7a3d"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/sequence-viewers/genome-view">Genome View</a></td></tr></table></div><div class="item hidden" id="60182dc1ecb9a74be53123aa"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/sequence-viewers/protein-sequence-alignment-view">Protein Sequence Alignment View</a></td></tr></table></div><div class="group show" id="60132e62aeeea33d3f095fa8" onclick="toggle(&quot;60132e62aeeea33d3f095fa8&quot;)"><table><tr><td style="padding-left: 4px">Tools</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph60132e62aeeea33d3f095fa8"></span></td></tr></table></div><div class="item hidden" id="60132e6a610d04019e01d4c2"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/tools/pairwise-structure-alignment">Pairwise Structure Alignment</a></td></tr></table></div><div class="group show" id="601024f3244a4309df5d6630" onclick="toggle(&quot;601024f3244a4309df5d6630&quot;)"><table><tr><td style="padding-left: 4px">Additional Resources</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph601024f3244a4309df5d6630"></span></td></tr></table></div><div class="item hidden" id="6010260ee244795fc6dcb836"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/3d-printing">3D Printing</a></td></tr></table></div><div class="item hidden" id="6010260ee244795fc6dcb839"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/databases-and-knowledgebases">Databases and Knowledgebases</a></td></tr></table></div><div class="item hidden" id="6010260ee244795fc6dcb838"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/crystallography-software">Crystallography Software</a></td></tr></table></div><div class="item hidden" id="63ee50cac031758bf1c30ff4"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/electron-microscopy-software">Electron Microscopy Software</a></td></tr></table></div><div class="item hidden" id="60135c8f236b8b22a9824a4a"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/modeling-and-simulation-software">Modeling and Simulation Software</a></td></tr></table></div><div class="item hidden" id="6010260ee244795fc6dcb83a"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/file-readers">File Readers</a></td></tr></table></div><div class="item hidden" id="6010260ee244795fc6dcb83d"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/nmr-software">NMR Software</a></td></tr></table></div><div class="item hidden" id="6010260ee244795fc6dcb83c"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/molecular-graphics-software">Molecular Graphics Software</a></td></tr></table></div><div class="item hidden" id="6168521eef055f03d1f2231b"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/sars-cov-2-and-covid-19">SARS-CoV-2 and COVID-19</a></td></tr></table></div><div class="item hidden" id="60102b1ab1afe6490339824f"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/sequence-analysis">Sequence Analysis</a></td></tr></table></div><div class="item hidden" id="6010260ee244795fc6dcb83e"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/structure-classification-and-analysis">Structure Classification and Analysis</a></td></tr></table></div><div class="item hidden" id="6317770e831916e52206a1ea"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/structure-prediction">Structure Prediction</a></td></tr></table></div><div class="item hidden" id="63dc03c2c031758bf1c30ff0"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/data-management-standards-and-best-practices">Data Management Standards and Best Practices</a></td></tr></table></div><div class="item hidden" id="6010260ee244795fc6dcb837"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/additional-resources/structure-validation-and-quality">Structure Validation and Quality</a></td></tr></table></div><div class="group show" id="600217ee5b6ad53203751b79" onclick="toggle(&quot;600217ee5b6ad53203751b79&quot;)"><table><tr><td style="padding-left: 4px">Programmatic Access</td><td><span class="glyphicon glyphicon-triangle-bottom" id="glyph600217ee5b6ad53203751b79"></span></td></tr></table></div><div class="item hidden" id="602d94713fed9e549afd7926"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/programmatic-access/file-download-services">File Download Services</a></td></tr></table></div><div class="item hidden" id="60398336fec59804432bfc37"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/programmatic-access/web-apis-overview">Web APIs Overview</a></td></tr></table></div><div class="item hidden" id="60183326ecb9a74be53123ab"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/programmatic-access/batch-downloads-with-shell-script">Batch Downloads with Shell Script</a></td></tr></table></div><div class="item hidden" id="610337d7ef055f03d1f222b9"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/programmatic-access/migrating-from-legacy-apis">Migrating from Legacy APIs</a></td></tr></table></div><div class="item hidden" id="60033e6ccff89d5fc8f8a3f2"><table><tr><td class="title" style="padding-left: 24px"><a href="/docs/programmatic-access/access-to-legacy-theoretical-models">Access to Legacy Theoretical Models</a></td></tr></table></div></div></div></div><div class="col-lg-9 col-md-8 col-sm-12 content-item"><div data-elastic-include><h5 class="menu-path">Grouping Structures</h5><h1>Sequence-based Clustering</h1><div><div style="padding-left:20px;">● <a href="#introduction">Introduction</a></div> <div style="padding-left:40px;">○ <a href="#sequences-and-sequence-clusters">Sequences and Sequence Clusters</a></div> <div style="padding-left:40px;">○ <a href="#what-are-sequence-clusters">What are Sequence Clusters?</a></div> <div style="padding-left:40px;">○ <a href="#why-use-sequence-clusters">Why use Sequence Clusters?</a></div> <div style="padding-left:20px;">● <a href="#documentation">Documentation</a></div> <div style="padding-left:40px;">○ <a href="#how-are-protein-sequences-in-the-pdb-clustered">How are protein sequences in the PDB clustered?</a></div> <div style="padding-left:40px;">○ <a href="#how-to-use-sequence-clusters-to-explore-the-3d-structures-in-rcsborg">How to use sequence clusters to explore the 3D structures in RCSB.org?</a></div> <div style="padding-left:20px;">● <a href="#references">References</a></div> <a class="content-anchor" id="introduction"></a> <h2>Introduction</h2> <p>The amino acid sequence of a protein directs its folding into shapes that enable specific functions. For most of the proteins in cells, protein folding is a rapid and in most cases repeatable process (<a href="https://doi.org/10.1126/science.181.4096.223" target="_blank">Anfinsen, 1973</a>) suggesting that protein sequences have the necessary information to fold into functional proteins and that each protein sequence forms a characteristic structure. While local regions of the protein may adopt slightly different conformations in different biological contexts, the overall structure remains the same. In a few exceptions a protein may adopt a completely different shape in the presence of a specific environment or binding partner(s). Research directed towards predicting protein structure from sequence has been ongoing for more than 50 years. Recently, our ability to compute the 3D shapes of proteins using their amino acid sequence has made tremendous progress by applying machine learning techniques to the archived experimental structural data in the PDB (<a href="https://doi.org/10.1126/science.abj8754" target="_blank">Baek et al., 2021</a>, <a href="https://doi.org/10.1038/s41586-021-03819-2" target="_blank">Jumper et al., 2021</a>). <br /><br />When exploring PDB structures, the level of similarity between the amino acid sequences of two or more proteins can be used to infer their structural and functional similarity (<a href="https://doi.org/10.1002/prot.340090107" target="_blank">Sander and Schneider, 1991</a>). Protein sequences that are 100% identical to each other belong to the same protein, but high levels of sequence identity (e.g., >90%) is also indicative of the same protein, perhaps with a few mutations or variations due to different sources of the protein. Lower levels of sequence similarity between protein sequences may indicate some relationship between their structures and functions. The threshold of sequence similarity that indicates structural homology depends on the length of the alignment. As a rule of thumb for protein sequences that are longer than 100 amino acids, >25% sequence identity indicates similar structure and function (<a href="https://doi.org/10.1002/prot.340090107" target="_blank">Sander and Schneider, 1991</a>).</p> <a class="content-anchor" id="sequences-and-sequence-clusters"></a> <h3>Sequences and Sequence Clusters</h3> <p>As the single worldwide repository for macromolecular structures, the Protein Data Bank holds many structures with the same or similar sequence and structures. This redundancy enables deep understanding of the biology of these proteins. However, some bioinformatics analyses may benefit from grouping these redundant sequences and structures. For example, all protein structures of the same protein have the exact same sequence. These may be grouped together. Protein sequences where 90% of the sequence is identical is said to have a 90% sequence identity, while proteins whose sequences are only 30% identical have a 30% sequence identity. Grouping proteins into clusters by sequence identity is a way to reduce/remove redundancy in 3D structures (including experimental structures and Computed Structure Models or CSMs). The sequences in a particular cluster are expected to share structural and functional properties depending on the level of sequence identity.</p> <a class="content-anchor" id="what-are-sequence-clusters"></a> <h3>What are Sequence Clusters?</h3> <p>The amino acid sequences of all proteins, whose 3D structures are available from RCSB.org (including experimental structures and CSMs) are grouped at different levels of sequence identity (e.g., 100%, 95%, 90%, 70%, 50% and 30%) to yield sequence clusters. These pre-computed sequence groups are available for exploring the PDB archive and <a href="/docs/grouping-structures/grouping-search-results" target="_blank">grouping search results</a>.</p> <a class="content-anchor" id="why-use-sequence-clusters"></a> <h3>Why use Sequence Clusters?</h3> <p>Instead of using all sequences of the 3D structures available from RCSB.org for analysis, representative sequences from each of the sequence clusters can be used. Depending on the level of sequence similarity, properties and features of the representative proteins can be extended to other members in the cluster. Using sequence clusters has the following advantage:</p> <ul style="list-style-type:disc;"> <li>It reduces the size of the sequence data set of all 3D structures available and can help simplify, optimize, and make their analysis more efficient.</li> <li>Monitoring growth in the non-redundant sequence clusters enables monitoring the variety of structures being deposited to the PDB </li> <li>It can be used to organize sequences from both experimental structures and CSMs to explore evolutionary relationships between specific proteins.</li> </ul> <div style="height: 20px;"></div><a class="content-anchor" id="documentation"></a> <h2>Documentation</h2> <a class="content-anchor" id="how-are-protein-sequences-in-the-pdb-clustered"></a> <h3>How are protein sequences in the PDB clustered?</h3> <p>Sequence clusters are calculated using the MMseqs2 software (<a href="https://doi.org/10.1038/nbt.3988" target="_blank">Steinegger and Söding, 2017</a>). Currently, only protein sequences are subject to clustering. The rationale for clustering considers the following points:</p> <ul style="list-style-type:disc;"> <li>All protein chains of at least 10 amino acids are included in the clusters. </li> <li>Sequence identity is defined as the percentage of identical residues between the two amino acid sequences in the alignment. </li> <li>The sequence clustering process begins with an all by all comparison of protein sequences in the PDB.</li> <li>Only alignments with sequence identity scores above the threshold (100%, 95%, 90%, 70%, 50% and 30%) and covering at least 80% (-c 0.80) of both sequences are retained.</li> <li>The clustering is run with the following parameters of the MMseqs2 software:</li> <ul style="list-style-type:disc;"> <li><b>The clustering uses --cluster-mode 1</b>, which corresponds to the connected component algorithm.</li> <li><b>50% sequence identity and above: computed with easy-linclust</b></li> <li><b>Below 50%: computed with easy-cluster and sensitivity is set to (-s 8)</b> for MMseqs2's highest alignment sensitivity for clustering</li> </ul> <li>For more details on the procedure, please refer to <a href="https://github.com/soedinglab/mmseqs2/wiki" target="_blank">the mmseqs2 user guide</a>.</li> </ul> <div style="height: 20px;"></div><p>Note: The sequence clusters are subject to change over time as new protein sequences continue to be added to the archive.</p> <a class="content-anchor" id="how-to-use-sequence-clusters-to-explore-the-3d-structures-in-rcsborg"></a> <h3>How to use sequence clusters to explore the 3D structures in RCSB.org?</h3> <p>Each week, RCSB PDB computes sequence clusters for all protein sequences available from RCSB.org [including experimental (PDB) structures, and available CSMs]. You can use these pre-computed clusters the following ways:</p> <ul style="list-style-type:disc;"> <li>Examine and explore growth of sequences in experimental (PDB) structures: </li> <ul style="list-style-type:disc;"> <li>Learn about the number of unique protein sequences added to the PDB annually - review the <a href="/stats/nr/cluster-ids-95" target="_blank">non-redundant protein sequences statistics</a> and <a href="/search?request=%7B%22query%22%3A%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22terminal%22%2C%22service%22%3A%22text%22%2C%22parameters%22%3A%7B%22attribute%22%3A%22rcsb_accession_info.initial_release_date%22%2C%22operator%22%3A%22range%22%2C%22value%22%3A%7B%22from%22%3A%222022-01-01T00%3A00%3A00Z%22%2C%22to%22%3A%222022-12-31T23%3A59%3A59Z%22%2C%22include_lower%22%3Atrue%2C%22include_upper%22%3Atrue%7D%7D%7D%5D%2C%22logical_operator%22%3A%22and%22%7D%5D%2C%22logical_operator%22%3A%22and%22%2C%22label%22%3A%22text%22%7D%5D%2C%22logical_operator%22%3A%22and%22%7D%2C%22return_type%22%3A%22polymer_entity%22%2C%22request_options%22%3A%7B%22group_by_return_type%22%3A%22groups%22%2C%22group_by%22%3A%7B%22aggregation_method%22%3A%22sequence_identity%22%2C%22ranking_criteria_type%22%3A%7B%22sort_by%22%3A%22rcsb_entry_info.resolution_combined%22%2C%22direction%22%3A%22asc%22%7D%2C%22similarity_cutoff%22%3A95%7D%2C%22paginate%22%3A%7B%22start%22%3A0%2C%22rows%22%3A25%7D%2C%22results_content_type%22%3A%5B%22experimental%22%5D%2C%22sort%22%3A%5B%7B%22sort_by%22%3A%22score%22%2C%22direction%22%3A%22desc%22%7D%2C%7B%22sort_by%22%3A%22size%22%2C%22direction%22%3A%22desc%22%7D%5D%2C%22scoring_strategy%22%3A%22combined%22%7D%2C%22request_info%22%3A%7B%22query_id%22%3A%22b4143ed29b9293e6aefe9753a6c6485f%22%7D%7D" target="_blank">explore groups of structures with these sequences</a> for further analysis.</li> <li>Learn about the <a href="/stats/growth/nr/cluster-ids-95" target="_blank">cumulative growth of unique protein sequences in the PDB</a> and <a href="/search?request=%7B%22query%22%3A%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22group%22%2C%22nodes%22%3A%5B%7B%22type%22%3A%22terminal%22%2C%22service%22%3A%22text%22%2C%22parameters%22%3A%7B%22attribute%22%3A%22rcsb_accession_info.initial_release_date%22%2C%22operator%22%3A%22range%22%2C%22value%22%3A%7B%22from%22%3A%221976-01-01T00%3A00%3A00Z%22%2C%22to%22%3A%222022-12-31T23%3A59%3A59Z%22%2C%22include_lower%22%3Atrue%2C%22include_upper%22%3Atrue%7D%7D%7D%5D%2C%22logical_operator%22%3A%22and%22%7D%5D%2C%22logical_operator%22%3A%22and%22%2C%22label%22%3A%22text%22%7D%5D%2C%22logical_operator%22%3A%22and%22%7D%2C%22return_type%22%3A%22polymer_entity%22%2C%22request_options%22%3A%7B%22group_by_return_type%22%3A%22groups%22%2C%22group_by%22%3A%7B%22aggregation_method%22%3A%22sequence_identity%22%2C%22ranking_criteria_type%22%3A%7B%22sort_by%22%3A%22rcsb_entry_info.resolution_combined%22%2C%22direction%22%3A%22asc%22%7D%2C%22similarity_cutoff%22%3A95%7D%2C%22paginate%22%3A%7B%22start%22%3A0%2C%22rows%22%3A25%7D%2C%22results_content_type%22%3A%5B%22experimental%22%5D%2C%22sort%22%3A%5B%7B%22sort_by%22%3A%22score%22%2C%22direction%22%3A%22desc%22%7D%2C%7B%22sort_by%22%3A%22size%22%2C%22direction%22%3A%22desc%22%7D%5D%2C%22scoring_strategy%22%3A%22combined%22%7D%2C%22request_info%22%3A%7B%22query_id%22%3A%22d539143568bccba474811f454038aa2c%22%7D%7D" target="_blank">explore groups of structures with these sequences</a> for further analysis.</li> </ul> <li>Organize search results (including experimental structures and CSMs) based on sequence similarity: </li> <ul style="list-style-type:disc;"> <li><a href="/docs/grouping-structures/grouping-search-results" target="_blank">Group search results by sequence identity</a> and either view representative members of the group or explore all members of these groups (using the <a href="/docs/grouping-structures/group-summary-pages">Group Summary Pages</a>).</li> <li>Explore the sequences, structural features, and ligand interactions of other sequences in the same protein sequence cluster to gather structural and functional insights and develop hypotheses.</li> </ul> </ul> <div style="height: 20px;"></div><ul style="list-style-type:disc;"> <li>Learn about the number of unique protein sequences added to the PDB annually - review the <a href="/stats/nr/cluster-ids-95" target="_blank">non-redundant protein sequences statistics</a> and download these sequences.</li> <li>Learn about the <a href="/stats/growth/nr/cluster-ids-95" target="_blank">cumulative growth of unique protein sequences</a> in the PDB and download them.</li> <li>Organize <a href="/docs/grouping-structures/grouping-search-results" target="_blank">search results by sequence identity</a> into meaningful/manageable groups and explore representatives or as groups (using the <a href="/docs/grouping-structures/group-summary-pages" target="_blank">Group Summary Pages</a>). </li> <li>Explore the pre-computed clusters that include a specific polymer entity in a PDB entry. </li> </ul> <div style="height: 20px;"></div><a class="content-anchor" id="references"></a> <h2>References</h2> <ul style="list-style-type:disc;"> <li>Anfinsen, C. (1973), Science, 181, 223-230; doi: <a href="https://doi.org/10.1126/science.181.4096.223" target="_blank">10.1126/science.181.4096.223</a></li> <li>Baek, M., DiMaio, F., Anishchenko, I., Dauparas, J., Ovchinnikov, S., Lee, G. R., Wang, J., Cong, Q., Kinch, L. N., Schaeffer, R. D., Millán, C., Park, H., Adams, C., Glassman, C. R., DeGiovanni, A., Pereira, J. H., Rodrigues, A. V., van Dijk, A. A., Ebrecht, A. C., Opperman, D. J., Sagmeister, T., Buhlheller, C., Pavkov-Keller, T., Rathinaswamy, M. K., Dalwadi, U., Yip, C. K., Burke, J. E., Garcia K. C., Grishin, N. V., Adams, P. D., Read, R. J., Baker, D. (2021). Accurate prediction of protein structures and interactions using a three-track neural network. Science (New York, N.Y.), 373, 871–876; doi: <a href="https://doi.org/10.1126/science.abj8754" target="_blank">10.1126/science.abj8754</a></li> <li>Jumper, J., Evans, R., Pritzel, A., Green, T., Figurnov, M., Ronneberger, O., Tunyasuvunakool, K., Bates, R., Žídek, A., Potapenko, A., Bridgland, A., Meyer, C., Kohl, S., Ballard, A. J., Cowie, A., Romera-Paredes, B., Nikolov, S., Jain, R., Adler, J., Back, T., Petersen, S., Reiman, D., Clancy, E.,, Zielinski, M., Steinegger, M., Pacholska, M., Berghammer, T., Bodenstein, S., Silver, D., Vinyals, O., Senior, A. W., Kavukcuoglu, K., Kohli, P., Hassabis, D. (2021). Highly accurate protein structure prediction with AlphaFold. Nature, 596, 583–589; doi: <a href="https://doi.org/10.1038/s41586-021-03819-2" target="_blank">10.1038/s41586-021-03819-2</a></li> <li>Sander, C., Schneider, R. (1991). Database of homology-derived protein structures and the structural meaning of sequence alignment. Proteins, 9, 56–68; doi: <a href="https://doi.org/10.1002/prot.340090107" target="_blank">10.1002/prot.340090107</a></li> <li>Steinegger, M., Söding, J. (2017). MMseqs2 enables sensitive protein sequence searching for the analysis of massive data sets. Nat Biotechnol 35, 1026–1028. <a href="https://doi.org/10.1038/nbt.3988" target="_blank">https://doi.org/10.1038/nbt.3988</a></li> </ul> <div style="height: 20px;"></div></div></div><br><hr><div class="item-info"><div>Please report any encountered broken links to <a href='mailto:info@rcsb.org'>info@rcsb.org</a></div><div>Last updated: 5/1/2023</div></div></div></div></div></div><div data-elastic-exclude><div class="hidden-print" id="footer_main"><div class="container" style="padding:0"><div class="row"><div class="col-md-6 col-sm-12" style="padding-left:0"> <div class="row"><div class="col-sm-4"><ul><li><span class="row_header">About</span></li><li><a href="/pages/about-us/index">About Us</a></li><li><a href="/pages/policies#References">Citing Us</a></li><li><a href="/pages/publications">Publications</a></li><li><a href="/pages/team">Team</a></li><li><a href="/pages/jobs">Careers</a></li><li><a href="/pages/policies">Usage & Privacy</a></li></ul></div><div class="col-sm-4" style="padding-left:0"><ul><li><span class="row_header">Support</span></li><li><a href="/pages/contactus">Contact Us</a></li><li><a href="/help">Help</a></li><li><a href="/docs/general-help/website-faq">Website FAQ</a></li><li><a href="/docs/general-help/glossary">Glossary</a></li><li><a href="https://status.rcsb.org/" target="_blank">Service Status</a></li></ul></div><div class="col-md-4 hidden-sm"></div></div></div><div class="col-md-6 col-sm-12" style="padding-left:5px"> <div class="row"><div class="col-sm-4"><p class="row_header">RCSB PDB is hosted by</p><div class="footerLogos"><hr><a href="http://www.rutgers.edu/"><img class="Rutgerslogo" src="https://cdn.rcsb.org/rcsb-pdb//v2/common/images/Logo_Rutgers-2024.png" alt="Rutgers University logo"></a><hr><a href="https://ucsd.edu/"><img class="UCSDlogo" src="https://cdn.rcsb.org/rcsb-pdb//v2/common/images/Logo_UCSD-navy.png" alt="Uiversity of California San Diego logo"></a><a href="https://www.sdsc.edu/"><img class="SDSClogo" src="https://cdn.rcsb.org/rcsb-pdb//v2/common/images/Logo_SDSC-black.png" alt="San Diego Supercomputer Center logo"></a><hr><a href="https://www.ucsf.edu/"><img class="UCSFlogo" src="https://cdn.rcsb.org/rcsb-pdb//v2/common/images/Logo_UCSF.png" alt="University of California San Francisco Logo"></a></div></div><div class="col-sm-4"><p class="row_header">RCSB PDB is a member of the</p><div class="footerLogos"><span id="pdbmembers_footer"><hr><a href="https://www.wwpdb.org" target="_blank" rel="noopener"><img class="wwpdblogo" src="https://cdn.rcsb.org/rcsb-pdb//v2/common/images/Logo_wwpdb.png" alt="wwPDB"></a><hr><a href="https://www.emdataresource.org" target="_blank" rel="noopener"><img id="emdatabanklogo_footer" src="https://cdn.rcsb.org/rcsb-pdb//v2/common/images/EMDataResourcelogo.png" alt="EMDataResource"></a></span></div></div><div class="col-sm-4"><ul><li><span class="row_header">RCSB Partners</span></li><li><a href="https://nakb.org/" target="_blank" rel="noopener">Nucleic Acid Knowledgebase</a></li></ul><ul><li><span class="row_header"><a href="https://www.wwpdb.org/" target="_blank" rel="noopener" style="text-decoration: none; color: black">wwPDB Partners</a></span></li><li><a href="/">RCSB PDB</a></li><li><a href="https://www.ebi.ac.uk/pdbe/" target="_blank" rel="noopener">PDBe</a></li><li><a href="https://www.pdbj.org/" target="_blank" rel="noopener">PDBj</a></li><li><a href="https://bmrb.io/" target="_blank" rel="noopener">BMRB</a></li><li><a href="https://emdb-empiar.org/" target="_blank" rel="noopener">EMDB</a></li></ul></div></div></div></div></div></div><div id="footer_grant"><div class="container"><div class="row"><p>RCSB PDB Core Operations are funded by the <a href="http://www.nsf.gov/" target="_blank" rel="noopener">U.S. National Science Foundation</a> (DBI-2321666), the <a href="http://science.energy.gov/" target="_blank" rel="noopener">US Department of Energy</a> (DE-SC0019749), and the <a href="http://www.cancer.gov/" target="_blank" rel="noopener">National Cancer Institute</a>, <a href="http://www.niaid.nih.gov/" target="_blank" rel="noopener">National Institute of Allergy and Infectious Diseases</a>, and <a href="http://www.nigms.nih.gov/" target="_blank" rel="noopener">National Institute of General Medical Sciences</a> of the <a href="http://www.nih.gov/" target="_blank" rel="noopener">National Institutes of Health</a> under grant R01GM157729.</p></div></div></div><div id="jira-fdbck"></div></div></div></body></html>

Pages: 1 2 3 4 5 6 7 8 9 10