<!-- CINXE.COM -->

<!doctype html>
<html lang="en">
<head>
  <title data-rh="true">Categorizing learning content. How Coursera generated course… | by Chris Liu | Coursera Engineering | Medium</title>
  <meta data-rh="true" charset="utf-8"/>
  <!-- Viewport: no maximum-scale cap, so pinch-zoom stays available (WCAG 1.4.4 Resize Text). -->
  <meta data-rh="true" name="viewport" content="width=device-width,minimum-scale=1,initial-scale=1"/>
  <meta data-rh="true" name="theme-color" content="#000000"/>
  <!-- App deep-link and social-card metadata (Twitter, App Links, Open Graph). -->
  <meta data-rh="true" name="twitter:app:name:iphone" content="Medium"/>
  <meta data-rh="true" name="twitter:app:id:iphone" content="828256236"/>
  <meta data-rh="true" property="al:ios:app_name" content="Medium"/>
  <meta data-rh="true" property="al:ios:app_store_id" content="828256236"/>
  <meta data-rh="true" property="al:android:package" content="com.medium.reader"/>
  <meta data-rh="true" property="fb:app_id" content="542599432471018"/>
  <meta data-rh="true" property="og:site_name" content="Medium"/>
  <meta data-rh="true" property="og:type" content="article"/>
  <meta data-rh="true" property="article:published_time" content="2019-01-22T17:27:19.046Z"/>
  <meta data-rh="true" name="title" content="Categorizing learning content. How Coursera generated course… | by Chris Liu | Coursera Engineering | Medium"/>
  <meta data-rh="true" property="og:title" content="Data Driven Content Categorization"/>
  <meta data-rh="true" property="al:android:url" content="medium://p/89de0104bcbd"/>
  <meta data-rh="true" property="al:ios:url" content="medium://p/89de0104bcbd"/>
  <meta data-rh="true" property="al:android:app_name" content="Medium"/>
  <meta data-rh="true" name="description" content="Courses on Coursera have a scale and breadth of diversity makes them hard to categorize. 
This post explains how we took a data driven approach to create relevant and useful categories."/><meta data-rh="true" property="og:description" content="How Coursera generated course categories from thousands of courses using a data driven clustering approach."/><meta data-rh="true" property="og:url" content="https://medium.com/coursera-engineering/data-driven-content-categorization-89de0104bcbd"/><meta data-rh="true" property="al:web:url" content="https://medium.com/coursera-engineering/data-driven-content-categorization-89de0104bcbd"/><meta data-rh="true" property="og:image" content="https://miro.medium.com/v2/resize:fit:1092/1*A-lEgYtSuSKQZ21ves4JOw.png"/><meta data-rh="true" property="article:author" content="https://medium.com/@cliu_88389"/><meta data-rh="true" name="author" content="Chris Liu"/><meta data-rh="true" name="robots" content="index,noarchive,follow,max-image-preview:large"/><meta data-rh="true" name="referrer" content="unsafe-url"/><meta data-rh="true" property="twitter:title" content="Data Driven Content Categorization"/><meta data-rh="true" name="twitter:site" content="@CourseraEng"/><meta data-rh="true" name="twitter:app:url:iphone" content="medium://p/89de0104bcbd"/><meta data-rh="true" property="twitter:description" content="How Coursera generated course categories from thousands of courses using a data driven clustering approach."/><meta data-rh="true" name="twitter:image:src" content="https://miro.medium.com/v2/resize:fit:1092/1*A-lEgYtSuSKQZ21ves4JOw.png"/><meta data-rh="true" name="twitter:card" content="summary_large_image"/><meta data-rh="true" name="twitter:label1" content="Reading time"/><meta data-rh="true" name="twitter:data1" content="5 min read"/><link data-rh="true" rel="icon" href="https://miro.medium.com/v2/5d8de952517e8160e40ef9841c781cdc14a5db313057fa3c3de41c6f5b494b19"/><link data-rh="true" rel="search" type="application/opensearchdescription+xml" title="Medium" href="/osd.xml"/><link data-rh="true" rel="apple-touch-icon" 
sizes="152x152" href="https://miro.medium.com/v2/resize:fill:304:304/10fd5c419ac61637245384e7099e131627900034828f4f386bdaa47a74eae156"/><link data-rh="true" rel="apple-touch-icon" sizes="120x120" href="https://miro.medium.com/v2/resize:fill:240:240/10fd5c419ac61637245384e7099e131627900034828f4f386bdaa47a74eae156"/><link data-rh="true" rel="apple-touch-icon" sizes="76x76" href="https://miro.medium.com/v2/resize:fill:152:152/10fd5c419ac61637245384e7099e131627900034828f4f386bdaa47a74eae156"/><link data-rh="true" rel="apple-touch-icon" sizes="60x60" href="https://miro.medium.com/v2/resize:fill:120:120/10fd5c419ac61637245384e7099e131627900034828f4f386bdaa47a74eae156"/><link data-rh="true" rel="mask-icon" href="https://miro.medium.com/v2/resize:fill:1000:1000/7*GAOKVe--MXbEJmV9230oOQ.png" color="#171717"/><link data-rh="true" rel="preconnect" href="https://glyph.medium.com" crossOrigin=""/><link data-rh="true" id="glyph_preload_link" rel="preload" as="style" type="text/css" href="https://glyph.medium.com/css/unbound.css"/><link data-rh="true" id="glyph_link" rel="stylesheet" type="text/css" href="https://glyph.medium.com/css/unbound.css"/><link data-rh="true" rel="author" href="https://medium.com/@cliu_88389"/><link data-rh="true" rel="canonical" href="https://medium.com/coursera-engineering/data-driven-content-categorization-89de0104bcbd"/><link data-rh="true" rel="alternate" href="android-app://com.medium.reader/https/medium.com/p/89de0104bcbd"/><script data-rh="true" type="application/ld+json">{"@context":"http:\u002F\u002Fschema.org","@type":"NewsArticle","image":["https:\u002F\u002Fmiro.medium.com\u002Fv2\u002Fresize:fit:1200\u002F1*A-lEgYtSuSKQZ21ves4JOw.png"],"url":"https:\u002F\u002Fmedium.com\u002Fcoursera-engineering\u002Fdata-driven-content-categorization-89de0104bcbd","dateCreated":"2018-09-12T04:13:40.251Z","datePublished":"2018-09-12T04:13:40.251Z","dateModified":"2019-01-22T17:27:19.046Z","headline":"Categorizing learning content - Coursera Engineering - 
Medium","name":"Categorizing learning content - Coursera Engineering - Medium","description":"Courses on Coursera have a scale and breadth of diversity makes them hard to categorize. This post explains how we took a data driven approach to create relevant and useful categories.","identifier":"89de0104bcbd","author":{"@type":"Person","name":"Chris Liu","url":"https:\u002F\u002Fmedium.com\u002F@cliu_88389"},"creator":["Chris Liu"],"publisher":{"@type":"Organization","name":"Coursera Engineering","url":"https:\u002F\u002Fmedium.com\u002Fcoursera-engineering","logo":{"@type":"ImageObject","width":422,"height":60,"url":"https:\u002F\u002Fmiro.medium.com\u002Fv2\u002Fresize:fit:844\u002F1*zXjOKA4JKHH04Ipi2NI0jA.png"}},"mainEntityOfPage":"https:\u002F\u002Fmedium.com\u002Fcoursera-engineering\u002Fdata-driven-content-categorization-89de0104bcbd"}</script><style type="text/css" data-fela-rehydration="571" data-fela-type="STATIC">html{box-sizing:border-box;-webkit-text-size-adjust:100%}*, *:before, *:after{box-sizing:inherit}body{margin:0;padding:0;text-rendering:optimizeLegibility;-webkit-font-smoothing:antialiased;color:rgba(0,0,0,0.8);position:relative;min-height:100vh}h1, h2, h3, h4, h5, h6, dl, dd, ol, ul, menu, figure, blockquote, p, pre, form{margin:0}menu, ol, ul{padding:0;list-style:none;list-style-image:none}main{display:block}a{color:inherit;text-decoration:none}a, button, input{-webkit-tap-highlight-color:transparent}img, svg{vertical-align:middle}button{background:transparent;overflow:visible}button, input, optgroup, select, textarea{margin:0}:root{--reach-tabs:1;--reach-menu-button:1}#speechify-root{font-family:Sohne, sans-serif}div[data-popper-reference-hidden="true"]{visibility:hidden;pointer-events:none}.grecaptcha-badge{visibility:hidden} /*XCode style (c) Angel Garcia <angelgarcia.mail@gmail.com>*/.hljs {background: #fff;color: black; }/* Gray DOCTYPE selectors like WebKit */ .xml .hljs-meta {color: #c0c0c0; }.hljs-comment, .hljs-quote {color: #007400; 
}.hljs-tag, .hljs-attribute, .hljs-keyword, .hljs-selector-tag, .hljs-literal, .hljs-name {color: #aa0d91; }.hljs-variable, .hljs-template-variable {color: #3F6E74; }.hljs-code, .hljs-string, .hljs-meta .hljs-string {color: #c41a16; }.hljs-regexp, .hljs-link {color: #0E0EFF; }.hljs-title, .hljs-symbol, .hljs-bullet, .hljs-number {color: #1c00cf; }.hljs-section, .hljs-meta {color: #643820; }.hljs-title.class_, .hljs-class .hljs-title, .hljs-type, .hljs-built_in, .hljs-params {color: #5c2699; }.hljs-attr {color: #836C28; }.hljs-subst {color: #000; }.hljs-formula {background-color: #eee;font-style: italic; }.hljs-addition {background-color: #baeeba; }.hljs-deletion {background-color: #ffc8bd; }.hljs-selector-id, .hljs-selector-class {color: #9b703f; }.hljs-doctag, .hljs-strong {font-weight: bold; }.hljs-emphasis {font-style: italic; } </style><style type="text/css" data-fela-rehydration="571" data-fela-type="KEYFRAME">@-webkit-keyframes k1{0%{opacity:0.8}50%{opacity:0.5}100%{opacity:0.8}}@-moz-keyframes k1{0%{opacity:0.8}50%{opacity:0.5}100%{opacity:0.8}}@keyframes k1{0%{opacity:0.8}50%{opacity:0.5}100%{opacity:0.8}}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE">.a{font-family:medium-content-sans-serif-font, -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Oxygen, Ubuntu, Cantarell, "Open Sans", "Helvetica Neue", sans-serif}.b{font-weight:400}.c{background-color:rgba(255, 255, 255, 1)}.l{display:block}.m{position:sticky}.n{top:0}.o{z-index:500}.p{padding:0 24px}.q{align-items:center}.r{border-bottom:solid 1px #F2F2F2}.y{height:41px}.z{line-height:20px}.ab{display:flex}.ac{height:57px}.ae{flex:1 0 auto}.af{color:inherit}.ag{fill:inherit}.ah{font-size:inherit}.ai{border:inherit}.aj{font-family:inherit}.ak{letter-spacing:inherit}.al{font-weight:inherit}.am{padding:0}.an{margin:0}.ao{cursor:pointer}.ap:disabled{cursor:not-allowed}.aq:disabled{color:#6B6B6B}.ar:disabled{fill:#6B6B6B}.au{width:auto}.av 
path{fill:#242424}.aw{height:25px}.ax{margin-left:16px}.ay{border:none}.az{border-radius:20px}.ba{width:240px}.bb{background:#F9F9F9}.bc path{fill:#6B6B6B}.be{outline:none}.bf{font-family:sohne, "Helvetica Neue", Helvetica, Arial, sans-serif}.bg{font-size:14px}.bh{width:100%}.bi{padding:10px 20px 10px 0}.bj{background-color:transparent}.bk{color:#242424}.bl::placeholder{color:#6B6B6B}.bm{display:inline-block}.bn{margin-left:12px}.bo{margin-right:12px}.bp{border-radius:4px}.bq{margin-left:24px}.br{height:24px}.bx{background-color:#F9F9F9}.by{border-radius:50%}.bz{height:32px}.ca{width:32px}.cb{justify-content:center}.ch{max-width:680px}.ci{min-width:0}.cj{animation:k1 1.2s ease-in-out infinite}.ck{height:100vh}.cl{margin-bottom:16px}.cm{margin-top:48px}.cn{align-items:flex-start}.co{flex-direction:column}.cp{justify-content:space-between}.cq{margin-bottom:24px}.cw{width:80%}.cx{background-color:#F2F2F2}.dd{height:44px}.de{width:44px}.df{margin:auto 0}.dg{margin-bottom:4px}.dh{height:16px}.di{width:120px}.dj{width:80px}.dp{margin-bottom:8px}.dq{width:96%}.dr{width:98%}.ds{width:81%}.dt{margin-left:8px}.du{color:#6B6B6B}.dv{font-size:13px}.dw{height:100%}.ep{color:#FFFFFF}.eq{fill:#FFFFFF}.er{background:rgba(99, 136, 191, 1)}.es{border-color:rgba(99, 136, 191, 1)}.ew:disabled{cursor:inherit !important}.ex:disabled{opacity:0.3}.ey:disabled:hover{background:rgba(99, 136, 191, 1)}.ez:disabled:hover{border-color:rgba(99, 136, 191, 1)}.fa{border-radius:99em}.fb{border-width:1px}.fc{border-style:solid}.fd{box-sizing:border-box}.fe{text-decoration:none}.ff{text-align:center}.fi{margin-right:32px}.fj{position:relative}.fk{fill:#6B6B6B}.fn{background:transparent}.fo svg{margin-left:4px}.fp svg{fill:#6B6B6B}.fr{box-shadow:inset 0 0 0 1px rgba(0, 0, 0, 0.05)}.fs{position:absolute}.fz{margin:0 24px}.gd{background:rgba(255, 255, 255, 1)}.ge{border:1px solid #F2F2F2}.gf{box-shadow:0 1px 4px #F2F2F2}.gg{max-height:100vh}.gh{overflow-y:auto}.gi{left:0}.gj{top:calc(100vh + 
100px)}.gk{bottom:calc(100vh + 100px)}.gl{width:10px}.gm{pointer-events:none}.gn{word-break:break-word}.go{word-wrap:break-word}.gp:after{display:block}.gq:after{content:""}.gr:after{clear:both}.gs{line-height:1.23}.gt{letter-spacing:0}.gu{font-style:normal}.gv{font-weight:700}.hq{margin-bottom:-0.27em}.hr{line-height:1.394}.im{align-items:baseline}.in{width:48px}.io{height:48px}.ip{border:2px solid rgba(255, 255, 255, 1)}.iq{z-index:0}.ir{box-shadow:none}.is{border:1px solid rgba(0, 0, 0, 0.05)}.it{margin-left:-12px}.iu{width:28px}.iv{height:28px}.iw{z-index:1}.ix{width:24px}.iy{margin-bottom:2px}.iz{flex-wrap:nowrap}.ja{font-size:16px}.jb{line-height:24px}.jd{margin:0 8px}.je{display:inline}.jf{color:rgba(99, 136, 191, 1)}.jg{fill:rgba(99, 136, 191, 1)}.jj{flex:0 0 auto}.jm{flex-wrap:wrap}.jn{white-space:pre-wrap}.jo{margin-right:4px}.jp{overflow:hidden}.jq{max-height:20px}.jr{text-overflow:ellipsis}.js{display:-webkit-box}.jt{-webkit-line-clamp:1}.ju{-webkit-box-orient:vertical}.jv{word-break:break-all}.jx{padding-left:8px}.jy{padding-right:8px}.kz> *{flex-shrink:0}.la{overflow-x:scroll}.lb::-webkit-scrollbar{display:none}.lc{scrollbar-width:none}.ld{-ms-overflow-style:none}.le{width:74px}.lf{flex-direction:row}.lg{z-index:2}.lj{-webkit-user-select:none}.lk{border:0}.ll{fill:rgba(117, 117, 117, 1)}.lo{outline:0}.lp{user-select:none}.lq> svg{pointer-events:none}.lz{cursor:progress}.ma{margin-left:4px}.mb{margin-top:0px}.mc{opacity:1}.md{padding:4px 0}.mg{width:16px}.mi{display:inline-flex}.mo{max-width:100%}.mp{padding:8px 2px}.mq svg{color:#6B6B6B}.nh{line-height:1.58}.ni{letter-spacing:-0.004em}.nj{font-family:source-serif-pro, Georgia, Cambria, "Times New Roman", Times, 
serif}.oc{margin-bottom:-0.46em}.od{text-decoration:underline}.oe{line-height:1.12}.of{letter-spacing:-0.022em}.og{font-weight:600}.oz{margin-bottom:-0.28em}.pf{list-style-type:decimal}.pg{margin-left:30px}.ph{padding-left:0px}.pn{margin-left:auto}.po{margin-right:auto}.pp{max-width:811px}.pv{clear:both}.px{cursor:zoom-in}.py{z-index:auto}.qa{height:auto}.qb{margin-top:10px}.qc{max-width:728px}.qf{max-width:1292px}.qg{list-style-type:disc}.qh{max-width:1332px}.qi{max-width:1092px}.qj{line-height:1.18}.qx{margin-bottom:-0.31em}.qy{font-style:italic}.qz{margin-bottom:26px}.ra{margin-top:6px}.rb{margin-top:8px}.rc{margin-right:8px}.rd{padding:8px 16px}.re{border-radius:100px}.rf{transition:background 300ms ease}.rh{white-space:nowrap}.ri{border-top:none}.rj{margin-bottom:50px}.rk{height:52px}.rl{max-height:52px}.rm{box-sizing:content-box}.rn{position:static}.rp{max-width:155px}.rv{margin-right:20px}.rw{margin-bottom:64px}.rx{margin-bottom:48px}.sl{border-radius:2px}.sn{height:64px}.so{width:64px}.sp{align-self:flex-end}.sq{flex:1 1 auto}.sw{padding-right:4px}.sx{font-weight:500}.te{margin-top:16px}.tf{color:rgba(255, 255, 255, 1)}.tg{fill:rgba(255, 255, 255, 1)}.th{background:rgba(25, 25, 25, 1)}.ti{border-color:rgba(25, 25, 25, 1)}.tl:disabled{opacity:0.1}.tm:disabled:hover{background:rgba(25, 25, 25, 1)}.tn:disabled:hover{border-color:rgba(25, 25, 25, 1)}.tt{height:0px}.tu{gap:18px}.tv{fill:rgba(61, 61, 61, 1)}.tx{padding-bottom:6px}.ty{border-bottom:1px solid #F2F2F2}.ue{margin-top:32px}.uf{fill:#242424}.ug{background:0}.uh{border-color:#242424}.ui:disabled:hover{color:#242424}.uj:disabled:hover{fill:#242424}.uk:disabled:hover{border-color:#242424}.uv{border-bottom:solid 1px #E5E5E5}.uw{margin-top:72px}.ux{padding:24px 0}.uy{margin-bottom:0px}.uz{margin-right:16px}.as:hover:not(:disabled){color:rgba(25, 25, 25, 1)}.at:hover:not(:disabled){fill:rgba(25, 25, 25, 1)}.et:hover{background:rgba(87, 117, 161, 1)}.eu:hover{border-color:rgba(87, 117, 161, 
1)}.ev:hover{cursor:pointer}.fl:hover{color:#242424}.fm:hover{fill:#242424}.fq:hover svg{fill:#242424}.ft:hover{background-color:rgba(0, 0, 0, 0.1)}.jc:hover{text-decoration:underline}.jh:hover:not(:disabled){color:rgba(87, 117, 161, 1)}.ji:hover:not(:disabled){fill:rgba(87, 117, 161, 1)}.ln:hover{fill:rgba(8, 8, 8, 1)}.me:hover{fill:#000000}.mf:hover p{color:#000000}.mh:hover{color:#000000}.mr:hover svg{color:#000000}.rg:hover{background-color:#F2F2F2}.sm:hover{background-color:none}.tj:hover{background:#000000}.tk:hover{border-color:#242424}.tw:hover{fill:rgba(25, 25, 25, 1)}.bd:focus-within path{fill:#242424}.lm:focus{fill:rgba(8, 8, 8, 1)}.ms:focus svg{color:#000000}.pz:focus{transform:scale(1.01)}.lr:active{border-style:none}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="all and (min-width: 1080px)">.d{display:none}.bw{width:64px}.cg{margin:0 64px}.cv{height:48px}.dc{margin-bottom:52px}.do{margin-bottom:48px}.ef{font-size:14px}.eg{line-height:20px}.em{font-size:13px}.eo{padding:5px 12px}.fh{display:flex}.fy{margin-bottom:50px}.gc{max-width:680px}.hm{font-size:42px}.hn{margin-top:1.19em}.ho{line-height:52px}.hp{letter-spacing:-0.011em}.ie{font-size:22px}.if{margin-top:0.92em}.ig{line-height:28px}.il{align-items:center}.kl{border-top:solid 1px #F2F2F2}.km{border-bottom:solid 1px #F2F2F2}.kn{margin:32px 0 0}.ko{padding:3px 8px}.kx> *{margin-right:24px}.ky> :last-child{margin-right:0}.ly{margin-top:0px}.mn{margin:0}.ny{font-size:20px}.nz{margin-top:2.14em}.oa{line-height:32px}.ob{letter-spacing:-0.003em}.ov{font-size:24px}.ow{margin-top:1.95em}.ox{line-height:30px}.oy{letter-spacing:-0.016em}.pe{margin-top:0.94em}.pm{margin-top:1.14em}.pu{margin-top:56px}.qu{margin-top:1.72em}.qv{line-height:24px}.qw{letter-spacing:0}.ru{display:inline-block}.ry{flex-direction:row}.sb{margin-bottom:0}.sc{margin-right:20px}.sr{max-width:500px}.ts{margin-bottom:88px}.ud{margin:40px 0 
16px}.up{width:min-width}.uu{padding-top:72px}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="all and (max-width: 1079.98px)">.e{display:none}.lx{margin-top:0px}.qd{margin-left:auto}.qe{text-align:center}.rt{display:inline-block}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="all and (max-width: 903.98px)">.f{display:none}.lw{margin-top:0px}.rs{display:inline-block}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="all and (max-width: 727.98px)">.g{display:none}.lu{margin-top:0px}.lv{margin-right:0px}.rr{display:inline-block}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="all and (max-width: 551.98px)">.h{display:none}.s{display:flex}.t{justify-content:space-between}.bs{width:24px}.cc{margin:0 24px}.cr{height:40px}.cy{margin-bottom:44px}.dk{margin-bottom:32px}.dx{font-size:13px}.dy{line-height:20px}.eh{padding:0px 8px 1px}.fu{margin-bottom:2px}.gw{font-size:32px}.gx{margin-top:1.01em}.gy{line-height:38px}.gz{letter-spacing:-0.014em}.hs{font-size:18px}.ht{margin-top:0.79em}.hu{line-height:24px}.ih{align-items:flex-start}.jk{flex-direction:column}.jz{margin:24px -24px 0}.ka{padding:0}.kp> *{margin-right:8px}.kq> :last-child{margin-right:24px}.lh{margin-left:0px}.ls{margin-top:0px}.lt{margin-right:0px}.mj{margin:0}.mt{border:1px solid #F2F2F2}.mu{border-radius:99em}.mv{padding:0px 16px 0px 12px}.mw{height:38px}.mx{align-items:center}.mz svg{margin-right:8px}.nk{margin-top:1.56em}.nl{line-height:28px}.nm{letter-spacing:-0.003em}.oh{font-size:20px}.oi{margin-top:1.2em}.oj{letter-spacing:0}.pa{margin-top:0.67em}.pi{margin-top:1.34em}.pq{margin-top:40px}.qk{font-size:16px}.ql{margin-top:1.23em}.rq{display:inline-block}.sj{margin-bottom:20px}.sk{margin-right:0}.sv{max-width:100%}.sy{font-size:24px}.sz{line-height:30px}.ta{letter-spacing:-0.016em}.to{margin-bottom:64px}.tz{margin:32px 0 
16px}.ul{width:100%}.uq{padding-top:48px}.my:hover{border-color:#E5E5E5}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="all and (min-width: 904px) and (max-width: 1079.98px)">.i{display:none}.bv{width:64px}.cf{margin:0 64px}.cu{height:48px}.db{margin-bottom:52px}.dn{margin-bottom:48px}.ed{font-size:14px}.ee{line-height:20px}.ek{font-size:13px}.el{padding:5px 12px}.fg{display:flex}.fx{margin-bottom:50px}.gb{max-width:680px}.hi{font-size:42px}.hj{margin-top:1.19em}.hk{line-height:52px}.hl{letter-spacing:-0.011em}.ib{font-size:22px}.ic{margin-top:0.92em}.id{line-height:28px}.ik{align-items:center}.kh{border-top:solid 1px #F2F2F2}.ki{border-bottom:solid 1px #F2F2F2}.kj{margin:32px 0 0}.kk{padding:3px 8px}.kv> *{margin-right:24px}.kw> :last-child{margin-right:0}.mm{margin:0}.nu{font-size:20px}.nv{margin-top:2.14em}.nw{line-height:32px}.nx{letter-spacing:-0.003em}.or{font-size:24px}.os{margin-top:1.95em}.ot{line-height:30px}.ou{letter-spacing:-0.016em}.pd{margin-top:0.94em}.pl{margin-top:1.14em}.pt{margin-top:56px}.qr{margin-top:1.72em}.qs{line-height:24px}.qt{letter-spacing:0}.rz{flex-direction:row}.sd{margin-bottom:0}.se{margin-right:20px}.ss{max-width:500px}.tr{margin-bottom:88px}.uc{margin:40px 0 16px}.uo{width:min-width}.ut{padding-top:72px}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="all and (min-width: 728px) and (max-width: 903.98px)">.j{display:none}.w{display:flex}.x{justify-content:space-between}.bu{width:64px}.ce{margin:0 48px}.ct{height:48px}.da{margin-bottom:52px}.dm{margin-bottom:48px}.eb{font-size:13px}.ec{line-height:20px}.ej{padding:0px 8px 1px}.fw{margin-bottom:50px}.ga{max-width:680px}.he{font-size:42px}.hf{margin-top:1.19em}.hg{line-height:52px}.hh{letter-spacing:-0.011em}.hy{font-size:22px}.hz{margin-top:0.92em}.ia{line-height:28px}.ij{align-items:center}.kd{border-top:solid 1px #F2F2F2}.ke{border-bottom:solid 1px #F2F2F2}.kf{margin:32px 0 0}.kg{padding:3px 8px}.kt> 
*{margin-right:24px}.ku> :last-child{margin-right:0}.ml{margin:0}.nq{font-size:20px}.nr{margin-top:2.14em}.ns{line-height:32px}.nt{letter-spacing:-0.003em}.on{font-size:24px}.oo{margin-top:1.95em}.op{line-height:30px}.oq{letter-spacing:-0.016em}.pc{margin-top:0.94em}.pk{margin-top:1.14em}.ps{margin-top:56px}.qo{margin-top:1.72em}.qp{line-height:24px}.qq{letter-spacing:0}.sa{flex-direction:row}.sf{margin-bottom:0}.sg{margin-right:20px}.st{max-width:500px}.tq{margin-bottom:88px}.ub{margin:40px 0 16px}.un{width:min-width}.us{padding-top:72px}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="all and (min-width: 552px) and (max-width: 727.98px)">.k{display:none}.u{display:flex}.v{justify-content:space-between}.bt{width:24px}.cd{margin:0 24px}.cs{height:40px}.cz{margin-bottom:44px}.dl{margin-bottom:32px}.dz{font-size:13px}.ea{line-height:20px}.ei{padding:0px 8px 1px}.fv{margin-bottom:2px}.ha{font-size:32px}.hb{margin-top:1.01em}.hc{line-height:38px}.hd{letter-spacing:-0.014em}.hv{font-size:18px}.hw{margin-top:0.79em}.hx{line-height:24px}.ii{align-items:flex-start}.jl{flex-direction:column}.kb{margin:24px 0 0}.kc{padding:0}.kr> *{margin-right:8px}.ks> :last-child{margin-right:8px}.li{margin-left:0px}.mk{margin:0}.na{border:1px solid #F2F2F2}.nb{border-radius:99em}.nc{padding:0px 16px 0px 12px}.nd{height:38px}.ne{align-items:center}.ng svg{margin-right:8px}.nn{margin-top:1.56em}.no{line-height:28px}.np{letter-spacing:-0.003em}.ok{font-size:20px}.ol{margin-top:1.2em}.om{letter-spacing:0}.pb{margin-top:0.67em}.pj{margin-top:1.34em}.pr{margin-top:40px}.qm{font-size:16px}.qn{margin-top:1.23em}.sh{margin-bottom:20px}.si{margin-right:0}.su{max-width:100%}.tb{font-size:24px}.tc{line-height:30px}.td{letter-spacing:-0.016em}.tp{margin-bottom:64px}.ua{margin:32px 0 16px}.um{width:100%}.ur{padding-top:48px}.nf:hover{border-color:#E5E5E5}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" 
media="print">.ro{display:none}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="(orientation: landscape) and (max-width: 903.98px)">.jw{max-height:none}</style><style type="text/css" data-fela-rehydration="571" data-fela-type="RULE" media="(prefers-reduced-motion: no-preference)">.pw{transition:transform 300ms cubic-bezier(0.2, 0, 0.2, 1)}</style></head><body><div id="root"><div class="a b c"><div class="d e f g h i j k"></div><script>document.domain = document.domain;</script><div class="l c"><div class="l m n o c"><div class="p q r s t u v w x i d y z"><a class="du ag dv bf ak b am an ao ap aq ar as at s u w i d q dw z" href="https://rsci.app.link/?%24canonical_url=https%3A%2F%2Fmedium.com%2Fp%2F89de0104bcbd&amp;%7Efeature=LoOpenInAppButton&amp;%7Echannel=ShowPostUnderCollection&amp;source=---top_nav_layout_nav-----------------------------------------" rel="noopener follow">Open in app<svg xmlns="http://www.w3.org/2000/svg" width="10" height="10" fill="none" viewBox="0 0 10 10" class="dt"><path fill="currentColor" d="M.985 8.485a.375.375 0 1 0 .53.53zM8.75 1.25h.375A.375.375 0 0 0 8.75.875zM8.375 6.5a.375.375 0 1 0 .75 0zM3.5.875a.375.375 0 1 0 0 .75zm-1.985 8.14 7.5-7.5-.53-.53-7.5 7.5zm6.86-7.765V6.5h.75V1.25zM3.5 1.625h5.25v-.75H3.5z"></path></svg></a><div class="ab q"><p class="bf b dx dy dz ea eb ec ed ee ef eg du"><span><button class="bf b dx dy eh dz ea ei eb ec ej ek ee el em eg eo ep eq er es et eu ev ew ex ey ez fa fb fc fd bm fe ff" data-testid="headerSignUpButton">Sign up</button></span></p><div class="ax l"><p class="bf b dx dy dz ea eb ec ed ee ef eg du"><span><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="headerSignInButton" rel="noopener follow" href="/m/signin?operation=login&amp;redirect=https%3A%2F%2Fmedium.com%2Fcoursera-engineering%2Fdata-driven-content-categorization-89de0104bcbd&amp;source=post_page---top_nav_layout_nav-----------------------global_nav------------------">Sign 
in</a></span></p></div></div></div><div class="p q r ab ac"><div class="ab q ae"><a class="af ag ah ai aj ak al am an ao ap aq ar as at ab" aria-label="Homepage" data-testid="headerMediumLogo" rel="noopener follow" href="/?source=---top_nav_layout_nav-----------------------------------------"><svg xmlns="http://www.w3.org/2000/svg" width="719" height="160" fill="none" viewBox="0 0 719 160" class="au av aw"><path fill="#242424" d="m174.104 9.734.215-.047V8.02H130.39L89.6 103.89 48.81 8.021H1.472v1.666l.212.047c8.018 1.81 12.09 4.509 12.09 14.242V137.93c0 9.734-4.087 12.433-12.106 14.243l-.212.047v1.671h32.118v-1.665l-.213-.048c-8.018-1.809-12.089-4.509-12.089-14.242V30.586l52.399 123.305h2.972l53.925-126.743V140.75c-.687 7.688-4.721 10.062-11.982 11.701l-.215.05v1.652h55.948v-1.652l-.215-.05c-7.269-1.639-11.4-4.013-12.087-11.701l-.037-116.774h.037c0-9.733 4.071-12.432 12.087-14.242m25.555 75.488c.915-20.474 8.268-35.252 20.606-35.507 3.806.063 6.998 1.312 9.479 3.714 5.272 5.118 7.751 15.812 7.368 31.793zm-.553 5.77h65.573v-.275c-.186-15.656-4.721-27.834-13.466-36.196-7.559-7.227-18.751-11.203-30.507-11.203h-.263c-6.101 0-13.584 1.48-18.909 4.16-6.061 2.807-11.407 7.003-15.855 12.511-7.161 8.874-11.499 20.866-12.554 34.343q-.05.606-.092 1.212a50 50 0 0 0-.065 1.151 85.807 85.807 0 0 0-.094 5.689c.71 30.524 17.198 54.917 46.483 54.917 25.705 0 40.675-18.791 44.407-44.013l-1.886-.664c-6.557 13.556-18.334 21.771-31.738 20.769-18.297-1.369-32.314-19.922-31.042-42.395m139.722 41.359c-2.151 5.101-6.639 7.908-12.653 7.908s-11.513-4.129-15.418-11.63c-4.197-8.053-6.405-19.436-6.405-32.92 0-28.067 8.729-46.22 22.24-46.22 5.657 0 10.111 2.807 12.236 7.704zm43.499 20.008c-8.019-1.897-12.089-4.722-12.089-14.951V1.309l-48.716 14.353v1.757l.299-.024c6.72-.543 11.278.386 13.925 2.83 2.072 1.915 3.082 4.853 3.082 8.987v18.66c-4.803-3.067-10.516-4.56-17.448-4.56-14.059 0-26.909 5.92-36.176 16.672-9.66 11.205-14.767 26.518-14.767 44.278-.003 31.72 15.612 53.039 38.851 53.039 13.595 0 
24.533-7.449 29.54-20.013v16.865h43.711v-1.746zM424.1 19.819c0-9.904-7.468-17.374-17.375-17.374-9.859 0-17.573 7.632-17.573 17.374s7.721 17.374 17.573 17.374c9.907 0 17.375-7.47 17.375-17.374m11.499 132.546c-8.019-1.897-12.089-4.722-12.089-14.951h-.035V43.635l-43.714 12.551v1.705l.263.024c9.458.842 12.047 4.1 12.047 15.152v81.086h43.751v-1.746zm112.013 0c-8.018-1.897-12.089-4.722-12.089-14.951V43.635l-41.621 12.137v1.71l.246.026c7.733.813 9.967 4.257 9.967 15.36v59.279c-2.578 5.102-7.415 8.131-13.274 8.336-9.503 0-14.736-6.419-14.736-18.073V43.638l-43.714 12.55v1.703l.262.024c9.459.84 12.05 4.097 12.05 15.152v50.17a56.3 56.3 0 0 0 .91 10.444l.787 3.423c3.701 13.262 13.398 20.197 28.59 20.197 12.868 0 24.147-7.966 29.115-20.43v17.311h43.714v-1.747zm169.818 1.788v-1.749l-.213-.05c-8.7-2.006-12.089-5.789-12.089-13.49v-63.79c0-19.89-11.171-31.761-29.883-31.761-13.64 0-25.141 7.882-29.569 20.16-3.517-13.01-13.639-20.16-28.606-20.16-13.146 0-23.449 6.938-27.869 18.657V43.643L545.487 55.68v1.715l.263.024c9.345.829 12.047 4.181 12.047 14.95v81.784h40.787v-1.746l-.215-.053c-6.941-1.631-9.181-4.606-9.181-12.239V66.998c1.836-4.289 5.537-9.37 12.853-9.37 9.086 0 13.692 6.296 13.692 18.697v77.828h40.797v-1.746l-.215-.053c-6.94-1.631-9.18-4.606-9.18-12.239V75.066a42 42 0 0 0-.578-7.26c1.947-4.661 5.86-10.177 13.475-10.177 9.214 0 13.691 6.114 13.691 18.696v77.828z"></path></svg></a><div class="ax h"><div class="ab ay az ba bb q bc bd"><div class="bm" aria-hidden="false" aria-describedby="searchResults" aria-labelledby="searchResults"></div><div class="bn bo ab"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="none" viewBox="0 0 24 24"><path fill="currentColor" fill-rule="evenodd" d="M4.092 11.06a6.95 6.95 0 1 1 13.9 0 6.95 6.95 0 0 1-13.9 0m6.95-8.05a8.05 8.05 0 1 0 5.13 14.26l3.75 3.75a.56.56 0 1 0 .79-.79l-3.73-3.73A8.05 8.05 0 0 0 11.042 3z" clip-rule="evenodd"></path></svg></div><input role="combobox" aria-controls="searchResults" aria-expanded="false" 
aria-label="search" data-testid="headerSearchInput" tabindex="0" class="ay be bf bg z bh bi bj bk bl" placeholder="Search" value=""/></div></div></div><div class="h k w fg fh"><div class="fi ab"><span><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="headerWriteButton" rel="noopener follow" href="/m/signin?operation=register&amp;redirect=https%3A%2F%2Fmedium.com%2Fnew-story&amp;source=---top_nav_layout_nav-----------------------new_post_topnav------------------"><div class="bf b bg z du fj fk ab q fl fm"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="none" viewBox="0 0 24 24" aria-label="Write"><path fill="currentColor" d="M14 4a.5.5 0 0 0 0-1zm7 6a.5.5 0 0 0-1 0zm-7-7H4v1h10zM3 4v16h1V4zm1 17h16v-1H4zm17-1V10h-1v10zm-1 1a1 1 0 0 0 1-1h-1zM3 20a1 1 0 0 0 1 1v-1zM4 3a1 1 0 0 0-1 1h1z"></path><path stroke="currentColor" d="m17.5 4.5-8.458 8.458a.25.25 0 0 0-.06.098l-.824 2.47a.25.25 0 0 0 .316.316l2.47-.823a.25.25 0 0 0 .098-.06L19.5 6.5m-2-2 2.323-2.323a.25.25 0 0 1 .354 0l1.646 1.646a.25.25 0 0 1 0 .354L19.5 6.5m-2-2 2 2"></path></svg><div class="dt l">Write</div></div></a></span></div></div><div class="k j i d"><div class="fi ab"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="headerSearchButton" rel="noopener follow" href="/search?source=---top_nav_layout_nav-----------------------------------------"><div class="bf b bg z du fj fk ab q fl fm"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="none" viewBox="0 0 24 24" aria-label="Search"><path fill="currentColor" fill-rule="evenodd" d="M4.092 11.06a6.95 6.95 0 1 1 13.9 0 6.95 6.95 0 0 1-13.9 0m6.95-8.05a8.05 8.05 0 1 0 5.13 14.26l3.75 3.75a.56.56 0 1 0 .79-.79l-3.73-3.73A8.05 8.05 0 0 0 11.042 3z" clip-rule="evenodd"></path></svg></div></a></div></div><div class="fi h k j"><div class="ab q"><p class="bf b dx dy dz ea eb ec ed ee ef eg du"><span><button class="bf b dx dy eh dz ea ei eb ec ej ek ee el em eg eo ep eq er es et eu ev ew ex 
ey ez fa fb fc fd bm fe ff" data-testid="headerSignUpButton">Sign up</button></span></p><div class="ax l"><p class="bf b dx dy dz ea eb ec ed ee ef eg du"><span><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="headerSignInButton" rel="noopener follow" href="/m/signin?operation=login&amp;redirect=https%3A%2F%2Fmedium.com%2Fcoursera-engineering%2Fdata-driven-content-categorization-89de0104bcbd&amp;source=post_page---top_nav_layout_nav-----------------------global_nav------------------">Sign in</a></span></p></div></div></div><div class="l" aria-hidden="false"><button class="ay fn am ab q ao fo fp fq" aria-label="user options menu" data-testid="headerUserIcon"><div class="l fj"><img alt="" class="l fd by bz ca cx" src="https://miro.medium.com/v2/resize:fill:64:64/1*dmbNkD5D-u45r44go_cf0g.png" width="32" height="32" loading="lazy" role="presentation"/><div class="fr by l bz ca fs n ay ft"></div></div></button></div></div></div><div class="l"><div class="fu fv fw fx fy l"><div class="ab cb"><div class="ci bh fz ga gb gc"></div></div><article><div class="l"><div class="l"><span class="l"></span><section><div><div class="fs gi gj gk gl gm"></div><div class="gn go gp gq gr"><div class="ab cb"><div class="ci bh fz ga gb gc"><div><h1 id="fd1b" class="pw-post-title gs gt gu bf gv gw gx gy gz ha hb hc hd he hf hg hh hi hj hk hl hm hn ho hp hq bk" data-testid="storyTitle">Categorizing learning content</h1></div><div><h2 id="dddb" class="pw-subtitle-paragraph hr gt gu bf b hs ht hu hv hw hx hy hz ia ib ic id ie if ig cq du">From hand-coded to an algorithmic approach</h2><div><div class="speechify-ignore ab cp"><div class="speechify-ignore bh l"><div class="ih ii ij ik il ab"><div><div class="ab im"><div><div class="bm" aria-hidden="false"><a rel="noopener follow" href="/@cliu_88389?source=post_page---byline--89de0104bcbd---------------------------------------"><div class="l in io by ip iq"><div class="l fj"><img alt="Chris Liu" class="l fd by dd de cx" 
src="https://miro.medium.com/v2/resize:fill:88:88/0*ECSDCjFKbFRqqOIr." width="44" height="44" loading="lazy" data-testid="authorPhoto"/><div class="ir by l dd de fs n is ft"></div></div></div></a></div></div><div class="it ab fj"><div><div class="bm" aria-hidden="false"><a href="https://medium.com/coursera-engineering?source=post_page---byline--89de0104bcbd---------------------------------------" rel="noopener follow"><div class="l iu iv by ip iw"><div class="l fj"><img alt="Coursera Engineering" class="l fd by br ix cx" src="https://miro.medium.com/v2/resize:fill:48:48/1*j2vLJO9qZg435iRYfd2Mfg.png" width="24" height="24" loading="lazy" data-testid="publicationPhoto"/><div class="ir by l br ix fs n is ft"></div></div></div></a></div></div></div></div></div><div class="bn bh l"><div class="ab"><div style="flex:1"><span class="bf b bg z bk"><div class="iy ab q"><div class="ab q iz"><div class="ab q"><div><div class="bm" aria-hidden="false"><p class="bf b ja jb bk"><a class="af ag ah ai aj ak al am an ao ap aq ar jc" data-testid="authorName" rel="noopener follow" href="/@cliu_88389?source=post_page---byline--89de0104bcbd---------------------------------------">Chris Liu</a></p></div></div></div><span class="jd je" aria-hidden="true"><span class="bf b bg z du">·</span></span><p class="bf b ja jb du"><span><a class="jf jg ah ai aj ak al am an ao ap aq ar ex jh ji" rel="noopener follow" href="/m/signin?actionUrl=https%3A%2F%2Fmedium.com%2F_%2Fsubscribe%2Fuser%2F70814e310ce3&amp;operation=register&amp;redirect=https%3A%2F%2Fmedium.com%2Fcoursera-engineering%2Fdata-driven-content-categorization-89de0104bcbd&amp;user=Chris+Liu&amp;userId=70814e310ce3&amp;source=post_page-70814e310ce3--byline--89de0104bcbd---------------------post_header------------------">Follow</a></span></p></div></div></span></div></div><div class="l jj"><span class="bf b bg z du"><div class="ab cn jk jl jm"><div class="fu fv ab"><div class="bf b bg z du ab jn"><span class="jo l jj">Published 
in</span><div><div class="l" aria-hidden="false"><a class="af ag ah ai aj ak al am an ao ap aq ar jc ab q" data-testid="publicationName" href="https://medium.com/coursera-engineering?source=post_page---byline--89de0104bcbd---------------------------------------" rel="noopener follow"><p class="bf b bg z jp jq jr js jt ju jv jw bk">Coursera Engineering</p></a></div></div></div><div class="h k"><span class="jd je" aria-hidden="true"><span class="bf b bg z du">·</span></span></div></div><span class="bf b bg z du"><div class="ab ae"><span data-testid="storyReadTime">5 min read</span><div class="jx jy l" aria-hidden="true"><span class="l" aria-hidden="true"><span class="bf b bg z du">·</span></span></div><span data-testid="storyPublishDate">Sep 12, 2018</span></div></span></div></span></div></div></div><div class="ab cp jz ka kb kc kd ke kf kg kh ki kj kk kl km kn ko"><div class="h k w fg fh q"><div class="le l"><div class="ab q lf lg"><div class="pw-multi-vote-icon fj jo lh li lj"><span><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="headerClapButton" rel="noopener follow" href="/m/signin?actionUrl=https%3A%2F%2Fmedium.com%2F_%2Fvote%2Fcoursera-engineering%2F89de0104bcbd&amp;operation=register&amp;redirect=https%3A%2F%2Fmedium.com%2Fcoursera-engineering%2Fdata-driven-content-categorization-89de0104bcbd&amp;user=Chris+Liu&amp;userId=70814e310ce3&amp;source=---header_actions--89de0104bcbd---------------------clap_footer------------------"><div><div class="bm" aria-hidden="false"><div class="lk ao ll lm ln lo am lp lq lr lj"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" viewBox="0 0 24 24" aria-label="clap"><path fill-rule="evenodd" d="M11.37.828 12 3.282l.63-2.454zM13.916 3.953l1.523-2.112-1.184-.39zM8.589 1.84l1.522 2.112-.337-2.501zM18.523 18.92c-.86.86-1.75 1.246-2.62 1.33a6 6 0 0 0 .407-.372c2.388-2.389 2.86-4.951 1.399-7.623l-.912-1.603-.79-1.672c-.26-.56-.194-.98.203-1.288a.7.7 0 0 1 .546-.132c.283.046.546.231.728.5l2.363 
4.157c.976 1.624 1.141 4.237-1.324 6.702m-10.999-.438L3.37 14.328a.828.828 0 0 1 .585-1.408.83.83 0 0 1 .585.242l2.158 2.157a.365.365 0 0 0 .516-.516l-2.157-2.158-1.449-1.449a.826.826 0 0 1 1.167-1.17l3.438 3.44a.363.363 0 0 0 .516 0 .364.364 0 0 0 0-.516L5.293 9.513l-.97-.97a.826.826 0 0 1 0-1.166.84.84 0 0 1 1.167 0l.97.968 3.437 3.436a.36.36 0 0 0 .517 0 .366.366 0 0 0 0-.516L6.977 7.83a.82.82 0 0 1-.241-.584.82.82 0 0 1 .824-.826c.219 0 .43.087.584.242l5.787 5.787a.366.366 0 0 0 .587-.415l-1.117-2.363c-.26-.56-.194-.98.204-1.289a.7.7 0 0 1 .546-.132c.283.046.545.232.727.501l2.193 3.86c1.302 2.38.883 4.59-1.277 6.75-1.156 1.156-2.602 1.627-4.19 1.367-1.418-.236-2.866-1.033-4.079-2.246M10.75 5.971l2.12 2.12c-.41.502-.465 1.17-.128 1.89l.22.465-3.523-3.523a.8.8 0 0 1-.097-.368c0-.22.086-.428.241-.584a.847.847 0 0 1 1.167 0m7.355 1.705c-.31-.461-.746-.758-1.23-.837a1.44 1.44 0 0 0-1.11.275c-.312.24-.505.543-.59.881a1.74 1.74 0 0 0-.906-.465 1.47 1.47 0 0 0-.82.106l-2.182-2.182a1.56 1.56 0 0 0-2.2 0 1.54 1.54 0 0 0-.396.701 1.56 1.56 0 0 0-2.21-.01 1.55 1.55 0 0 0-.416.753c-.624-.624-1.649-.624-2.237-.037a1.557 1.557 0 0 0 0 2.2c-.239.1-.501.238-.715.453a1.56 1.56 0 0 0 0 2.2l.516.515a1.556 1.556 0 0 0-.753 2.615L7.01 19c1.32 1.319 2.909 2.189 4.475 2.449q.482.08.971.08c.85 0 1.653-.198 2.393-.579.231.033.46.054.686.054 1.266 0 2.457-.52 3.505-1.567 2.763-2.763 2.552-5.734 1.439-7.586z" clip-rule="evenodd"></path></svg></div></div></div></a></span></div><div class="pw-multi-vote-count l ls lt lu lv lw lx ly"><p class="bf b dv z du"><span class="lz">--</span></p></div></div></div><div><div class="bm" aria-hidden="false"><button class="ao lk mc md ab q fk me mf" aria-label="responses"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" viewBox="0 0 24 24" class="mb"><path d="M18.006 16.803c1.533-1.456 2.234-3.325 2.234-5.321C20.24 7.357 16.709 4 12.191 4S4 7.357 4 11.482c0 4.126 3.674 7.482 8.191 7.482.817 0 1.622-.111 2.393-.327.231.2.48.391.744.559 
1.06.693 2.203 1.044 3.399 1.044.224-.008.4-.112.486-.287a.49.49 0 0 0-.042-.518c-.495-.67-.845-1.364-1.04-2.057a4 4 0 0 1-.125-.598zm-3.122 1.055-.067-.223-.315.096a8 8 0 0 1-2.311.338c-4.023 0-7.292-2.955-7.292-6.587 0-3.633 3.269-6.588 7.292-6.588 4.014 0 7.112 2.958 7.112 6.593 0 1.794-.608 3.469-2.027 4.72l-.195.168v.255c0 .056 0 .151.016.295.025.231.081.478.154.733.154.558.398 1.117.722 1.659a5.3 5.3 0 0 1-2.165-.845c-.276-.176-.714-.383-.941-.59z"></path></svg><p class="bf b dv z du"><span class="pw-responses-count ma mb">4</span></p></button></div></div></div><div class="ab q kp kq kr ks kt ku kv kw kx ky kz la lb lc ld"><div class="mg k j i d"></div><div class="h k"><div><div class="bm" aria-hidden="false"><span><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="headerBookmarkButton" rel="noopener follow" href="/m/signin?actionUrl=https%3A%2F%2Fmedium.com%2F_%2Fbookmark%2Fp%2F89de0104bcbd&amp;operation=register&amp;redirect=https%3A%2F%2Fmedium.com%2Fcoursera-engineering%2Fdata-driven-content-categorization-89de0104bcbd&amp;source=---header_actions--89de0104bcbd---------------------bookmark_footer------------------"><svg xmlns="http://www.w3.org/2000/svg" width="25" height="25" fill="none" viewBox="0 0 25 25" class="du mh" aria-label="Add to list bookmark button"><path fill="currentColor" d="M18 2.5a.5.5 0 0 1 1 0V5h2.5a.5.5 0 0 1 0 1H19v2.5a.5.5 0 1 1-1 0V6h-2.5a.5.5 0 0 1 0-1H18zM7 7a1 1 0 0 1 1-1h3.5a.5.5 0 0 0 0-1H8a2 2 0 0 0-2 2v14a.5.5 0 0 0 .805.396L12.5 17l5.695 4.396A.5.5 0 0 0 19 21v-8.5a.5.5 0 0 0-1 0v7.485l-5.195-4.012a.5.5 0 0 0-.61 0L7 19.985z"></path></svg></a></span></div></div></div><div class="fd mi cn"><div class="l ae"><div class="ab cb"><div class="mj mk ml mm mn mo ci bh"><div class="ab"><div class="bm" aria-hidden="false"><div><div class="bm" aria-hidden="false"><button aria-label="Listen" data-testid="audioPlayButton" class="af fk ah ai aj ak al mp an ao ap ex mq mr mf ms mt mu mv mw s mx my mz na nb nc nd u ne nf 
ng"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="none" viewBox="0 0 24 24"><path fill="currentColor" fill-rule="evenodd" d="M3 12a9 9 0 1 1 18 0 9 9 0 0 1-18 0m9-10C6.477 2 2 6.477 2 12s4.477 10 10 10 10-4.477 10-10S17.523 2 12 2m3.376 10.416-4.599 3.066a.5.5 0 0 1-.777-.416V8.934a.5.5 0 0 1 .777-.416l4.599 3.066a.5.5 0 0 1 0 .832" clip-rule="evenodd"></path></svg><div class="j i d"><p class="bf b bg z du">Listen</p></div></button></div></div></div></div></div></div></div></div><div class="bm" aria-hidden="false" aria-describedby="postFooterSocialMenu" aria-labelledby="postFooterSocialMenu"><div><div class="bm" aria-hidden="false"><button aria-controls="postFooterSocialMenu" aria-expanded="false" aria-label="Share Post" data-testid="headerSocialShareButton" class="af fk ah ai aj ak al mp an ao ap ex mq mr mf ms mt mu mv mw s mx my mz na nb nc nd u ne nf ng"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="none" viewBox="0 0 24 24"><path fill="currentColor" fill-rule="evenodd" d="M15.218 4.931a.4.4 0 0 1-.118.132l.012.006a.45.45 0 0 1-.292.074.5.5 0 0 1-.3-.13l-2.02-2.02v7.07c0 .28-.23.5-.5.5s-.5-.22-.5-.5v-7.04l-2 2a.45.45 0 0 1-.57.04h-.02a.4.4 0 0 1-.16-.3.4.4 0 0 1 .1-.32l2.8-2.8a.5.5 0 0 1 .7 0l2.8 2.79a.42.42 0 0 1 .068.498m-.106.138.008.004v-.01zM16 7.063h1.5a2 2 0 0 1 2 2v10a2 2 0 0 1-2 2h-11c-1.1 0-2-.9-2-2v-10a2 2 0 0 1 2-2H8a.5.5 0 0 1 .35.15.5.5 0 0 1 .15.35.5.5 0 0 1-.15.35.5.5 0 0 1-.35.15H6.4c-.5 0-.9.4-.9.9v10.2a.9.9 0 0 0 .9.9h11.2c.5 0 .9-.4.9-.9v-10.2c0-.5-.4-.9-.9-.9H16a.5.5 0 0 1 0-1" clip-rule="evenodd"></path></svg><div class="j i d"><p class="bf b bg z du">Share</p></div></button></div></div></div></div></div></div></div></div></div><p id="1140" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">Courses on Coursera cover topics ranging from<a class="af od" href="https://www.coursera.org/learn/photography" rel="noopener ugc nofollow" 
target="_blank"> photography</a> to<a class="af od" href="https://www.coursera.org/learn/probabilistic-graphical-models" rel="noopener ugc nofollow" target="_blank"> probabilistic graphical models</a> to<a class="af od" href="https://www.coursera.org/learn/muslim-world" rel="noopener ugc nofollow" target="_blank"> constitutional struggles in the Muslim world</a>. This diversity makes them hard to categorize. A couple of years ago we overhauled our course categories and implemented a new categorization system we call domains and subdomains. This post covers how we defined and implemented that new system.</p><h1 id="1df7" class="oe of gu bf og oh oi hu oj ok ol hx om on oo op oq or os ot ou ov ow ox oy oz bk">The Previous Course Categories</h1><p id="be48" class="pw-post-body-paragraph nh ni gu nj b hs pa nl nm hv pb no np nq pc ns nt nu pd nw nx ny pe oa ob oc gn bk">Coursera’s original categorization scheme dated back to our founding in 2012, and was heavily influenced by the content available at the time. For example, we had five categories of computer science subfields, but only one category for all of the humanities. The categories were also manually and arbitrarily defined, resulting in redundancies (e.g., “Food and Nutrition” being nearly a subset of “Health and Society”) and vagueness (e.g., “Information, Tech &amp; Design”).</p><p id="095b" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">Critically, the original categorization scheme was not meeting our need of effectively matching learners to content. For example, the “Medicine” category attracted two distinct groups of learners — because it contained two distinct groups of courses. 
The first were courses that appealed to healthcare practitioners (e.g., on <a class="af od" href="https://www.coursera.org/learn/clinical-kidney-transplantation" rel="noopener ugc nofollow" target="_blank">clinical kidney transplantation</a> or <a class="af od" href="https://www.coursera.org/learn/biocontainment" rel="noopener ugc nofollow" target="_blank">biocontainment for infectious diseases</a>). The second were courses on public health issues that appealed to non-practitioners.</p><p id="89d4" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">As our catalog expands to thousands of courses, we need a principled organization technique. We want categories that help the learner find the best content for them. This translates to the following criteria:</p><ol class=""><li id="c30c" class="nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc pf pg ph bk">Simple (as few categories as possible)</li><li id="237c" class="nh ni gu nj b hs pi nl nm hv pj no np nq pk ns nt nu pl nw nx ny pm oa ob oc pf pg ph bk">Minimally redundant (as mutually exclusive as possible)</li></ol><h1 id="abce" class="oe of gu bf og oh oi hu oj ok ol hx om on oo op oq or os ot ou ov ow ox oy oz bk">t-SNE to the rescue</h1><p id="fe80" class="pw-post-body-paragraph nh ni gu nj b hs pa nl nm hv pb no np nq pc ns nt nu pd nw nx ny pe oa ob oc gn bk">Rather than re-coding by hand, or replicating traditional university departments, we took a data-driven approach.</p><p id="21d1" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">We sought to group our courses so that someone interested in one course in that group, say, <a class="af od" href="https://www.coursera.org/learn/guitar" rel="noopener ugc nofollow" target="_blank">playing the guitar</a>, might also be interested in other courses in that group, say, <a class="af od" 
href="https://www.coursera.org/learn/songwriting-lyrics" rel="noopener ugc nofollow" target="_blank">songwriting</a> or <a class="af od" href="https://www.coursera.org/learn/jazz-improvisation" rel="noopener ugc nofollow" target="_blank">jazz improvisation</a>. The algorithm known as t-distributed stochastic neighbor embedding (<a class="af od" href="https://lvdmaaten.github.io/tsne/" rel="noopener ugc nofollow" target="_blank">t-SNE</a>) satisfies this requirement.</p><p id="058d" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">t-SNE identifies an arrangement of courses such that courses sharing common learners are close and courses that do not share common learners are far apart. For example, <a class="af od" href="https://www.coursera.org/learn/complex-analysis" rel="noopener ugc nofollow" target="_blank">Complex Analysis</a> and <a class="af od" href="https://www.coursera.org/learn/galois" rel="noopener ugc nofollow" target="_blank">Galois Theory</a> are close together since many learners take both, while <a class="af od" href="https://www.coursera.org/learn/horse-care" rel="noopener ugc nofollow" target="_blank">Taking Care of Horses</a> and <a class="af od" href="https://www.coursera.org/learn/general-relativity" rel="noopener ugc nofollow" target="_blank">General Relativity</a> are farther apart as the two courses do not share many learners.</p><p id="e67e" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">We utilized the t-SNE algorithm on courses in 2015 to produce the scatterplot output as shown below. Each dot represents a single course. 
We then group these courses into categories by clustering (represented by the coloring).</p><figure class="pq pr ps pt pu pv pn po paragraph-image"><div role="button" tabindex="0" class="pw px fj py bh pz"><div class="pn po pp"><picture><source srcSet="https://miro.medium.com/v2/resize:fit:640/format:webp/0*MKkkbhhYA7Tcus_L 640w, https://miro.medium.com/v2/resize:fit:720/format:webp/0*MKkkbhhYA7Tcus_L 720w, https://miro.medium.com/v2/resize:fit:750/format:webp/0*MKkkbhhYA7Tcus_L 750w, https://miro.medium.com/v2/resize:fit:786/format:webp/0*MKkkbhhYA7Tcus_L 786w, https://miro.medium.com/v2/resize:fit:828/format:webp/0*MKkkbhhYA7Tcus_L 828w, https://miro.medium.com/v2/resize:fit:1100/format:webp/0*MKkkbhhYA7Tcus_L 1100w, https://miro.medium.com/v2/resize:fit:1400/format:webp/0*MKkkbhhYA7Tcus_L 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px" type="image/webp"/><source data-testid="og" srcSet="https://miro.medium.com/v2/resize:fit:640/0*MKkkbhhYA7Tcus_L 640w, https://miro.medium.com/v2/resize:fit:720/0*MKkkbhhYA7Tcus_L 720w, https://miro.medium.com/v2/resize:fit:750/0*MKkkbhhYA7Tcus_L 750w, https://miro.medium.com/v2/resize:fit:786/0*MKkkbhhYA7Tcus_L 786w, https://miro.medium.com/v2/resize:fit:828/0*MKkkbhhYA7Tcus_L 828w, https://miro.medium.com/v2/resize:fit:1100/0*MKkkbhhYA7Tcus_L 1100w, https://miro.medium.com/v2/resize:fit:1400/0*MKkkbhhYA7Tcus_L 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 
67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px"/><img alt="" class="bh mo qa c" width="700" height="687" loading="lazy" role="presentation"/></picture></div></div><figcaption class="qb ff qc pn po qd qe bf b bg z du">Figure 1: t-SNE visualization of courses colored by cluster, circa 2015.</figcaption></figure><h1 id="8d62" class="oe of gu bf og oh oi hu oj ok ol hx om on oo op oq or os ot ou ov ow ox oy oz bk">The general structure of our content</h1><figure class="pq pr ps pt pu pv pn po paragraph-image"><div role="button" tabindex="0" class="pw px fj py bh pz"><div class="pn po qf"><picture><source srcSet="https://miro.medium.com/v2/resize:fit:640/format:webp/1*c_utWA_Qi-HFw4tVDU3JyA.png 640w, https://miro.medium.com/v2/resize:fit:720/format:webp/1*c_utWA_Qi-HFw4tVDU3JyA.png 720w, https://miro.medium.com/v2/resize:fit:750/format:webp/1*c_utWA_Qi-HFw4tVDU3JyA.png 750w, https://miro.medium.com/v2/resize:fit:786/format:webp/1*c_utWA_Qi-HFw4tVDU3JyA.png 786w, https://miro.medium.com/v2/resize:fit:828/format:webp/1*c_utWA_Qi-HFw4tVDU3JyA.png 828w, https://miro.medium.com/v2/resize:fit:1100/format:webp/1*c_utWA_Qi-HFw4tVDU3JyA.png 1100w, https://miro.medium.com/v2/resize:fit:1400/format:webp/1*c_utWA_Qi-HFw4tVDU3JyA.png 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 
700px" type="image/webp"/><source data-testid="og" srcSet="https://miro.medium.com/v2/resize:fit:640/1*c_utWA_Qi-HFw4tVDU3JyA.png 640w, https://miro.medium.com/v2/resize:fit:720/1*c_utWA_Qi-HFw4tVDU3JyA.png 720w, https://miro.medium.com/v2/resize:fit:750/1*c_utWA_Qi-HFw4tVDU3JyA.png 750w, https://miro.medium.com/v2/resize:fit:786/1*c_utWA_Qi-HFw4tVDU3JyA.png 786w, https://miro.medium.com/v2/resize:fit:828/1*c_utWA_Qi-HFw4tVDU3JyA.png 828w, https://miro.medium.com/v2/resize:fit:1100/1*c_utWA_Qi-HFw4tVDU3JyA.png 1100w, https://miro.medium.com/v2/resize:fit:1400/1*c_utWA_Qi-HFw4tVDU3JyA.png 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px"/><img alt="" class="bh mo qa c" width="700" height="416" loading="lazy" role="presentation"/></picture></div></div><figcaption class="qb ff qc pn po qd qe bf b bg z du">Figure 2. 
General subject area of courses.</figcaption></figure><p id="98ec" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">Looking at Figures 1 and 2, the first thing we see is that courses are organized in a globally consistent way: humanities, social sciences, and business courses are in the top right half of the plot, while natural sciences, engineering, and computational sciences courses fall in the bottom left half.</p><p id="724c" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">Digging in more granularly reveals additional nuance:</p><ul class=""><li id="cf60" class="nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc qg pg ph bk">Courses on business and finance are clustered together on the right</li><li id="11c1" class="nh ni gu nj b hs pi nl nm hv pj no np nq pk ns nt nu pl nw nx ny pm oa ob oc qg pg ph bk">Courses about the natural sciences (physics, chemistry, and biology) are on the left</li><li id="5b6b" class="nh ni gu nj b hs pi nl nm hv pj no np nq pk ns nt nu pl nw nx ny pm oa ob oc qg pg ph bk">Courses on the computational sciences (math, cs, and statistics) are at the bottom</li><li id="02ce" class="nh ni gu nj b hs pi nl nm hv pj no np nq pk ns nt nu pl nw nx ny pm oa ob oc qg pg ph bk">Courses on the social sciences and humanities are at the top</li></ul><figure class="pq pr ps pt pu pv pn po paragraph-image"><div role="button" tabindex="0" class="pw px fj py bh pz"><div class="pn po qh"><picture><source srcSet="https://miro.medium.com/v2/resize:fit:640/format:webp/1*-yZ59kN7MjqgnKq2tXTlQA.png 640w, https://miro.medium.com/v2/resize:fit:720/format:webp/1*-yZ59kN7MjqgnKq2tXTlQA.png 720w, https://miro.medium.com/v2/resize:fit:750/format:webp/1*-yZ59kN7MjqgnKq2tXTlQA.png 750w, https://miro.medium.com/v2/resize:fit:786/format:webp/1*-yZ59kN7MjqgnKq2tXTlQA.png 786w, 
https://miro.medium.com/v2/resize:fit:828/format:webp/1*-yZ59kN7MjqgnKq2tXTlQA.png 828w, https://miro.medium.com/v2/resize:fit:1100/format:webp/1*-yZ59kN7MjqgnKq2tXTlQA.png 1100w, https://miro.medium.com/v2/resize:fit:1400/format:webp/1*-yZ59kN7MjqgnKq2tXTlQA.png 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px" type="image/webp"/><source data-testid="og" srcSet="https://miro.medium.com/v2/resize:fit:640/1*-yZ59kN7MjqgnKq2tXTlQA.png 640w, https://miro.medium.com/v2/resize:fit:720/1*-yZ59kN7MjqgnKq2tXTlQA.png 720w, https://miro.medium.com/v2/resize:fit:750/1*-yZ59kN7MjqgnKq2tXTlQA.png 750w, https://miro.medium.com/v2/resize:fit:786/1*-yZ59kN7MjqgnKq2tXTlQA.png 786w, https://miro.medium.com/v2/resize:fit:828/1*-yZ59kN7MjqgnKq2tXTlQA.png 828w, https://miro.medium.com/v2/resize:fit:1100/1*-yZ59kN7MjqgnKq2tXTlQA.png 1100w, https://miro.medium.com/v2/resize:fit:1400/1*-yZ59kN7MjqgnKq2tXTlQA.png 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px"/><img alt="" class="bh mo qa c" width="700" height="413" loading="lazy" role="presentation"/></picture></div></div><figcaption class="qb ff qc pn po 
qd qe bf b bg z du">Figure 3. General division of science and humanities courses.</figcaption></figure><figure class="pq pr ps pt pu pv pn po paragraph-image"><div role="button" tabindex="0" class="pw px fj py bh pz"><div class="pn po qi"><picture><source srcSet="https://miro.medium.com/v2/resize:fit:640/format:webp/1*A-lEgYtSuSKQZ21ves4JOw.png 640w, https://miro.medium.com/v2/resize:fit:720/format:webp/1*A-lEgYtSuSKQZ21ves4JOw.png 720w, https://miro.medium.com/v2/resize:fit:750/format:webp/1*A-lEgYtSuSKQZ21ves4JOw.png 750w, https://miro.medium.com/v2/resize:fit:786/format:webp/1*A-lEgYtSuSKQZ21ves4JOw.png 786w, https://miro.medium.com/v2/resize:fit:828/format:webp/1*A-lEgYtSuSKQZ21ves4JOw.png 828w, https://miro.medium.com/v2/resize:fit:1100/format:webp/1*A-lEgYtSuSKQZ21ves4JOw.png 1100w, https://miro.medium.com/v2/resize:fit:1400/format:webp/1*A-lEgYtSuSKQZ21ves4JOw.png 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px" type="image/webp"/><source data-testid="og" srcSet="https://miro.medium.com/v2/resize:fit:640/1*A-lEgYtSuSKQZ21ves4JOw.png 640w, https://miro.medium.com/v2/resize:fit:720/1*A-lEgYtSuSKQZ21ves4JOw.png 720w, https://miro.medium.com/v2/resize:fit:750/1*A-lEgYtSuSKQZ21ves4JOw.png 750w, https://miro.medium.com/v2/resize:fit:786/1*A-lEgYtSuSKQZ21ves4JOw.png 786w, https://miro.medium.com/v2/resize:fit:828/1*A-lEgYtSuSKQZ21ves4JOw.png 828w, https://miro.medium.com/v2/resize:fit:1100/1*A-lEgYtSuSKQZ21ves4JOw.png 1100w, https://miro.medium.com/v2/resize:fit:1400/1*A-lEgYtSuSKQZ21ves4JOw.png 1400w" 
sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px"/><img alt="" class="bh mo qa c" width="700" height="557" loading="lazy" role="presentation"/></picture></div></div><figcaption class="qb ff qc pn po qd qe bf b bg z du">Figure 4. Substructure of courses within each half of the plot.</figcaption></figure><p id="5fd8" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">Dissecting each of these large regions further, we see that even within each grouping, courses are arranged logically. For example, courses in natural history span a continuum roughly from the biological sciences to the physical sciences. Similarly, courses in humanities and social science range roughly from music to the visual arts, humanities, and social sciences, and then practical business.</p><p id="9577" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">Even at the level of individual courses, t-SNE captures the interdisciplinary nature of courses. 
Courses in business law, for example, fall on the boundary between business and law, and courses on quantitative methods for the social sciences fall between math and the social sciences.</p><figure class="pq pr ps pt pu pv pn po paragraph-image"><div role="button" tabindex="0" class="pw px fj py bh pz"><div class="pn po qf"><picture><source srcSet="https://miro.medium.com/v2/resize:fit:640/format:webp/1*_uuoe43USer2SKMxm98igA.png 640w, https://miro.medium.com/v2/resize:fit:720/format:webp/1*_uuoe43USer2SKMxm98igA.png 720w, https://miro.medium.com/v2/resize:fit:750/format:webp/1*_uuoe43USer2SKMxm98igA.png 750w, https://miro.medium.com/v2/resize:fit:786/format:webp/1*_uuoe43USer2SKMxm98igA.png 786w, https://miro.medium.com/v2/resize:fit:828/format:webp/1*_uuoe43USer2SKMxm98igA.png 828w, https://miro.medium.com/v2/resize:fit:1100/format:webp/1*_uuoe43USer2SKMxm98igA.png 1100w, https://miro.medium.com/v2/resize:fit:1400/format:webp/1*_uuoe43USer2SKMxm98igA.png 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px" type="image/webp"/><source data-testid="og" srcSet="https://miro.medium.com/v2/resize:fit:640/1*_uuoe43USer2SKMxm98igA.png 640w, https://miro.medium.com/v2/resize:fit:720/1*_uuoe43USer2SKMxm98igA.png 720w, https://miro.medium.com/v2/resize:fit:750/1*_uuoe43USer2SKMxm98igA.png 750w, https://miro.medium.com/v2/resize:fit:786/1*_uuoe43USer2SKMxm98igA.png 786w, https://miro.medium.com/v2/resize:fit:828/1*_uuoe43USer2SKMxm98igA.png 828w, https://miro.medium.com/v2/resize:fit:1100/1*_uuoe43USer2SKMxm98igA.png 1100w, 
https://miro.medium.com/v2/resize:fit:1400/1*_uuoe43USer2SKMxm98igA.png 1400w" sizes="(min-resolution: 4dppx) and (max-width: 700px) 50vw, (-webkit-min-device-pixel-ratio: 4) and (max-width: 700px) 50vw, (min-resolution: 3dppx) and (max-width: 700px) 67vw, (-webkit-min-device-pixel-ratio: 3) and (max-width: 700px) 65vw, (min-resolution: 2.5dppx) and (max-width: 700px) 80vw, (-webkit-min-device-pixel-ratio: 2.5) and (max-width: 700px) 80vw, (min-resolution: 2dppx) and (max-width: 700px) 100vw, (-webkit-min-device-pixel-ratio: 2) and (max-width: 700px) 100vw, 700px"/><img alt="" class="bh mo qa c" width="700" height="397" loading="lazy" role="presentation"/></picture></div></div><figcaption class="qb ff qc pn po qd qe bf b bg z du">Figure 5. Interdisciplinary courses sit roughly between the right clusters.</figcaption></figure><p id="9737" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">Returning to the set of courses previously categorized as “medicine,” we now have three sub-categories. First is a relatively disjointed cluster of courses targeted to the medical professional (e.g., “<a class="af od" href="https://www.coursera.org/learn/ebola-essentials-for-health-professionals" rel="noopener ugc nofollow" target="_blank">Ebola: Essential Knowledge for the Healthcare Professional</a>”). 
Second is a cluster of courses on healthcare policy (e.g., “<a class="af od" href="https://www.coursera.org/learn/systems-thinking" rel="noopener ugc nofollow" target="_blank">Systems Thinking in Public Health</a>”), and lastly, we have a cluster on basic biology (e.g., “<a class="af od" href="https://www.coursera.org/learn/genetics-evolution" rel="noopener ugc nofollow" target="_blank">Introduction to Genetics and Evolution</a>”).</p><p id="25bc" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">The result is noteworthy because there is no strong reason why t-SNE should arrange our courses by subject matter. We weren’t feeding in course descriptions or transcripts, just the enrollment behavior of learners. We attribute the clusterability of courses to the fact that learners are much more likely to be interested in multiple courses in a particular subject area rather than to be influenced in their course decision by non-subject-matter factors such as the style of instruction or the institution offering the course.</p><p id="664e" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">That said, this assumption does not hold across the full catalog. For example, among non-English content, the language of instruction is more a driver of enrollment than the subject area. Correspondingly, a French or Russian course is more likely to be grouped with other courses taught in the respective language than it is to be grouped with other courses on the same subject.</p><p id="478e" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk">After some cleanup, we landed at 36 course clusters, which rolled up into nine larger clusters. 
On the Coursera platform today, we term the original clusters “subdomains” and the larger clusters “domains.” We launched the new system of domains and subdomains in summer 2015. In the past three years, it has become an integral part of Coursera’s content discovery experience, allowing us to scale content categorization and drive personalization for each and every learner on our platform.</p><h2 id="c134" class="qj of gu bf og qk ql dy oj qm qn ea om nq qo qp qq nu qr qs qt ny qu qv qw qx bk">Acknowledgements</h2><p id="4ee7" class="pw-post-body-paragraph nh ni gu nj b hs pa nl nm hv pb no np nq pc ns nt nu pd nw nx ny pe oa ob oc gn bk"><em class="qy">Credit for the t-SNE approach goes to </em><a class="af od" href="https://www.linkedin.com/in/zhenghao-chen-44865036/" rel="noopener ugc nofollow" target="_blank"><em class="qy">Zhenghao Chen</em></a><em class="qy">, a former Coursera data scientist.</em></p><p id="e9e1" class="pw-post-body-paragraph nh ni gu nj b hs nk nl nm hv nn no np nq nr ns nt nu nv nw nx ny nz oa ob oc gn bk"><em class="qy">I also want to thank </em><a class="af od" href="https://www.linkedin.com/in/egsands/" rel="noopener ugc nofollow" target="_blank"><em class="qy">Emily Glassberg Sands</em></a><em class="qy"> for reading through and giving feedback on drafts.</em></p></div></div></div></div></section></div></div></article></div><div class="ab cb"><div class="ci bh fz ga gb gc"><div class="qz ra ab jm"><div class="rb ab"><a class="rc ay am ao" rel="noopener follow" href="/tag/data-science?source=post_page-----89de0104bcbd---------------------------------------"><div class="rd fj cx re ge rf rg bf b bg z bk rh">Data Science</div></a></div><div class="rb ab"><a class="rc ay am ao" rel="noopener follow" href="/tag/education?source=post_page-----89de0104bcbd---------------------------------------"><div class="rd fj cx re ge rf rg bf b bg z bk rh">Education</div></a></div><div class="rb ab"><a class="rc ay am ao" rel="noopener follow" 
href="/tag/technology?source=post_page-----89de0104bcbd---------------------------------------"><div class="rd fj cx re ge rf rg bf b bg z bk rh">Technology</div></a></div></div></div></div><div class="l"></div><footer class="ri rj rk rl rm ab q rn iw c"><div class="l ae"><div class="ab cb"><div class="ci bh fz ga gb gc"><div class="ab cp ro"><div class="ab q lf"><div class="rp l"><span class="l rq rr rs e d"><div class="ab q lf lg"><div class="pw-multi-vote-icon fj jo lh li lj"><span><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="footerClapButton" rel="noopener follow" href="/m/signin?actionUrl=https%3A%2F%2Fmedium.com%2F_%2Fvote%2Fcoursera-engineering%2F89de0104bcbd&amp;operation=register&amp;redirect=https%3A%2F%2Fmedium.com%2Fcoursera-engineering%2Fdata-driven-content-categorization-89de0104bcbd&amp;user=Chris+Liu&amp;userId=70814e310ce3&amp;source=---footer_actions--89de0104bcbd---------------------clap_footer------------------"><div><div class="bm" aria-hidden="false"><div class="lk ao ll lm ln lo am lp lq lr lj"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" viewBox="0 0 24 24" aria-label="clap"><path fill-rule="evenodd" d="M11.37.828 12 3.282l.63-2.454zM13.916 3.953l1.523-2.112-1.184-.39zM8.589 1.84l1.522 2.112-.337-2.501zM18.523 18.92c-.86.86-1.75 1.246-2.62 1.33a6 6 0 0 0 .407-.372c2.388-2.389 2.86-4.951 1.399-7.623l-.912-1.603-.79-1.672c-.26-.56-.194-.98.203-1.288a.7.7 0 0 1 .546-.132c.283.046.546.231.728.5l2.363 4.157c.976 1.624 1.141 4.237-1.324 6.702m-10.999-.438L3.37 14.328a.828.828 0 0 1 .585-1.408.83.83 0 0 1 .585.242l2.158 2.157a.365.365 0 0 0 .516-.516l-2.157-2.158-1.449-1.449a.826.826 0 0 1 1.167-1.17l3.438 3.44a.363.363 0 0 0 .516 0 .364.364 0 0 0 0-.516L5.293 9.513l-.97-.97a.826.826 0 0 1 0-1.166.84.84 0 0 1 1.167 0l.97.968 3.437 3.436a.36.36 0 0 0 .517 0 .366.366 0 0 0 0-.516L6.977 7.83a.82.82 0 0 1-.241-.584.82.82 0 0 1 .824-.826c.219 0 .43.087.584.242l5.787 5.787a.366.366 0 0 0 
.587-.415l-1.117-2.363c-.26-.56-.194-.98.204-1.289a.7.7 0 0 1 .546-.132c.283.046.545.232.727.501l2.193 3.86c1.302 2.38.883 4.59-1.277 6.75-1.156 1.156-2.602 1.627-4.19 1.367-1.418-.236-2.866-1.033-4.079-2.246M10.75 5.971l2.12 2.12c-.41.502-.465 1.17-.128 1.89l.22.465-3.523-3.523a.8.8 0 0 1-.097-.368c0-.22.086-.428.241-.584a.847.847 0 0 1 1.167 0m7.355 1.705c-.31-.461-.746-.758-1.23-.837a1.44 1.44 0 0 0-1.11.275c-.312.24-.505.543-.59.881a1.74 1.74 0 0 0-.906-.465 1.47 1.47 0 0 0-.82.106l-2.182-2.182a1.56 1.56 0 0 0-2.2 0 1.54 1.54 0 0 0-.396.701 1.56 1.56 0 0 0-2.21-.01 1.55 1.55 0 0 0-.416.753c-.624-.624-1.649-.624-2.237-.037a1.557 1.557 0 0 0 0 2.2c-.239.1-.501.238-.715.453a1.56 1.56 0 0 0 0 2.2l.516.515a1.556 1.556 0 0 0-.753 2.615L7.01 19c1.32 1.319 2.909 2.189 4.475 2.449q.482.08.971.08c.85 0 1.653-.198 2.393-.579.231.033.46.054.686.054 1.266 0 2.457-.52 3.505-1.567 2.763-2.763 2.552-5.734 1.439-7.586z" clip-rule="evenodd"></path></svg></div></div></div></a></span></div><div class="pw-multi-vote-count l ls lt lu lv lw lx ly"><p class="bf b dv z du"><span class="lz">--</span></p></div></div></span><span class="l h g f rt ru"><div class="ab q lf lg"><div class="pw-multi-vote-icon fj jo lh li lj"><span><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="footerClapButton" rel="noopener follow" href="/m/signin?actionUrl=https%3A%2F%2Fmedium.com%2F_%2Fvote%2Fcoursera-engineering%2F89de0104bcbd&amp;operation=register&amp;redirect=https%3A%2F%2Fmedium.com%2Fcoursera-engineering%2Fdata-driven-content-categorization-89de0104bcbd&amp;user=Chris+Liu&amp;userId=70814e310ce3&amp;source=---footer_actions--89de0104bcbd---------------------clap_footer------------------"><div><div class="bm" aria-hidden="false"><div class="lk ao ll lm ln lo am lp lq lr lj"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" viewBox="0 0 24 24" aria-label="clap"><path fill-rule="evenodd" d="M11.37.828 12 3.282l.63-2.454zM13.916 3.953l1.523-2.112-1.184-.39zM8.589 
1.84l1.522 2.112-.337-2.501zM18.523 18.92c-.86.86-1.75 1.246-2.62 1.33a6 6 0 0 0 .407-.372c2.388-2.389 2.86-4.951 1.399-7.623l-.912-1.603-.79-1.672c-.26-.56-.194-.98.203-1.288a.7.7 0 0 1 .546-.132c.283.046.546.231.728.5l2.363 4.157c.976 1.624 1.141 4.237-1.324 6.702m-10.999-.438L3.37 14.328a.828.828 0 0 1 .585-1.408.83.83 0 0 1 .585.242l2.158 2.157a.365.365 0 0 0 .516-.516l-2.157-2.158-1.449-1.449a.826.826 0 0 1 1.167-1.17l3.438 3.44a.363.363 0 0 0 .516 0 .364.364 0 0 0 0-.516L5.293 9.513l-.97-.97a.826.826 0 0 1 0-1.166.84.84 0 0 1 1.167 0l.97.968 3.437 3.436a.36.36 0 0 0 .517 0 .366.366 0 0 0 0-.516L6.977 7.83a.82.82 0 0 1-.241-.584.82.82 0 0 1 .824-.826c.219 0 .43.087.584.242l5.787 5.787a.366.366 0 0 0 .587-.415l-1.117-2.363c-.26-.56-.194-.98.204-1.289a.7.7 0 0 1 .546-.132c.283.046.545.232.727.501l2.193 3.86c1.302 2.38.883 4.59-1.277 6.75-1.156 1.156-2.602 1.627-4.19 1.367-1.418-.236-2.866-1.033-4.079-2.246M10.75 5.971l2.12 2.12c-.41.502-.465 1.17-.128 1.89l.22.465-3.523-3.523a.8.8 0 0 1-.097-.368c0-.22.086-.428.241-.584a.847.847 0 0 1 1.167 0m7.355 1.705c-.31-.461-.746-.758-1.23-.837a1.44 1.44 0 0 0-1.11.275c-.312.24-.505.543-.59.881a1.74 1.74 0 0 0-.906-.465 1.47 1.47 0 0 0-.82.106l-2.182-2.182a1.56 1.56 0 0 0-2.2 0 1.54 1.54 0 0 0-.396.701 1.56 1.56 0 0 0-2.21-.01 1.55 1.55 0 0 0-.416.753c-.624-.624-1.649-.624-2.237-.037a1.557 1.557 0 0 0 0 2.2c-.239.1-.501.238-.715.453a1.56 1.56 0 0 0 0 2.2l.516.515a1.556 1.556 0 0 0-.753 2.615L7.01 19c1.32 1.319 2.909 2.189 4.475 2.449q.482.08.971.08c.85 0 1.653-.198 2.393-.579.231.033.46.054.686.054 1.266 0 2.457-.52 3.505-1.567 2.763-2.763 2.552-5.734 1.439-7.586z" clip-rule="evenodd"></path></svg></div></div></div></a></span></div><div class="pw-multi-vote-count l ls lt lu lv lw lx ly"><p class="bf b dv z du"><span class="lz">--</span></p></div></div></span></div><div class="bq ab"><div><div class="bm" aria-hidden="false"><button class="ao lk mc md ab q fk me mf" aria-label="responses"><svg 
xmlns="http://www.w3.org/2000/svg" width="24" height="24" viewBox="0 0 24 24" class="mb"><path d="M18.006 16.803c1.533-1.456 2.234-3.325 2.234-5.321C20.24 7.357 16.709 4 12.191 4S4 7.357 4 11.482c0 4.126 3.674 7.482 8.191 7.482.817 0 1.622-.111 2.393-.327.231.2.48.391.744.559 1.06.693 2.203 1.044 3.399 1.044.224-.008.4-.112.486-.287a.49.49 0 0 0-.042-.518c-.495-.67-.845-1.364-1.04-2.057a4 4 0 0 1-.125-.598zm-3.122 1.055-.067-.223-.315.096a8 8 0 0 1-2.311.338c-4.023 0-7.292-2.955-7.292-6.587 0-3.633 3.269-6.588 7.292-6.588 4.014 0 7.112 2.958 7.112 6.593 0 1.794-.608 3.469-2.027 4.72l-.195.168v.255c0 .056 0 .151.016.295.025.231.081.478.154.733.154.558.398 1.117.722 1.659a5.3 5.3 0 0 1-2.165-.845c-.276-.176-.714-.383-.941-.59z"></path></svg><p class="bf b bg z du"><span class="pw-responses-count ma mb">4</span></p></button></div></div></div></div><div class="ab q"><div class="rv l jj"><div><div class="bm" aria-hidden="false"><span><a class="af ag ah ai aj ak al am an ao ap aq ar as at" data-testid="footerBookmarkButton" rel="noopener follow" href="/m/signin?actionUrl=https%3A%2F%2Fmedium.com%2F_%2Fbookmark%2Fp%2F89de0104bcbd&amp;operation=register&amp;redirect=https%3A%2F%2Fmedium.com%2Fcoursera-engineering%2Fdata-driven-content-categorization-89de0104bcbd&amp;source=---footer_actions--89de0104bcbd---------------------bookmark_footer------------------"><svg xmlns="http://www.w3.org/2000/svg" width="25" height="25" fill="none" viewBox="0 0 25 25" class="du mh" aria-label="Add to list bookmark button"><path fill="currentColor" d="M18 2.5a.5.5 0 0 1 1 0V5h2.5a.5.5 0 0 1 0 1H19v2.5a.5.5 0 1 1-1 0V6h-2.5a.5.5 0 0 1 0-1H18zM7 7a1 1 0 0 1 1-1h3.5a.5.5 0 0 0 0-1H8a2 2 0 0 0-2 2v14a.5.5 0 0 0 .805.396L12.5 17l5.695 4.396A.5.5 0 0 0 19 21v-8.5a.5.5 0 0 0-1 0v7.485l-5.195-4.012a.5.5 0 0 0-.61 0L7 19.985z"></path></svg></a></span></div></div></div><div class="rv l jj"><div class="bm" aria-hidden="false" aria-describedby="postFooterSocialMenu" 
aria-labelledby="postFooterSocialMenu"><div><div class="bm" aria-hidden="false"><button aria-controls="postFooterSocialMenu" aria-expanded="false" aria-label="Share Post" data-testid="footerSocialShareButton" class="af fk ah ai aj ak al mp an ao ap ex mq mr mf ms"><svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="none" viewBox="0 0 24 24"><path fill="currentColor" fill-rule="evenodd" d="M15.218 4.931a.4.4 0 0 1-.118.132l.012.006a.45.45 0 0 1-.292.074.5.5 0 0 1-.3-.13l-2.02-2.02v7.07c0 .28-.23.5-.5.5s-.5-.22-.5-.5v-7.04l-2 2a.45.45 0 0 1-.57.04h-.02a.4.4 0 0 1-.16-.3.4.4 0 0 1 .1-.32l2.8-2.8a.5.5 0 0 1 .7 0l2.8 2.79a.42.42 0 0 1 .068.498m-.106.138.008.004v-.01zM16 7.063h1.5a2 2 0 0 1 2 2v10a2 2 0 0 1-2 2h-11c-1.1 0-2-.9-2-2v-10a2 2 0 0 1 2-2H8a.5.5 0 0 1 .35.15.5.5 0 0 1 .15.35.5.5 0 0 1-.15.35.5.5 0 0 1-.35.15H6.4c-.5 0-.9.4-.9.9v10.2a.9.9 0 0 0 .9.9h11.2c.5 0 .9-.4.9-.9v-10.2c0-.5-.4-.9-.9-.9H16a.5.5 0 0 1 0-1" clip-rule="evenodd"></path></svg></button></div></div></div></div></div></div></div></div></div></footer><div class="rw l"><div><div class="ab cb"><div class="ci bh fz ga gb gc"><div class="rx l"><div class="ab ry rz sa jl jk"><div class="sb sc sd se sf sg sh si sj sk ab cp"><div class="h k"><a href="https://medium.com/coursera-engineering?source=post_page---post_publication_info--89de0104bcbd---------------------------------------" rel="noopener follow"><div class="fj ab"><img alt="Coursera Engineering" class="sl in io cx" src="https://miro.medium.com/v2/resize:fill:96:96/1*j2vLJO9qZg435iRYfd2Mfg.png" width="48" height="48" loading="lazy"/><div class="sl l io in fs n fr sm"></div></div></a></div><div class="j i d"><a href="https://medium.com/coursera-engineering?source=post_page---post_publication_info--89de0104bcbd---------------------------------------" rel="noopener follow"><div class="fj ab"><img alt="Coursera Engineering" class="sl so sn cx" src="https://miro.medium.com/v2/resize:fill:128:128/1*j2vLJO9qZg435iRYfd2Mfg.png" width="64" 
height="64" loading="lazy"/><div class="sl l sn so fs n fr sm"></div></div></a></div><div class="j i d sp jj"><div class="ab"></div></div></div><div class="ab co sq"><div class="sr ss st su sv l"><a class="af ag ah aj ak al am an ao ap aq ar as at ab q" href="https://medium.com/coursera-engineering?source=post_page---post_publication_info--89de0104bcbd---------------------------------------" rel="noopener follow"><h2 class="pw-author-name bf sx sy sz ta tb tc td nq qp qq nu qs qt ny qv qw bk"><span class="gn sw">Published in <!-- -->Coursera Engineering</span></h2></a><div class="rb ab im"><div class="l jj"><span class="pw-follower-count bf b bg z du"><a class="af ag ah ai aj ak al am an ao ap aq ar jc" rel="noopener follow" href="/coursera-engineering/followers?source=post_page---post_publication_info--89de0104bcbd---------------------------------------">3.8K Followers</a></span></div><div class="bf b bg z du ab jn"><span class="jd l" aria-hidden="true"><span class="bf b bg z du">·</span></span><a class="af ag ah ai aj ak al am an ao ap aq ar jc" rel="noopener follow" href="/coursera-engineering/two-easy-ways-to-determine-right-size-for-aws-rds-instance-through-request-mirroring-load-test-9cd6e8ac8b5c?source=post_page---post_publication_info--89de0104bcbd---------------------------------------">Last published <span>Jan 3, 2023</span></a></div></div><div class="te l"><p class="bf b bg z bk"><span class="gn">We&#x27;re changing the way the world learns! Posts from Coursera engineers and data scientists.</span></p></div></div></div><div class="h k"><div class="ab"></div></div></div></div><div class="ab ry rz sa jl jk"><div class="sb sc sd se sf sg sh si sj sk ab cp"><div class="h k"><a tabindex="0" rel="noopener follow" href="/@cliu_88389?source=post_page---post_author_info--89de0104bcbd---------------------------------------"><div class="l fj"><img alt="Chris Liu" class="l fd by io in cx" src="https://miro.medium.com/v2/resize:fill:96:96/0*ECSDCjFKbFRqqOIr." 
width="48" height="48" loading="lazy"/><div class="fr by l io in fs n ay sm"></div></div></a></div><div class="j i d"><a tabindex="0" rel="noopener follow" href="/@cliu_88389?source=post_page---post_author_info--89de0104bcbd---------------------------------------"><div class="l fj"><img alt="Chris Liu" class="l fd by sn so cx" src="https://miro.medium.com/v2/resize:fill:128:128/0*ECSDCjFKbFRqqOIr." width="64" height="64" loading="lazy"/><div class="fr by l sn so fs n ay sm"></div></div></a></div><div class="j i d sp jj"><div class="ab"><span><button class="bf b bg z tf rd tg th ti tj tk ev ew tl tm tn fa fb fc fd bm fe ff">Follow</button></span></div></div></div><div class="ab co sq"><div class="sr ss st su sv l"><a class="af ag ah aj ak al am an ao ap aq ar as at ab q" rel="noopener follow" href="/@cliu_88389?source=post_page---post_author_info--89de0104bcbd---------------------------------------"><h2 class="pw-author-name bf sx sy sz ta tb tc td nq qp qq nu qs qt ny qv qw bk"><span class="gn sw">Written by <!-- -->Chris Liu</span></h2></a><div class="rb ab im"><div class="l jj"><span class="pw-follower-count bf b bg z du"><a class="af ag ah ai aj ak al am an ao ap aq ar jc" rel="noopener follow" href="/@cliu_88389/followers?source=post_page---post_author_info--89de0104bcbd---------------------------------------">103 Followers</a></span></div><div class="bf b bg z du ab jn"><span class="jd l" aria-hidden="true"><span class="bf b bg z du">·</span></span><a class="af ag ah ai aj ak al am an ao ap aq ar jc" rel="noopener follow" href="/@cliu_88389/following?source=post_page---post_author_info--89de0104bcbd---------------------------------------">4 Following</a></div></div><div class="te l"><p class="bf b bg z bk"><span class="gn">Passionate about education and solving hard problems in a collaborative fashion.</span></p></div></div></div><div class="h k"><div class="ab"><span><button class="bf b bg z tf rd tg th ti tj tk ev ew tl tm tn fa fb fc fd bm fe 
ff">Follow</button></span></div></div></div></div></div></div></div><div class="to tp tq tr ts l"><div class="tt bh r rw"></div><div class="ab cb"><div class="ci bh fz ga gb gc"><div class="ab q cp"><h2 class="bf sx oh hu oj ok hx om on op oq or ot ou ov ox oy bk">Responses (<!-- -->4<!-- -->)</h2><div class="ab tu"><div><div class="bm" aria-hidden="false"><a class="tv tw" href="https://policy.medium.com/medium-rules-30e5502c4eb4?source=post_page---post_responses--89de0104bcbd---------------------------------------" rel="noopener follow" target="_blank"><svg xmlns="http://www.w3.org/2000/svg" width="25" height="25" viewBox="0 0 25 25"><path fill-rule="evenodd" d="M11.987 5.036a.754.754 0 0 1 .914-.01c.972.721 1.767 1.218 2.6 1.543.828.322 1.719.485 2.887.505a.755.755 0 0 1 .741.757c-.018 3.623-.43 6.256-1.449 8.21-1.034 1.984-2.662 3.209-4.966 4.083a.75.75 0 0 1-.537-.003c-2.243-.874-3.858-2.095-4.897-4.074-1.024-1.951-1.457-4.583-1.476-8.216a.755.755 0 0 1 .741-.757c1.195-.02 2.1-.182 2.923-.503.827-.322 1.6-.815 2.519-1.535m.468.903c-.897.69-1.717 1.21-2.623 1.564-.898.35-1.856.527-3.026.565.037 3.45.469 5.817 1.36 7.515.884 1.684 2.25 2.762 4.284 3.571 2.092-.81 3.465-1.89 4.344-3.575.886-1.698 1.299-4.065 1.334-7.512-1.149-.039-2.091-.217-2.99-.567-.906-.353-1.745-.873-2.683-1.561m-.009 9.155a2.672 2.672 0 1 0 0-5.344 2.672 2.672 0 0 0 0 5.344m0 1a3.672 3.672 0 1 0 0-7.344 3.672 3.672 0 0 0 0 7.344m-1.813-3.777.525-.526.916.917 1.623-1.625.526.526-2.149 2.152z" clip-rule="evenodd"></path></svg></a></div></div></div></div><div class="tx ty tz ua ub uc ud l"></div><div class="ue l"><button class="bf b bg z bk rd uf ug uh mh me tk ev ew ex ui uj uk fa ul um un uo up fb fc fd bm fe ff">See all responses</button></div></div></div></div><div class="uq ur us ut uu l bx"><div class="h k j"><div class="tt bh uv uw"></div><div class="ab cb"><div class="ci bh fz ga gb gc"><div class="ux ab lf jm"><div class="uy uz l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" 
href="https://help.medium.com/hc/en-us?source=post_page-----89de0104bcbd---------------------------------------" rel="noopener follow"><p class="bf b dv z du">Help</p></a></div><div class="uy uz l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" href="https://medium.statuspage.io/?source=post_page-----89de0104bcbd---------------------------------------" rel="noopener follow"><p class="bf b dv z du">Status</p></a></div><div class="uy uz l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" rel="noopener follow" href="/about?autoplay=1&amp;source=post_page-----89de0104bcbd---------------------------------------"><p class="bf b dv z du">About</p></a></div><div class="uy uz l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" rel="noopener follow" href="/jobs-at-medium/work-at-medium-959d1a85284e?source=post_page-----89de0104bcbd---------------------------------------"><p class="bf b dv z du">Careers</p></a></div><div class="uy uz l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" href="mailto:pressinquiries@medium.com" rel="noopener follow"><p class="bf b dv z du">Press</p></a></div><div class="uy uz l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" href="https://blog.medium.com/?source=post_page-----89de0104bcbd---------------------------------------" rel="noopener follow"><p class="bf b dv z du">Blog</p></a></div><div class="uy uz l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" href="https://policy.medium.com/medium-privacy-policy-f03bf92035c9?source=post_page-----89de0104bcbd---------------------------------------" rel="noopener follow"><p class="bf b dv z du">Privacy</p></a></div><div class="uy uz l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" href="https://policy.medium.com/medium-terms-of-service-9db0094a1e0f?source=post_page-----89de0104bcbd---------------------------------------" rel="noopener follow"><p class="bf b dv z du">Terms</p></a></div><div class="uy uz l"><a class="af ag ah ai aj ak al am an 
ao ap aq ar as at" href="https://speechify.com/medium?source=post_page-----89de0104bcbd---------------------------------------" rel="noopener follow"><p class="bf b dv z du">Text to speech</p></a></div><div class="uy l"><a class="af ag ah ai aj ak al am an ao ap aq ar as at" rel="noopener follow" href="/business?source=post_page-----89de0104bcbd---------------------------------------"><p class="bf b dv z du">Teams</p></a></div></div></div></div></div></div></div></div></div></div><script>window.__BUILD_ID__="main-20250214-225023-b6ac233ec4"</script><script>window.__GRAPHQL_URI__ = "https://medium.com/_/graphql"</script><script>window.__PRELOADED_STATE__ = {"algolia":{"queries":{}},"cache":{"experimentGroupSet":true,"reason":"","group":"enabled","tags":["group-edgeCachePosts","post-89de0104bcbd","user-70814e310ce3","collection-532b19e4043c"],"serverVariantState":"44136fa355b3678a1146ad16f7e8649e94fb4fc21fe77e8310c060f61caaff8a","middlewareEnabled":true,"cacheStatus":"DYNAMIC","shouldUseCache":true,"vary":[],"pubFeaturingPostPageLabelEnabled":false},"client":{"hydrated":false,"isUs":false,"isNativeMedium":false,"isSafariMobile":false,"isSafari":false,"isFirefox":false,"routingEntity":{"type":"DEFAULT","explicit":false},"viewerIsBot":false},"debug":{"requestId":"e94350ce-3d47-4b44-b9dd-bd640e63fc70","requestTag":"","hybridDevServices":[],"originalSpanCarrier":{"traceparent":"00-0dfc3b2caf3abffd5ea3f30c639854d9-89e0c20928b7b634-01"}},"multiVote":{"clapsPerPost":{}},"navigation":{"branch":{"show":null,"hasRendered":null,"blockedByCTA":false},"hideGoogleOneTap":false,"hasRenderedAlternateUserBanner":null,"currentLocation":"https:\u002F\u002Fmedium.com\u002Fcoursera-engineering\u002Fdata-driven-content-categorization-89de0104bcbd","host":"medium.com","hostname":"medium.com","referrer":"","hasSetReferrer":false,"susiModal":{"step":null,"operation":"register"},"postRead":false,"partnerProgram":{"selectedCountryCode":null},"queryString":"","currentHash":""},"config":{"nodeEnv
":"production","version":"main-20250214-225023-b6ac233ec4","target":"production","productName":"Medium","publicUrl":"https:\u002F\u002Fcdn-client.medium.com\u002Flite","authDomain":"medium.com","authGoogleClientId":"216296035834-k1k6qe060s2tp2a2jam4ljdcms00sttg.apps.googleusercontent.com","favicon":"production","glyphUrl":"https:\u002F\u002Fglyph.medium.com","branchKey":"key_live_ofxXr2qTrrU9NqURK8ZwEhknBxiI6KBm","algolia":{"appId":"MQ57UUUQZ2","apiKeySearch":"394474ced050e3911ae2249ecc774921","indexPrefix":"medium_","host":"-dsn.algolia.net"},"recaptchaKey":"6Lfc37IUAAAAAKGGtC6rLS13R1Hrw_BqADfS1LRk","recaptcha3Key":"6Lf8R9wUAAAAABMI_85Wb8melS7Zj6ziuf99Yot5","recaptchaEnterpriseKeyId":"6Le-uGgpAAAAAPprRaokM8AKthQ9KNGdoxaGUvVp","datadog":{"applicationId":"6702d87d-a7e0-42fe-bbcb-95b469547ea0","clientToken":"pub853ea8d17ad6821d9f8f11861d23dfed","rumToken":"pubf9cc52896502b9413b68ba36fc0c7162","context":{"deployment":{"target":"production","tag":"main-20250214-225023-b6ac233ec4","commit":"b6ac233ec4e33c48e304b373b7df8c338a410ef2"}},"datacenter":"us"},"googleAnalyticsCode":"G-7JY7T788PK","googlePay":{"apiVersion":"2","apiVersionMinor":"0","merchantId":"BCR2DN6TV7EMTGBM","merchantName":"Medium","instanceMerchantId":"13685562959212738550"},"applePay":{"version":3},"signInWallCustomDomainCollectionIds":["3a8144eabfe3","336d898217ee","61061eb0c96b","138adf9c44c","819cc2aaeee0"],"mediumMastodonDomainName":"me.dm","mediumOwnedAndOperatedCollectionIds":["8a9336e5bb4","b7e45b22fec3","193b68bd4fba","8d6b8a439e32","54c98c43354d","3f6ecf56618","d944778ce714","92d2092dc598","ae2a65f35510","1285ba81cada","544c7006046e","fc8964313712","40187e704f1c","88d9857e584e","7b6769f2748b","bcc38c8f6edf","cef6983b292","cb8577c9149e","444d13b52878","713d7dbc99b0","ef8e90590e66","191186aaafa0","55760f21cdc5","9dc80918cc93","bdc4052bbdba","8ccfed20cbb2"],"tierOneDomains":["medium.com","thebolditalic.com","arcdigital.media","towardsdatascience.com","uxdesign.cc","codeburst.io","psiloveyou.xyz","wri
tingcooperative.com","entrepreneurshandbook.co","prototypr.io","betterhumans.coach.me","theascent.pub"],"topicsToFollow":["d61cf867d93f","8a146bc21b28","1eca0103fff3","4d562ee63426","aef1078a3ef5","e15e46793f8d","6158eb913466","55f1c20aba7a","3d18b94f6858","4861fee224fd","63c6f1f93ee","1d98b3a9a871","decb52b64abf","ae5d4995e225","830cded25262"],"topicToTagMappings":{"accessibility":"accessibility","addiction":"addiction","android-development":"android-development","art":"art","artificial-intelligence":"artificial-intelligence","astrology":"astrology","basic-income":"basic-income","beauty":"beauty","biotech":"biotech","blockchain":"blockchain","books":"books","business":"business","cannabis":"cannabis","cities":"cities","climate-change":"climate-change","comics":"comics","coronavirus":"coronavirus","creativity":"creativity","cryptocurrency":"cryptocurrency","culture":"culture","cybersecurity":"cybersecurity","data-science":"data-science","design":"design","digital-life":"digital-life","disability":"disability","economy":"economy","education":"education","equality":"equality","family":"family","feminism":"feminism","fiction":"fiction","film":"film","fitness":"fitness","food":"food","freelancing":"freelancing","future":"future","gadgets":"gadgets","gaming":"gaming","gun-control":"gun-control","health":"health","history":"history","humor":"humor","immigration":"immigration","ios-development":"ios-development","javascript":"javascript","justice":"justice","language":"language","leadership":"leadership","lgbtqia":"lgbtqia","lifestyle":"lifestyle","machine-learning":"machine-learning","makers":"makers","marketing":"marketing","math":"math","media":"media","mental-health":"mental-health","mindfulness":"mindfulness","money":"money","music":"music","neuroscience":"neuroscience","nonfiction":"nonfiction","outdoors":"outdoors","parenting":"parenting","pets":"pets","philosophy":"philosophy","photography":"photography","podcasts":"podcast","poetry":"poetry","politics":"politics",
"privacy":"privacy","product-management":"product-management","productivity":"productivity","programming":"programming","psychedelics":"psychedelics","psychology":"psychology","race":"race","relationships":"relationships","religion":"religion","remote-work":"remote-work","san-francisco":"san-francisco","science":"science","self":"self","self-driving-cars":"self-driving-cars","sexuality":"sexuality","social-media":"social-media","society":"society","software-engineering":"software-engineering","space":"space","spirituality":"spirituality","sports":"sports","startups":"startup","style":"style","technology":"technology","transportation":"transportation","travel":"travel","true-crime":"true-crime","tv":"tv","ux":"ux","venture-capital":"venture-capital","visual-design":"visual-design","work":"work","world":"world","writing":"writing"},"defaultImages":{"avatar":{"imageId":"1*dmbNkD5D-u45r44go_cf0g.png","height":150,"width":150},"orgLogo":{"imageId":"7*V1_7XP4snlmqrc_0Njontw.png","height":110,"width":500},"postLogo":{"imageId":"bd978bb536350a710e8efb012513429cabdc4c28700604261aeda246d0f980b7","height":810,"width":1440},"postPreviewImage":{"imageId":"1*hn4v1tCaJy7cWMyb0bpNpQ.png","height":386,"width":579}},"collectionStructuredData":{"8d6b8a439e32":{"name":"Elemental","data":{"@type":"NewsMediaOrganization","ethicsPolicy":"https:\u002F\u002Fhelp.medium.com\u002Fhc\u002Fen-us\u002Farticles\u002F360043290473","logo":{"@type":"ImageObject","url":"https:\u002F\u002Fcdn-images-1.medium.com\u002Fmax\u002F980\u002F1*9ygdqoKprhwuTVKUM0DLPA@2x.png","width":980,"height":159}}},"3f6ecf56618":{"name":"Forge","data":{"@type":"NewsMediaOrganization","ethicsPolicy":"https:\u002F\u002Fhelp.medium.com\u002Fhc\u002Fen-us\u002Farticles\u002F360043290473","logo":{"@type":"ImageObject","url":"https:\u002F\u002Fcdn-images-1.medium.com\u002Fmax\u002F596\u002F1*uULpIlImcO5TDuBZ6lm7Lg@2x.png","width":596,"height":183}}},"ae2a65f35510":{"name":"GEN","data":{"@type":"NewsMediaOrganization","ethicsPol
icy":"https:\u002F\u002Fhelp.medium.com\u002Fhc\u002Fen-us\u002Farticles\u002F360043290473","logo":{"@type":"ImageObject","url":"https:\u002F\u002Fmiro.medium.com\u002Fmax\u002F264\u002F1*RdVZMdvfV3YiZTw6mX7yWA.png","width":264,"height":140}}},"88d9857e584e":{"name":"LEVEL","data":{"@type":"NewsMediaOrganization","ethicsPolicy":"https:\u002F\u002Fhelp.medium.com\u002Fhc\u002Fen-us\u002Farticles\u002F360043290473","logo":{"@type":"ImageObject","url":"https:\u002F\u002Fmiro.medium.com\u002Fmax\u002F540\u002F1*JqYMhNX6KNNb2UlqGqO2WQ.png","width":540,"height":108}}},"7b6769f2748b":{"name":"Marker","data":{"@type":"NewsMediaOrganization","ethicsPolicy":"https:\u002F\u002Fhelp.medium.com\u002Fhc\u002Fen-us\u002Farticles\u002F360043290473","logo":{"@type":"ImageObject","url":"https:\u002F\u002Fcdn-images-1.medium.com\u002Fmax\u002F383\u002F1*haCUs0wF6TgOOvfoY-jEoQ@2x.png","width":383,"height":92}}},"444d13b52878":{"name":"OneZero","data":{"@type":"NewsMediaOrganization","ethicsPolicy":"https:\u002F\u002Fhelp.medium.com\u002Fhc\u002Fen-us\u002Farticles\u002F360043290473","logo":{"@type":"ImageObject","url":"https:\u002F\u002Fmiro.medium.com\u002Fmax\u002F540\u002F1*cw32fIqCbRWzwJaoQw6BUg.png","width":540,"height":123}}},"8ccfed20cbb2":{"name":"Zora","data":{"@type":"NewsMediaOrganization","ethicsPolicy":"https:\u002F\u002Fhelp.medium.com\u002Fhc\u002Fen-us\u002Farticles\u002F360043290473","logo":{"@type":"ImageObject","url":"https:\u002F\u002Fmiro.medium.com\u002Fmax\u002F540\u002F1*tZUQqRcCCZDXjjiZ4bDvgQ.png","width":540,"height":106}}}},"embeddedPostIds":{"coronavirus":"cd3010f9d81f"},"sharedCdcMessaging":{"COVID_APPLICABLE_TAG_SLUGS":[],"COVID_APPLICABLE_TOPIC_NAMES":[],"COVID_APPLICABLE_TOPIC_NAMES_FOR_TOPIC_PAGE":[],"COVID_MESSAGES":{"tierA":{"text":"For more information on the novel coronavirus and Covid-19, visit cdc.gov.","markups":[{"start":66,"end":73,"href":"https:\u002F\u002Fwww.cdc.gov\u002Fcoronavirus\u002F2019-nCoV"}]},"tierB":{"text":"Anyone can publish on 
Medium per our Policies, but we don’t fact-check every story. For more info about the coronavirus, see cdc.gov.","markups":[{"start":37,"end":45,"href":"https:\u002F\u002Fhelp.medium.com\u002Fhc\u002Fen-us\u002Fcategories\u002F201931128-Policies-Safety"},{"start":125,"end":132,"href":"https:\u002F\u002Fwww.cdc.gov\u002Fcoronavirus\u002F2019-nCoV"}]},"paywall":{"text":"This article has been made free for everyone, thanks to Medium Members. For more information on the novel coronavirus and Covid-19, visit cdc.gov.","markups":[{"start":56,"end":70,"href":"https:\u002F\u002Fmedium.com\u002Fmembership"},{"start":138,"end":145,"href":"https:\u002F\u002Fwww.cdc.gov\u002Fcoronavirus\u002F2019-nCoV"}]},"unbound":{"text":"This article is free for everyone, thanks to Medium Members. For more information on the novel coronavirus and Covid-19, visit cdc.gov.","markups":[{"start":45,"end":59,"href":"https:\u002F\u002Fmedium.com\u002Fmembership"},{"start":127,"end":134,"href":"https:\u002F\u002Fwww.cdc.gov\u002Fcoronavirus\u002F2019-nCoV"}]}},"COVID_BANNER_POST_ID_OVERRIDE_WHITELIST":["3b31a67bff4a"]},"sharedVoteMessaging":{"TAGS":["politics","election-2020","government","us-politics","election","2020-presidential-race","trump","donald-trump","democrats","republicans","congress","republican-party","democratic-party","biden","joe-biden","maga"],"TOPICS":["politics","election"],"MESSAGE":{"text":"Find out more about the U.S. 
election results here.","markups":[{"start":46,"end":50,"href":"https:\u002F\u002Fcookpolitical.com\u002F2020-national-popular-vote-tracker"}]},"EXCLUDE_POSTS":["397ef29e3ca5"]},"embedPostRules":[],"recircOptions":{"v1":{"limit":3},"v2":{"limit":8}},"braintreeClientKey":"production_zjkj96jm_m56f8fqpf7ngnrd4","braintree":{"enabled":true,"merchantId":"m56f8fqpf7ngnrd4","merchantAccountId":{"usd":"AMediumCorporation_instant","eur":"amediumcorporation_EUR","cad":"amediumcorporation_CAD"},"publicKey":"ds2nn34bg2z7j5gd","braintreeEnvironment":"production","dashboardUrl":"https:\u002F\u002Fwww.braintreegateway.com\u002Fmerchants","gracePeriodDurationInDays":14,"mediumMembershipPlanId":{"monthly":"ce105f8c57a3","monthlyV2":"e8a5e126-792b-4ee6-8fba-d574c1b02fc5","monthlyWithTrial":"d5ee3dbe3db8","monthlyPremium":"fa741a9b47a2","yearly":"a40ad4a43185","yearlyV2":"3815d7d6-b8ca-4224-9b8c-182f9047866e","yearlyStaff":"d74fb811198a","yearlyWithTrial":"b3bc7350e5c7","yearlyPremium":"e21bd2c12166","monthlyOneYearFree":"e6c0637a-2bad-4171-ab4f-3c268633d83c","monthly25PercentOffFirstYear":"235ecc62-0cdb-49ae-9378-726cd21c504b","monthly20PercentOffFirstYear":"ba518864-9c13-4a99-91ca-411bf0cac756","monthly15PercentOffFirstYear":"594c029b-9f89-43d5-88f8-8173af4e070e","monthly10PercentOffFirstYear":"c6c7bc9a-40f2-4b51-8126-e28511d5bdb0","monthlyForStudents":"629ebe51-da7d-41fd-8293-34cd2f2030a8","yearlyOneYearFree":"78ba7be9-0d9f-4ece-aa3e-b54b826f2bf1","yearly25PercentOffFirstYear":"2dbb010d-bb8f-4eeb-ad5c-a08509f42d34","yearly20PercentOffFirstYear":"47565488-435b-47f8-bf93-40d5fbe0ebc8","yearly15PercentOffFirstYear":"8259809b-0881-47d9-acf7-6c001c7f720f","yearly10PercentOffFirstYear":"9dd694fb-96e1-472c-8d9e-3c868d5c1506","yearlyForStudents":"e29345ef-ab1c-4234-95c5-70e50fe6bc23","monthlyCad":"p52orjkaceei","yearlyCad":"h4q9g2up9ktt"},"braintreeDiscountId":{"oneMonthFree":"MONTHS_FREE_01","threeMonthsFree":"MONTHS_FREE_03","sixMonthsFree":"MONTHS_FREE_06","fiftyPercentOffOneYear":"FIFT
Y_PERCENT_OFF_ONE_YEAR"},"3DSecureVersion":"2","defaultCurrency":"usd","providerPlanIdCurrency":{"4ycw":"usd","rz3b":"usd","3kqm":"usd","jzw6":"usd","c2q2":"usd","nnsw":"usd","q8qw":"usd","d9y6":"usd","fx7w":"cad","nwf2":"cad"}},"paypalClientId":"AXj1G4fotC2GE8KzWX9mSxCH1wmPE3nJglf4Z2ig_amnhvlMVX87otaq58niAg9iuLktVNF_1WCMnN7v","paypal":{"host":"https:\u002F\u002Fapi.paypal.com:443","clientMode":"production","serverMode":"live","webhookId":"4G466076A0294510S","monthlyPlan":{"planId":"P-9WR0658853113943TMU5FDQA","name":"Medium Membership (Monthly) with setup fee","description":"Unlimited access to the best and brightest stories on Medium. Membership billed monthly."},"yearlyPlan":{"planId":"P-7N8963881P8875835MU5JOPQ","name":"Medium Membership (Annual) with setup fee","description":"Unlimited access to the best and brightest stories on Medium. Membership billed annually."},"oneYearGift":{"name":"Medium Membership (1 Year, Digital Gift Code)","description":"Unlimited access to the best and brightest stories on Medium. Gift codes can be redeemed at medium.com\u002Fredeem.","price":"50.00","currency":"USD","sku":"membership-gift-1-yr"},"oldMonthlyPlan":{"planId":"P-96U02458LM656772MJZUVH2Y","name":"Medium Membership (Monthly)","description":"Unlimited access to the best and brightest stories on Medium. Membership billed monthly."},"oldYearlyPlan":{"planId":"P-59P80963JF186412JJZU3SMI","name":"Medium Membership (Annual)","description":"Unlimited access to the best and brightest stories on Medium. Membership billed annually."},"monthlyPlanWithTrial":{"planId":"P-66C21969LR178604GJPVKUKY","name":"Medium Membership (Monthly) with setup fee","description":"Unlimited access to the best and brightest stories on Medium. Membership billed monthly."},"yearlyPlanWithTrial":{"planId":"P-6XW32684EX226940VKCT2MFA","name":"Medium Membership (Annual) with setup fee","description":"Unlimited access to the best and brightest stories on Medium. 
Membership billed annually."},"oldMonthlyPlanNoSetupFee":{"planId":"P-4N046520HR188054PCJC7LJI","name":"Medium Membership (Monthly)","description":"Unlimited access to the best and brightest stories on Medium. Membership billed monthly."},"oldYearlyPlanNoSetupFee":{"planId":"P-7A4913502Y5181304CJEJMXQ","name":"Medium Membership (Annual)","description":"Unlimited access to the best and brightest stories on Medium. Membership billed annually."},"sdkUrl":"https:\u002F\u002Fwww.paypal.com\u002Fsdk\u002Fjs"},"stripePublishableKey":"pk_live_7FReX44VnNIInZwrIIx6ghjl","log":{"json":true,"level":"info"},"imageUploadMaxSizeMb":25,"staffPicks":{"title":"Staff Picks","catalogId":"c7bc6e1ee00f"}},"session":{"xsrf":""}}</script><script>window.__APOLLO_STATE__ = {"ROOT_QUERY":{"__typename":"Query","viewer":null,"collectionByDomainOrSlug({\"domainOrSlug\":\"coursera-engineering\"})":{"__ref":"Collection:532b19e4043c"},"postResult({\"id\":\"89de0104bcbd\"})":{"__ref":"Post:89de0104bcbd"}},"ImageMetadata:":{"__typename":"ImageMetadata","id":""},"Collection:532b19e4043c":{"__typename":"Collection","id":"532b19e4043c","favicon":{"__ref":"ImageMetadata:"},"customStyleSheet":null,"colorPalette":{"__typename":"ColorPalette","highlightSpectrum":{"__typename":"ColorSpectrum","backgroundColor":"#FFFFFFFF","colorPoints":[{"__typename":"ColorPoint","color":"#FFECF3FF","point":0},{"__typename":"ColorPoint","color":"#FFE8F2FF","point":0.1},{"__typename":"ColorPoint","color":"#FFE5F0FF","point":0.2},{"__typename":"ColorPoint","color":"#FFE1EFFF","point":0.3},{"__typename":"ColorPoint","color":"#FFDDEDFF","point":0.4},{"__typename":"ColorPoint","color":"#FFD9EBFF","point":0.5},{"__typename":"ColorPoint","color":"#FFD6EAFF","point":0.6},{"__typename":"ColorPoint","color":"#FFD2E8FF","point":0.7},{"__typename":"ColorPoint","color":"#FFCEE6FF","point":0.8},{"__typename":"ColorPoint","color":"#FFCAE5FF","point":0.9},{"__typename":"ColorPoint","color":"#FFC6E3FF","point":1}]},"defaultBackgroundSpectrum
":{"__typename":"ColorSpectrum","backgroundColor":"#FFFFFFFF","colorPoints":[{"__typename":"ColorPoint","color":"#FF6388BF","point":0},{"__typename":"ColorPoint","color":"#FF5D7EB0","point":0.1},{"__typename":"ColorPoint","color":"#FF5775A1","point":0.2},{"__typename":"ColorPoint","color":"#FF516B91","point":0.3},{"__typename":"ColorPoint","color":"#FF4A6182","point":0.4},{"__typename":"ColorPoint","color":"#FF435673","point":0.5},{"__typename":"ColorPoint","color":"#FF3C4B63","point":0.6},{"__typename":"ColorPoint","color":"#FF334054","point":0.7},{"__typename":"ColorPoint","color":"#FF2A3444","point":0.8},{"__typename":"ColorPoint","color":"#FF202833","point":0.9},{"__typename":"ColorPoint","color":"#FF151B23","point":1}]},"tintBackgroundSpectrum":{"__typename":"ColorSpectrum","backgroundColor":"#FF82A8E1","colorPoints":[{"__typename":"ColorPoint","color":"#FF82A8E1","point":0},{"__typename":"ColorPoint","color":"#FF8FB1E6","point":0.1},{"__typename":"ColorPoint","color":"#FF9CBBEA","point":0.2},{"__typename":"ColorPoint","color":"#FFA8C4EF","point":0.3},{"__typename":"ColorPoint","color":"#FFB4CDF3","point":0.4},{"__typename":"ColorPoint","color":"#FFC0D6F7","point":0.5},{"__typename":"ColorPoint","color":"#FFCCDEFB","point":0.6},{"__typename":"ColorPoint","color":"#FFD8E7FF","point":0.7},{"__typename":"ColorPoint","color":"#FFE3EFFF","point":0.8},{"__typename":"ColorPoint","color":"#FFEFF7FF","point":0.9},{"__typename":"ColorPoint","color":"#FFFAFFFF","point":1}]}},"domain":null,"slug":"coursera-engineering","googleAnalyticsId":null,"name":"Coursera Engineering","avatar":{"__ref":"ImageMetadata:1*j2vLJO9qZg435iRYfd2Mfg.png"},"description":"We're changing the way the world learns! 
Posts from Coursera engineers and data scientists.","subscriberCount":3814,"latestPostsConnection({\"paging\":{\"limit\":1}})":{"__typename":"PostConnection","posts":[{"__ref":"Post:9cd6e8ac8b5c"}]},"isAuroraVisible":false,"tintColor":"#FF82A8E1","newsletterV3":null,"viewerEdge":{"__ref":"CollectionViewerEdge:collectionId:532b19e4043c-viewerId:lo_f0984db7dad6"},"twitterUsername":"CourseraEng","facebookPageId":null,"logo":{"__ref":"ImageMetadata:1*zXjOKA4JKHH04Ipi2NI0jA.png"}},"ImageMetadata:1*j2vLJO9qZg435iRYfd2Mfg.png":{"__typename":"ImageMetadata","id":"1*j2vLJO9qZg435iRYfd2Mfg.png"},"User:dbd909ab7ead":{"__typename":"User","id":"dbd909ab7ead","customDomainState":{"__typename":"CustomDomainState","live":{"__typename":"CustomDomain","domain":"mengying-li.medium.com"}},"hasSubdomain":true,"username":"mengying-li"},"Post:9cd6e8ac8b5c":{"__typename":"Post","id":"9cd6e8ac8b5c","firstPublishedAt":1672713676343,"creator":{"__ref":"User:dbd909ab7ead"},"collection":{"__ref":"Collection:532b19e4043c"},"isSeries":false,"mediumUrl":"https:\u002F\u002Fmedium.com\u002Fcoursera-engineering\u002Ftwo-easy-ways-to-determine-right-size-for-aws-rds-instance-through-request-mirroring-load-test-9cd6e8ac8b5c","sequence":null,"uniqueSlug":"two-easy-ways-to-determine-right-size-for-aws-rds-instance-through-request-mirroring-load-test-9cd6e8ac8b5c"},"LinkedAccounts:70814e310ce3":{"__typename":"LinkedAccounts","mastodon":null,"id":"70814e310ce3"},"User:70814e310ce3":{"__typename":"User","id":"70814e310ce3","linkedAccounts":{"__ref":"LinkedAccounts:70814e310ce3"},"isSuspended":false,"name":"Chris Liu","imageId":"0*ECSDCjFKbFRqqOIr.","customDomainState":null,"hasSubdomain":false,"username":"cliu_88389","verifications":{"__typename":"VerifiedInfo","isBookAuthor":false},"socialStats":{"__typename":"SocialStats","followerCount":103,"followingCount":3,"collectionFollowingCount":1},"bio":"Passionate about education and solving hard problems in a collaborative 
fashion.","membership":null,"allowNotes":true,"viewerEdge":{"__ref":"UserViewerEdge:userId:70814e310ce3-viewerId:lo_f0984db7dad6"},"twitterScreenName":""},"Topic:ae5d4995e225":{"__typename":"Topic","slug":"data-science","id":"ae5d4995e225","name":"Data Science"},"Paragraph:235d9560959f_0":{"__typename":"Paragraph","id":"235d9560959f_0","name":"fd1b","type":"H3","href":null,"layout":null,"metadata":null,"text":"Categorizing learning content","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_1":{"__typename":"Paragraph","id":"235d9560959f_1","name":"dddb","type":"H4","href":null,"layout":null,"metadata":null,"text":"From hand-coded to an algorithmic approach","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_2":{"__typename":"Paragraph","id":"235d9560959f_2","name":"1140","type":"P","href":null,"layout":null,"metadata":null,"text":"Courses on Coursera cover topics ranging from photography to probabilistic graphical models to constitutional struggles in the Muslim world. This diversity makes them hard to categorize. A couple of years ago we overhauled our course categories and implemented a new categorization system we call domains and subdomains. 
This post covers how we defined and implemented that new system.","hasDropCap":null,"dropCapImage":null,"markups":[{"__typename":"Markup","type":"A","start":45,"end":57,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fphotography","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":60,"end":91,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fprobabilistic-graphical-models","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":94,"end":139,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fmuslim-world","anchorType":"LINK","userId":null,"linkMetadata":null}],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_3":{"__typename":"Paragraph","id":"235d9560959f_3","name":"1df7","type":"H3","href":null,"layout":null,"metadata":null,"text":"The Previous Course Categories","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_4":{"__typename":"Paragraph","id":"235d9560959f_4","name":"be48","type":"P","href":null,"layout":null,"metadata":null,"text":"Coursera’s original categorization scheme dated back to our founding in 2012, and was heavily influenced by the content available at the time. For example, we had five categories of computer science subfields, but only one category for all of the humanities. 
The categories were also manually and arbitrarily defined, resulting in redundancies (e.g., “Food and Nutrition” being nearly a subset of “Health and Society”) and vagueness (e.g., “Information, Tech & Design”).","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_5":{"__typename":"Paragraph","id":"235d9560959f_5","name":"095b","type":"P","href":null,"layout":null,"metadata":null,"text":"Critically, the original categorization scheme was not meeting our need of effectively matching learner to content. For example, the “Medicine” category attracted two distinct groups of learners — because it contained two distinct groups of courses. The first were courses that appealed to healthcare practitioners (e.g., on clinical kidney transplantation or biocontainment for infectious diseases). The second were courses on public health issues that appealed to non-practitioners.","hasDropCap":null,"dropCapImage":null,"markups":[{"__typename":"Markup","type":"A","start":325,"end":356,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fclinical-kidney-transplantation","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":360,"end":398,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fbiocontainment","anchorType":"LINK","userId":null,"linkMetadata":null}],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_6":{"__typename":"Paragraph","id":"235d9560959f_6","name":"89d4","type":"P","href":null,"layout":null,"metadata":null,"text":"As our catalog expands to thousands of courses, we need a principled organization technique. We want categories that help the learner find the best content for them. 
This translates to the following criteria:","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_7":{"__typename":"Paragraph","id":"235d9560959f_7","name":"c30c","type":"OLI","href":null,"layout":null,"metadata":null,"text":"Simple (as few categories as possible)","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_8":{"__typename":"Paragraph","id":"235d9560959f_8","name":"237c","type":"OLI","href":null,"layout":null,"metadata":null,"text":"Minimally redundant (as mutually exclusive as possible)","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_9":{"__typename":"Paragraph","id":"235d9560959f_9","name":"abce","type":"H3","href":null,"layout":null,"metadata":null,"text":"t-SNE to the rescue","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_10":{"__typename":"Paragraph","id":"235d9560959f_10","name":"fe80","type":"P","href":null,"layout":null,"metadata":null,"text":"Rather than re-coding by hand, or replicating traditional university departments, we took a data-driven approach.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_11":{"__typename":"Paragraph","id":"235d9560959f_11","name":"21d1","type":"P","href":null,"layout":null,"metadata":null,"text":"We sought to group our courses so that someone interested in one course in that group, say, playing the guitar, might also be interested in other courses in that group, say, songwriting or jazz improvisation. 
The algorithm known as t-distributed stochastic neighbor embedding (t-SNE) satisfies this requirement.","hasDropCap":null,"dropCapImage":null,"markups":[{"__typename":"Markup","type":"A","start":92,"end":110,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fguitar","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":174,"end":185,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fsongwriting-lyrics","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":189,"end":207,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fjazz-improvisation","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":277,"end":282,"href":"https:\u002F\u002Flvdmaaten.github.io\u002Ftsne\u002F","anchorType":"LINK","userId":null,"linkMetadata":null}],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_12":{"__typename":"Paragraph","id":"235d9560959f_12","name":"058d","type":"P","href":null,"layout":null,"metadata":null,"text":"t-SNE identifies an arrangement of courses such that courses sharing common learners are close and courses that do not share common learners are far apart. 
For example, Complex Analysis and Galois Theory are close together since many learners take both, while Taking Care of Horses and General Relativity are farther apart as the two courses do not share many learners.","hasDropCap":null,"dropCapImage":null,"markups":[{"__typename":"Markup","type":"A","start":169,"end":185,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fcomplex-analysis","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":190,"end":203,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fgalois","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":260,"end":281,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fhorse-care","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":286,"end":304,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fgeneral-relativity","anchorType":"LINK","userId":null,"linkMetadata":null}],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_13":{"__typename":"Paragraph","id":"235d9560959f_13","name":"e67e","type":"P","href":null,"layout":null,"metadata":null,"text":"We utilized the t-SNE algorithm on courses in 2015 to produce the scatterplot output as shown below. Each dot represents a single course. 
We then group these courses into categories by clustering (represented by the coloring).","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"ImageMetadata:0*MKkkbhhYA7Tcus_L":{"__typename":"ImageMetadata","id":"0*MKkkbhhYA7Tcus_L","originalHeight":795,"originalWidth":811,"focusPercentX":null,"focusPercentY":null,"alt":null},"Paragraph:235d9560959f_14":{"__typename":"Paragraph","id":"235d9560959f_14","name":"bd3b","type":"IMG","href":null,"layout":"INSET_CENTER","metadata":{"__ref":"ImageMetadata:0*MKkkbhhYA7Tcus_L"},"text":"Figure 1: t-SNE visualization of courses colored by cluster, circa 2015.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_15":{"__typename":"Paragraph","id":"235d9560959f_15","name":"8d62","type":"H3","href":null,"layout":null,"metadata":null,"text":"The general structure of our content","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"ImageMetadata:1*c_utWA_Qi-HFw4tVDU3JyA.png":{"__typename":"ImageMetadata","id":"1*c_utWA_Qi-HFw4tVDU3JyA.png","originalHeight":766,"originalWidth":1292,"focusPercentX":null,"focusPercentY":null,"alt":null},"Paragraph:235d9560959f_16":{"__typename":"Paragraph","id":"235d9560959f_16","name":"87a0","type":"IMG","href":null,"layout":"INSET_CENTER","metadata":{"__ref":"ImageMetadata:1*c_utWA_Qi-HFw4tVDU3JyA.png"},"text":"Figure 2. 
General subject area of courses.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_17":{"__typename":"Paragraph","id":"235d9560959f_17","name":"98ec","type":"P","href":null,"layout":null,"metadata":null,"text":"Looking at Figures 1 and 2, the first thing we see is that courses are organized in a globally consistent way: humanities, social sciences, and business courses are in the top right half of the plot, while natural sciences, engineering, and computational sciences courses fall in the bottom left half.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_18":{"__typename":"Paragraph","id":"235d9560959f_18","name":"724c","type":"P","href":null,"layout":null,"metadata":null,"text":"Digging in more granularly reveals additional nuance:","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_19":{"__typename":"Paragraph","id":"235d9560959f_19","name":"cf60","type":"ULI","href":null,"layout":null,"metadata":null,"text":"Courses on business and finance are clustered together on the right","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_20":{"__typename":"Paragraph","id":"235d9560959f_20","name":"11c1","type":"ULI","href":null,"layout":null,"metadata":null,"text":"Courses about the natural sciences (physics, chemistry, and biology) are on the left","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_21":{"__typename":"Paragraph","id":"235d9560959f_21","name":"5b6b","type":"ULI","href":null,"layout":null,"metadata":null,"text":"Courses on the computational sciences (math, cs, and statistics) are at the 
bottom","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_22":{"__typename":"Paragraph","id":"235d9560959f_22","name":"02ce","type":"ULI","href":null,"layout":null,"metadata":null,"text":"Courses on the social sciences and humanities are at the top","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"ImageMetadata:1*-yZ59kN7MjqgnKq2tXTlQA.png":{"__typename":"ImageMetadata","id":"1*-yZ59kN7MjqgnKq2tXTlQA.png","originalHeight":784,"originalWidth":1332,"focusPercentX":null,"focusPercentY":null,"alt":null},"Paragraph:235d9560959f_23":{"__typename":"Paragraph","id":"235d9560959f_23","name":"36cc","type":"IMG","href":null,"layout":"INSET_CENTER","metadata":{"__ref":"ImageMetadata:1*-yZ59kN7MjqgnKq2tXTlQA.png"},"text":"Figure 3. General division of science and humanities courses.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"ImageMetadata:1*A-lEgYtSuSKQZ21ves4JOw.png":{"__typename":"ImageMetadata","id":"1*A-lEgYtSuSKQZ21ves4JOw.png","originalHeight":868,"originalWidth":1092,"focusPercentX":null,"focusPercentY":null,"alt":null},"Paragraph:235d9560959f_24":{"__typename":"Paragraph","id":"235d9560959f_24","name":"aed3","type":"IMG","href":null,"layout":"INSET_CENTER","metadata":{"__ref":"ImageMetadata:1*A-lEgYtSuSKQZ21ves4JOw.png"},"text":"Figure 4. Substructure of courses within each half of the plot.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_25":{"__typename":"Paragraph","id":"235d9560959f_25","name":"5fd8","type":"P","href":null,"layout":null,"metadata":null,"text":"Dissecting each of these large regions further, we see that even within each grouping, courses are arranged logically. 
For example, courses in natural history span a continuum roughly from the biological sciences to the physical sciences. Similarly, courses in humanities and social science range roughly from music to the visual arts, humanities, and social sciences, and then practical business.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_26":{"__typename":"Paragraph","id":"235d9560959f_26","name":"9577","type":"P","href":null,"layout":null,"metadata":null,"text":"Even at the level of individual courses, t-SNE captures the interdisciplinary nature of courses. Courses in business law, for example, fall on the boundary between business and law, and courses on quantitative methods for the social sciences fall between math and the social sciences.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"ImageMetadata:1*_uuoe43USer2SKMxm98igA.png":{"__typename":"ImageMetadata","id":"1*_uuoe43USer2SKMxm98igA.png","originalHeight":732,"originalWidth":1292,"focusPercentX":null,"focusPercentY":null,"alt":null},"Paragraph:235d9560959f_27":{"__typename":"Paragraph","id":"235d9560959f_27","name":"def3","type":"IMG","href":null,"layout":"INSET_CENTER","metadata":{"__ref":"ImageMetadata:1*_uuoe43USer2SKMxm98igA.png"},"text":"Figure 5. Interdisciplinary courses sit roughly between the right clusters.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_28":{"__typename":"Paragraph","id":"235d9560959f_28","name":"9737","type":"P","href":null,"layout":null,"metadata":null,"text":"Returning to the set of courses previously categorized as “medicine,” we now have three sub-categories. First is a relatively disjointed cluster of courses targeted to the medical professional (e.g., “Ebola: Essential Knowledge for the Healthcare Professional”). 
Second is a cluster of courses on healthcare policy (e.g., “Systems Thinking in Public Health”), and lastly, we have a cluster on basic biology (e.g., “Introduction to Genetics and Evolution”).","hasDropCap":null,"dropCapImage":null,"markups":[{"__typename":"Markup","type":"A","start":201,"end":259,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Febola-essentials-for-health-professionals","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":323,"end":356,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fsystems-thinking","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"A","start":416,"end":453,"href":"https:\u002F\u002Fwww.coursera.org\u002Flearn\u002Fgenetics-evolution","anchorType":"LINK","userId":null,"linkMetadata":null}],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_29":{"__typename":"Paragraph","id":"235d9560959f_29","name":"25bc","type":"P","href":null,"layout":null,"metadata":null,"text":"The result is noteworthy because there is no strong reason why t-SNE should arrange our courses by subject matter. We weren’t feeding in course descriptions or transcripts, just the enrollment behavior of learners. We attribute the clusterability of courses to the fact that learners are much more likely to be interested in multiple courses in a particular subject area rather than to be influenced in their course decision by non-subject-matter factors such as the style of instruction or the institution offering the course.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_30":{"__typename":"Paragraph","id":"235d9560959f_30","name":"664e","type":"P","href":null,"layout":null,"metadata":null,"text":"That said, this assumption does not hold across the full catalog. 
For example, among non-English content, the language of instruction is more a driver of enrollment than the subject area. Correspondingly, a French or Russian course is more likely to be grouped with other courses taught in the respective language than it is to be grouped with other courses on the same subject.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_31":{"__typename":"Paragraph","id":"235d9560959f_31","name":"478e","type":"P","href":null,"layout":null,"metadata":null,"text":"After some clean up, we landed at 36 course clusters, which rolled up into nine larger clusters. On the Coursera platform today, we term the original clusters “subdomains” and the larger clusters “domains.” We launched the new system of domains and subdomains in summer 2015. In the past three years, it has become an integral part of Coursera’s content discovery experience, allowing us to scale content categorization and drive personalization for each and every learner on our platform.","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_32":{"__typename":"Paragraph","id":"235d9560959f_32","name":"c134","type":"H4","href":null,"layout":null,"metadata":null,"text":"Acknowledgements","hasDropCap":null,"dropCapImage":null,"markups":[],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_33":{"__typename":"Paragraph","id":"235d9560959f_33","name":"4ee7","type":"P","href":null,"layout":null,"metadata":null,"text":"Credit for the t-SNE approach goes to Zhenghao Chen, a previous Coursera data 
scientist.","hasDropCap":null,"dropCapImage":null,"markups":[{"__typename":"Markup","type":"A","start":38,"end":51,"href":"https:\u002F\u002Fwww.linkedin.com\u002Fin\u002Fzhenghao-chen-44865036\u002F","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"EM","start":0,"end":88,"href":null,"anchorType":null,"userId":null,"linkMetadata":null}],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"Paragraph:235d9560959f_34":{"__typename":"Paragraph","id":"235d9560959f_34","name":"e9e1","type":"P","href":null,"layout":null,"metadata":null,"text":"I also want to thank Emily Glassberg Sands for reading through and giving feedback on drafts.","hasDropCap":null,"dropCapImage":null,"markups":[{"__typename":"Markup","type":"A","start":20,"end":42,"href":"https:\u002F\u002Fwww.linkedin.com\u002Fin\u002Fegsands\u002F","anchorType":"LINK","userId":null,"linkMetadata":null},{"__typename":"Markup","type":"EM","start":0,"end":93,"href":null,"anchorType":null,"userId":null,"linkMetadata":null}],"codeBlockMetadata":null,"iframe":null,"mixtapeMetadata":null},"CollectionViewerEdge:collectionId:532b19e4043c-viewerId:lo_f0984db7dad6":{"__typename":"CollectionViewerEdge","id":"collectionId:532b19e4043c-viewerId:lo_f0984db7dad6","isEditor":false,"isMuting":false},"UserViewerEdge:userId:70814e310ce3-viewerId:lo_f0984db7dad6":{"__typename":"UserViewerEdge","id":"userId:70814e310ce3-viewerId:lo_f0984db7dad6","isMuting":false},"ImageMetadata:1*zXjOKA4JKHH04Ipi2NI0jA.png":{"__typename":"ImageMetadata","id":"1*zXjOKA4JKHH04Ipi2NI0jA.png","originalWidth":1156,"originalHeight":164},"PostViewerEdge:postId:89de0104bcbd-viewerId:lo_f0984db7dad6":{"__typename":"PostViewerEdge","shouldIndexPostForExternalSearch":true,"id":"postId:89de0104bcbd-viewerId:lo_f0984db7dad6"},"Tag:data-science":{"__typename":"Tag","id":"data-science","displayTitle":"Data 
Science","normalizedTagSlug":"data-science"},"Tag:education":{"__typename":"Tag","id":"education","displayTitle":"Education","normalizedTagSlug":"education"},"Tag:technology":{"__typename":"Tag","id":"technology","displayTitle":"Technology","normalizedTagSlug":"technology"},"Post:89de0104bcbd":{"__typename":"Post","id":"89de0104bcbd","collection":{"__ref":"Collection:532b19e4043c"},"content({\"postMeteringOptions\":{\"referrer\":\"\"}})":{"__typename":"PostContent","isLockedPreviewOnly":false,"bodyModel":{"__typename":"RichText","sections":[{"__typename":"Section","name":"1821","startIndex":0,"textLayout":null,"imageLayout":null,"backgroundImage":null,"videoLayout":null,"backgroundVideo":null}],"paragraphs":[{"__ref":"Paragraph:235d9560959f_0"},{"__ref":"Paragraph:235d9560959f_1"},{"__ref":"Paragraph:235d9560959f_2"},{"__ref":"Paragraph:235d9560959f_3"},{"__ref":"Paragraph:235d9560959f_4"},{"__ref":"Paragraph:235d9560959f_5"},{"__ref":"Paragraph:235d9560959f_6"},{"__ref":"Paragraph:235d9560959f_7"},{"__ref":"Paragraph:235d9560959f_8"},{"__ref":"Paragraph:235d9560959f_9"},{"__ref":"Paragraph:235d9560959f_10"},{"__ref":"Paragraph:235d9560959f_11"},{"__ref":"Paragraph:235d9560959f_12"},{"__ref":"Paragraph:235d9560959f_13"},{"__ref":"Paragraph:235d9560959f_14"},{"__ref":"Paragraph:235d9560959f_15"},{"__ref":"Paragraph:235d9560959f_16"},{"__ref":"Paragraph:235d9560959f_17"},{"__ref":"Paragraph:235d9560959f_18"},{"__ref":"Paragraph:235d9560959f_19"},{"__ref":"Paragraph:235d9560959f_20"},{"__ref":"Paragraph:235d9560959f_21"},{"__ref":"Paragraph:235d9560959f_22"},{"__ref":"Paragraph:235d9560959f_23"},{"__ref":"Paragraph:235d9560959f_24"},{"__ref":"Paragraph:235d9560959f_25"},{"__ref":"Paragraph:235d9560959f_26"},{"__ref":"Paragraph:235d9560959f_27"},{"__ref":"Paragraph:235d9560959f_28"},{"__ref":"Paragraph:235d9560959f_29"},{"__ref":"Paragraph:235d9560959f_30"},{"__ref":"Paragraph:235d9560959f_31"},{"__ref":"Paragraph:235d9560959f_32"},{"__ref":"Paragraph:235d9560959f_33"},
{"__ref":"Paragraph:235d9560959f_34"}]},"validatedShareKey":"","shareKeyCreator":null},"creator":{"__ref":"User:70814e310ce3"},"inResponseToEntityType":null,"isLocked":false,"isMarkedPaywallOnly":false,"lockedSource":"LOCKED_POST_SOURCE_NONE","mediumUrl":"https:\u002F\u002Fmedium.com\u002Fcoursera-engineering\u002Fdata-driven-content-categorization-89de0104bcbd","primaryTopic":{"__ref":"Topic:ae5d4995e225"},"topics":[{"__typename":"Topic","slug":"education"},{"__typename":"Topic","slug":"data-science"}],"isLimitedState":false,"isPublished":true,"allowResponses":true,"latestPublishedVersion":"235d9560959f","visibility":"PUBLIC","postResponses":{"__typename":"PostResponses","count":4},"responseDistribution":"NOT_DISTRIBUTED","clapCount":780,"title":"Data Driven Content Categorization","isSeries":false,"sequence":null,"uniqueSlug":"data-driven-content-categorization-89de0104bcbd","socialTitle":"","socialDek":"","canonicalUrl":"","metaDescription":"Courses on Coursera have a scale and breadth of diversity makes them hard to categorize. 
This post explains how we took a data driven approach to create relevant and useful categories.","latestPublishedAt":1548178039046,"readingTime":4.486163522012578,"previewContent":{"__typename":"PreviewContent","subtitle":"How Coursera generated course categories from thousands of courses using a data driven clustering approach."},"previewImage":{"__ref":"ImageMetadata:1*A-lEgYtSuSKQZ21ves4JOw.png"},"isShortform":false,"seoTitle":"","firstPublishedAt":1536725620251,"updatedAt":1548178039046,"shortformType":"SHORTFORM_TYPE_LINK","seoDescription":"","viewerEdge":{"__ref":"PostViewerEdge:postId:89de0104bcbd-viewerId:lo_f0984db7dad6"},"isSuspended":false,"license":"ALL_RIGHTS_RESERVED","tags":[{"__ref":"Tag:data-science"},{"__ref":"Tag:education"},{"__ref":"Tag:technology"}],"isFeaturedInPublishedPublication":false,"isNewsletter":false,"statusForCollection":"APPROVED","pendingCollection":null,"detectedLanguage":"en","wordCount":968,"layerCake":3,"responsesLocked":false}}</script><script>window.__MIDDLEWARE_STATE__={"session":{"xsrf":""},"cache":{"cacheStatus":"HIT"}}</script><script src="https://cdn-client.medium.com/lite/static/js/manifest.8b67b313.js"></script><script src="https://cdn-client.medium.com/lite/static/js/9865.1496d74a.js"></script><script src="https://cdn-client.medium.com/lite/static/js/main.94ea62ed.js"></script><script src="https://cdn-client.medium.com/lite/static/js/instrumentation.5bef8967.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/reporting.ff22a7a5.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/9120.5df29668.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/5049.d1ead72d.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/4505.6dfaf853.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/6618.db187378.chunk.js"></script> <script 
src="https://cdn-client.medium.com/lite/static/js/9380.fb176dee.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/2707.dc8dbee4.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/9977.933c1c9a.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/8599.68bc318b.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/3045.1cc3d8cb.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/6349.3329b100.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/2648.26563adf.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/8393.a4ecfb83.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/6428.36238b5a.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/6199.6da73f3b.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/5642.7d9f7f3d.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/6546.67eb283b.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/6834.8aa8d357.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/4492.0c3e1a1d.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/2571.6814b962.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/839.1c286b32.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/6128.f8800a13.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/2135.2e8dc177.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/7975.60bcefe8.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/144.86429b48.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/5240.6281357f.chunk.js"></script> <script 
src="https://cdn-client.medium.com/lite/static/js/8819.c627c2bf.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/8204.d0637ed0.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/PostPage.MainContent.c3ee9367.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/8414.0d800846.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/3974.8d3e0217.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/2527.18a8996d.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/PostResponsesContent.e1e580cb.chunk.js"></script> <script src="https://cdn-client.medium.com/lite/static/js/responses.editor.e89462cb.chunk.js"></script><script>window.main();</script><script>(function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'91357fd79a2afd74',t:'MTczOTc5MjM5My4wMDAwMDA='};var a=document.createElement('script');a.nonce='';a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();</script></body></html>

Pages: 1 2 3 4 5 6 7 8 9 10