<!-- CINXE.COM
dataset – CORE -->
<!DOCTYPE html> <html lang="en-GB" class="no-js"> <head><style>img.lazy{min-height:1px}</style><link rel="preload" href="https://blog.core.ac.uk/wp-content/plugins/w3-total-cache/pub/js/lazyload.min.js" as="script"> <meta charset="UTF-8"> <meta name="viewport" content="width=device-width"> <link rel="profile" href="http://gmpg.org/xfn/11"> <link rel="pingback" href="https://blog.core.ac.uk/xmlrpc.php"> <!--[if lt IE 9]> <script src="https://blog.core.ac.uk/wp-content/themes/twentyfifteen/js/html5.js"></script> <![endif]--> <script>(function(html){html.className = html.className.replace(/\bno-js\b/,'js')})(document.documentElement);</script> <title>dataset – CORE</title> <meta name='robots' content='max-image-preview:large' /> <style>img:is([sizes="auto" i], [sizes^="auto," i]) { contain-intrinsic-size: 3000px 1500px }</style> <link rel='dns-prefetch' href='//secure.gravatar.com' /> <link rel='dns-prefetch' href='//fonts.googleapis.com' /> <link rel='dns-prefetch' href='//v0.wordpress.com' /> <link rel='dns-prefetch' href='//c0.wp.com' /> <link href='https://fonts.gstatic.com' crossorigin rel='preconnect' /> <link rel="alternate" type="application/rss+xml" title="CORE » Feed" href="https://blog.core.ac.uk/feed/" /> <link rel="alternate" type="application/rss+xml" title="CORE » Comments Feed" href="https://blog.core.ac.uk/comments/feed/" /> <link rel="alternate" type="application/rss+xml" title="CORE » dataset Category Feed" href="https://blog.core.ac.uk/category/dataset/feed/" /> <script type="text/javascript"> /* <![CDATA[ */ window._wpemojiSettings = {"baseUrl":"https:\/\/s.w.org\/images\/core\/emoji\/15.0.3\/72x72\/","ext":".png","svgUrl":"https:\/\/s.w.org\/images\/core\/emoji\/15.0.3\/svg\/","svgExt":".svg","source":{"concatemoji":"https:\/\/blog.core.ac.uk\/wp-includes\/js\/wp-emoji-release.min.js?ver=6.7.1"}}; /*! 
This file is auto-generated */ !function(i,n){var o,s,e;function c(e){try{var t={supportTests:e,timestamp:(new Date).valueOf()};sessionStorage.setItem(o,JSON.stringify(t))}catch(e){}}function p(e,t,n){e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(t,0,0);var t=new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data),r=(e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(n,0,0),new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data));return t.every(function(e,t){return e===r[t]})}function u(e,t,n){switch(t){case"flag":return n(e,"\ud83c\udff3\ufe0f\u200d\u26a7\ufe0f","\ud83c\udff3\ufe0f\u200b\u26a7\ufe0f")?!1:!n(e,"\ud83c\uddfa\ud83c\uddf3","\ud83c\uddfa\u200b\ud83c\uddf3")&&!n(e,"\ud83c\udff4\udb40\udc67\udb40\udc62\udb40\udc65\udb40\udc6e\udb40\udc67\udb40\udc7f","\ud83c\udff4\u200b\udb40\udc67\u200b\udb40\udc62\u200b\udb40\udc65\u200b\udb40\udc6e\u200b\udb40\udc67\u200b\udb40\udc7f");case"emoji":return!n(e,"\ud83d\udc26\u200d\u2b1b","\ud83d\udc26\u200b\u2b1b")}return!1}function f(e,t,n){var r="undefined"!=typeof WorkerGlobalScope&&self instanceof WorkerGlobalScope?new OffscreenCanvas(300,150):i.createElement("canvas"),a=r.getContext("2d",{willReadFrequently:!0}),o=(a.textBaseline="top",a.font="600 32px Arial",{});return e.forEach(function(e){o[e]=t(a,e,n)}),o}function t(e){var t=i.createElement("script");t.src=e,t.defer=!0,i.head.appendChild(t)}"undefined"!=typeof Promise&&(o="wpEmojiSettingsSupports",s=["flag","emoji"],n.supports={everything:!0,everythingExceptFlag:!0},e=new Promise(function(e){i.addEventListener("DOMContentLoaded",e,{once:!0})}),new Promise(function(t){var n=function(){try{var e=JSON.parse(sessionStorage.getItem(o));if("object"==typeof e&&"number"==typeof e.timestamp&&(new Date).valueOf()<e.timestamp+604800&&"object"==typeof e.supportTests)return e.supportTests}catch(e){}return null}();if(!n){if("undefined"!=typeof Worker&&"undefined"!=typeof OffscreenCanvas&&"undefined"!=typeof 
URL&&URL.createObjectURL&&"undefined"!=typeof Blob)try{var e="postMessage("+f.toString()+"("+[JSON.stringify(s),u.toString(),p.toString()].join(",")+"));",r=new Blob([e],{type:"text/javascript"}),a=new Worker(URL.createObjectURL(r),{name:"wpTestEmojiSupports"});return void(a.onmessage=function(e){c(n=e.data),a.terminate(),t(n)})}catch(e){}c(n=f(s,u,p))}t(n)}).then(function(e){for(var t in e)n.supports[t]=e[t],n.supports.everything=n.supports.everything&&n.supports[t],"flag"!==t&&(n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&n.supports[t]);n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&!n.supports.flag,n.DOMReady=!1,n.readyCallback=function(){n.DOMReady=!0}}).then(function(){return e}).then(function(){var e;n.supports.everything||(n.readyCallback(),(e=n.source||{}).concatemoji?t(e.concatemoji):e.wpemoji&&e.twemoji&&(t(e.twemoji),t(e.wpemoji)))}))}((window,document),window._wpemojiSettings); /* ]]> */ </script> <link rel='stylesheet' id='twentyfifteen-jetpack-css' href='https://c0.wp.com/p/jetpack/11.9.3/modules/theme-tools/compat/twentyfifteen.css' type='text/css' media='all' /> <style id='wp-emoji-styles-inline-css' type='text/css'> img.wp-smiley, img.emoji { display: inline !important; border: none !important; box-shadow: none !important; height: 1em !important; width: 1em !important; margin: 0 0.07em !important; vertical-align: -0.1em !important; background: none !important; padding: 0 !important; } </style> <link rel='stylesheet' id='wp-block-library-css' href='https://c0.wp.com/c/6.7.1/wp-includes/css/dist/block-library/style.min.css' type='text/css' media='all' /> <style id='wp-block-library-inline-css' type='text/css'> .has-text-align-justify{text-align:justify;} </style> <link rel='stylesheet' id='mediaelement-css' href='https://c0.wp.com/c/6.7.1/wp-includes/js/mediaelement/mediaelementplayer-legacy.min.css' type='text/css' media='all' /> <link rel='stylesheet' id='wp-mediaelement-css' 
href='https://c0.wp.com/c/6.7.1/wp-includes/js/mediaelement/wp-mediaelement.min.css' type='text/css' media='all' /> <style id='classic-theme-styles-inline-css' type='text/css'> /*! This file is auto-generated */ .wp-block-button__link{color:#fff;background-color:#32373c;border-radius:9999px;box-shadow:none;text-decoration:none;padding:calc(.667em + 2px) calc(1.333em + 2px);font-size:1.125em}.wp-block-file__button{background:#32373c;color:#fff;text-decoration:none} </style> <style id='global-styles-inline-css' type='text/css'> :root{--wp--preset--aspect-ratio--square: 1;--wp--preset--aspect-ratio--4-3: 4/3;--wp--preset--aspect-ratio--3-4: 3/4;--wp--preset--aspect-ratio--3-2: 3/2;--wp--preset--aspect-ratio--2-3: 2/3;--wp--preset--aspect-ratio--16-9: 16/9;--wp--preset--aspect-ratio--9-16: 9/16;--wp--preset--color--black: #000000;--wp--preset--color--cyan-bluish-gray: #abb8c3;--wp--preset--color--white: #ffffff;--wp--preset--color--pale-pink: #f78da7;--wp--preset--color--vivid-red: #cf2e2e;--wp--preset--color--luminous-vivid-orange: #ff6900;--wp--preset--color--luminous-vivid-amber: #fcb900;--wp--preset--color--light-green-cyan: #7bdcb5;--wp--preset--color--vivid-green-cyan: #00d084;--wp--preset--color--pale-cyan-blue: #8ed1fc;--wp--preset--color--vivid-cyan-blue: #0693e3;--wp--preset--color--vivid-purple: #9b51e0;--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple: linear-gradient(135deg,rgba(6,147,227,1) 0%,rgb(155,81,224) 100%);--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan: linear-gradient(135deg,rgb(122,220,180) 0%,rgb(0,208,130) 100%);--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange: linear-gradient(135deg,rgba(252,185,0,1) 0%,rgba(255,105,0,1) 100%);--wp--preset--gradient--luminous-vivid-orange-to-vivid-red: linear-gradient(135deg,rgba(255,105,0,1) 0%,rgb(207,46,46) 100%);--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray: linear-gradient(135deg,rgb(238,238,238) 0%,rgb(169,184,195) 
100%);--wp--preset--gradient--cool-to-warm-spectrum: linear-gradient(135deg,rgb(74,234,220) 0%,rgb(151,120,209) 20%,rgb(207,42,186) 40%,rgb(238,44,130) 60%,rgb(251,105,98) 80%,rgb(254,248,76) 100%);--wp--preset--gradient--blush-light-purple: linear-gradient(135deg,rgb(255,206,236) 0%,rgb(152,150,240) 100%);--wp--preset--gradient--blush-bordeaux: linear-gradient(135deg,rgb(254,205,165) 0%,rgb(254,45,45) 50%,rgb(107,0,62) 100%);--wp--preset--gradient--luminous-dusk: linear-gradient(135deg,rgb(255,203,112) 0%,rgb(199,81,192) 50%,rgb(65,88,208) 100%);--wp--preset--gradient--pale-ocean: linear-gradient(135deg,rgb(255,245,203) 0%,rgb(182,227,212) 50%,rgb(51,167,181) 100%);--wp--preset--gradient--electric-grass: linear-gradient(135deg,rgb(202,248,128) 0%,rgb(113,206,126) 100%);--wp--preset--gradient--midnight: linear-gradient(135deg,rgb(2,3,129) 0%,rgb(40,116,252) 100%);--wp--preset--font-size--small: 13px;--wp--preset--font-size--medium: 20px;--wp--preset--font-size--large: 36px;--wp--preset--font-size--x-large: 42px;--wp--preset--spacing--20: 0.44rem;--wp--preset--spacing--30: 0.67rem;--wp--preset--spacing--40: 1rem;--wp--preset--spacing--50: 1.5rem;--wp--preset--spacing--60: 2.25rem;--wp--preset--spacing--70: 3.38rem;--wp--preset--spacing--80: 5.06rem;--wp--preset--shadow--natural: 6px 6px 9px rgba(0, 0, 0, 0.2);--wp--preset--shadow--deep: 12px 12px 50px rgba(0, 0, 0, 0.4);--wp--preset--shadow--sharp: 6px 6px 0px rgba(0, 0, 0, 0.2);--wp--preset--shadow--outlined: 6px 6px 0px -3px rgba(255, 255, 255, 1), 6px 6px rgba(0, 0, 0, 1);--wp--preset--shadow--crisp: 6px 6px 0px rgba(0, 0, 0, 1);}:where(.is-layout-flex){gap: 0.5em;}:where(.is-layout-grid){gap: 0.5em;}body .is-layout-flex{display: flex;}.is-layout-flex{flex-wrap: wrap;align-items: center;}.is-layout-flex > :is(*, div){margin: 0;}body .is-layout-grid{display: grid;}.is-layout-grid > :is(*, div){margin: 0;}:where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 
2em;}:where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;}.has-black-color{color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-color{color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-color{color: var(--wp--preset--color--white) !important;}.has-pale-pink-color{color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-color{color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-color{color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-color{color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-color{color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-color{color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-color{color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-color{color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-color{color: var(--wp--preset--color--vivid-purple) !important;}.has-black-background-color{background-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-background-color{background-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-background-color{background-color: var(--wp--preset--color--white) !important;}.has-pale-pink-background-color{background-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-background-color{background-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-background-color{background-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-background-color{background-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-background-color{background-color: var(--wp--preset--color--light-green-cyan) 
!important;}.has-vivid-green-cyan-background-color{background-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-background-color{background-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-background-color{background-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-background-color{background-color: var(--wp--preset--color--vivid-purple) !important;}.has-black-border-color{border-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-border-color{border-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-border-color{border-color: var(--wp--preset--color--white) !important;}.has-pale-pink-border-color{border-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-border-color{border-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-border-color{border-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-border-color{border-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-border-color{border-color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-border-color{border-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-border-color{border-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-border-color{border-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-border-color{border-color: var(--wp--preset--color--vivid-purple) !important;}.has-vivid-cyan-blue-to-vivid-purple-gradient-background{background: var(--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple) !important;}.has-light-green-cyan-to-vivid-green-cyan-gradient-background{background: var(--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan) 
!important;}.has-luminous-vivid-amber-to-luminous-vivid-orange-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange) !important;}.has-luminous-vivid-orange-to-vivid-red-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-orange-to-vivid-red) !important;}.has-very-light-gray-to-cyan-bluish-gray-gradient-background{background: var(--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray) !important;}.has-cool-to-warm-spectrum-gradient-background{background: var(--wp--preset--gradient--cool-to-warm-spectrum) !important;}.has-blush-light-purple-gradient-background{background: var(--wp--preset--gradient--blush-light-purple) !important;}.has-blush-bordeaux-gradient-background{background: var(--wp--preset--gradient--blush-bordeaux) !important;}.has-luminous-dusk-gradient-background{background: var(--wp--preset--gradient--luminous-dusk) !important;}.has-pale-ocean-gradient-background{background: var(--wp--preset--gradient--pale-ocean) !important;}.has-electric-grass-gradient-background{background: var(--wp--preset--gradient--electric-grass) !important;}.has-midnight-gradient-background{background: var(--wp--preset--gradient--midnight) !important;}.has-small-font-size{font-size: var(--wp--preset--font-size--small) !important;}.has-medium-font-size{font-size: var(--wp--preset--font-size--medium) !important;}.has-large-font-size{font-size: var(--wp--preset--font-size--large) !important;}.has-x-large-font-size{font-size: var(--wp--preset--font-size--x-large) !important;} :where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;} :where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 2em;} :root :where(.wp-block-pullquote){font-size: 1.5em;line-height: 1.6;} </style> <link rel="stylesheet" href="https://blog.core.ac.uk/wp-content/cache/minify/3de15.css" media="all" /> <style id='ez-toc-inline-css' 
type='text/css'>
/* Easy Table of Contents: title and list typography. */
div#ez-toc-container p.ez-toc-title { font-size: 120%; font-weight: 500; }
div#ez-toc-container ul li { font-size: 95%; }
/* NOTE(review): the generated rule
   "div#ez-toc-container nav ul ul li ul li {font-size: %!important;}"
   was dropped here. Its value had no number, so the declaration was invalid
   and browsers discarded it. Presumably a plugin font-size option is empty;
   confirm in the plugin settings and regenerate. */

/* Numbered TOC entries. "decimal" replaces the non-existent counter style
   "numeric", which browsers only rendered via their decimal fallback. */
.ez-toc-container-direction { direction: ltr; }
.ez-toc-counter ul { direction: ltr; counter-reset: item; }
.ez-toc-counter nav ul li a::before {
  content: counter(item, decimal) ". ";
  margin-right: .2em;
  counter-increment: item;
  flex-grow: 0;
  flex-shrink: 0;
  float: left;
}
.ez-toc-widget-direction { direction: ltr; }
.ez-toc-widget-container ul { direction: ltr; counter-reset: item; }
.ez-toc-widget-container nav ul li a::before {
  content: counter(item, decimal) ". ";
  margin-right: .2em;
  counter-increment: item;
  flex-grow: 0;
  flex-shrink: 0;
  float: left;
}
</style>
<!-- The "&" in the query string is written as "&amp;" so the attribute value is valid HTML. -->
<link rel='stylesheet' id='twentyfifteen-fonts-css' href='https://fonts.googleapis.com/css?family=Noto+Sans%3A400italic%2C700italic%2C400%2C700%7CNoto+Serif%3A400italic%2C700italic%2C400%2C700%7CInconsolata%3A400%2C700&amp;subset=latin%2Clatin-ext' type='text/css' media='all' />
<link rel='stylesheet' id='genericons-css' href='https://c0.wp.com/p/jetpack/11.9.3/_inc/genericons/genericons/genericons.css' type='text/css' media='all' />
<link rel="stylesheet" href="https://blog.core.ac.uk/wp-content/cache/minify/b09a7.css" media="all" />
<style id='twentyfifteen-style-inline-css' type='text/css'>
/* Custom Sidebar Text Color */
.site-title a,
.site-description,
.secondary-toggle:before {
  color: #b75400;
}
.site-title a:hover,
.site-title a:focus {
  color: #b75400; /* Fallback for IE7 and IE8 */
  color: rgba( 183, 84, 0, 0.7);
}
.secondary-toggle {
  border-color: #b75400; /* Fallback for IE7 and IE8 */
  border-color: rgba( 183, 84, 0, 0.1);
}
.secondary-toggle:hover,
.secondary-toggle:focus {
  border-color: #b75400; /* Fallback for IE7 and IE8 */
  border-color: rgba( 183, 84, 0, 0.3);
}
.site-title a {
  outline-color: #b75400; /* Fallback for IE7 and IE8 */
  outline-color: rgba( 183, 84, 0, 0.3);
}
@media screen
and (min-width: 59.6875em) { .secondary a, .dropdown-toggle:after, .widget-title, .widget blockquote cite, .widget blockquote small { color: #b75400; } .widget button, .widget input[type="button"], .widget input[type="reset"], .widget input[type="submit"], .widget_calendar tbody a { background-color: #b75400; } .textwidget a { border-color: #b75400; } .secondary a:hover, .secondary a:focus, .main-navigation .menu-item-description, .widget, .widget blockquote, .widget .wp-caption-text, .widget .gallery-caption { color: rgba( 183, 84, 0, 0.7); } .widget button:hover, .widget button:focus, .widget input[type="button"]:hover, .widget input[type="button"]:focus, .widget input[type="reset"]:hover, .widget input[type="reset"]:focus, .widget input[type="submit"]:hover, .widget input[type="submit"]:focus, .widget_calendar tbody a:hover, .widget_calendar tbody a:focus { background-color: rgba( 183, 84, 0, 0.7); } .widget blockquote { border-color: rgba( 183, 84, 0, 0.7); } .main-navigation ul, .main-navigation li, .secondary-toggle, .widget input, .widget textarea, .widget table, .widget th, .widget td, .widget pre, .widget li, .widget_categories .children, .widget_nav_menu .sub-menu, .widget_pages .children, .widget abbr[title] { border-color: rgba( 183, 84, 0, 0.1); } .dropdown-toggle:hover, .dropdown-toggle:focus, .widget hr { background-color: rgba( 183, 84, 0, 0.1); } .widget input:focus, .widget textarea:focus { border-color: rgba( 183, 84, 0, 0.3); } .sidebar a:focus, .dropdown-toggle:focus { outline-color: rgba( 183, 84, 0, 0.3); } } </style> <!--[if lt IE 9]> <link rel='stylesheet' id='twentyfifteen-ie-css' href='https://blog.core.ac.uk/wp-content/themes/twentyfifteen/css/ie.css?ver=20141010' type='text/css' media='all' /> <![endif]--> <!--[if lt IE 8]> <link rel='stylesheet' id='twentyfifteen-ie7-css' href='https://blog.core.ac.uk/wp-content/themes/twentyfifteen/css/ie7.css?ver=20141010' type='text/css' media='all' /> <![endif]--> <link rel="stylesheet" 
href="https://blog.core.ac.uk/wp-content/cache/minify/1881d.css" media="all" /> <style id='ecae-frontend-inline-css' type='text/css'> .ecae-button { display: inline-block !important; } </style> <link rel="stylesheet" href="https://blog.core.ac.uk/wp-content/cache/minify/9210e.css" media="all" /> <link rel='stylesheet' id='jetpack_css-css' href='https://c0.wp.com/p/jetpack/11.9.3/css/jetpack.css' type='text/css' media='all' /> <script type="text/javascript" src="https://c0.wp.com/c/6.7.1/wp-includes/js/jquery/jquery.min.js" id="jquery-core-js"></script> <script type="text/javascript" src="https://c0.wp.com/c/6.7.1/wp-includes/js/jquery/jquery-migrate.min.js" id="jquery-migrate-js"></script> <script type="text/javascript" id="ez-toc-scroll-scriptjs-js-after"> /* <![CDATA[ */ jQuery(document).ready(function(){document.querySelectorAll(".ez-toc-section").forEach(t=>{t.setAttribute("ez-toc-data-id","#"+decodeURI(t.getAttribute("id")))}),jQuery("a.ez-toc-link").click(function(){let t=jQuery(this).attr("href"),e=jQuery("#wpadminbar"),i=0;30>30&&(i=30),e.length&&(i+=e.height()),jQuery('[ez-toc-data-id="'+decodeURI(t)+'"]').length>0&&(i=jQuery('[ez-toc-data-id="'+decodeURI(t)+'"]').offset().top-i),jQuery("html, body").animate({scrollTop:i},500)})}); /* ]]> */ </script> <link rel="https://api.w.org/" href="https://blog.core.ac.uk/wp-json/" /><link rel="alternate" title="JSON" type="application/json" href="https://blog.core.ac.uk/wp-json/wp/v2/categories/58" /><link rel="EditURI" type="application/rsd+xml" title="RSD" href="https://blog.core.ac.uk/xmlrpc.php?rsd" /> <meta name="generator" content="WordPress 6.7.1" /> <style>img#wpstats{display:none}</style> <style type="text/css">.recentcomments a{display:inline !important;padding:0 !important;margin:0 !important;}</style><style type="text/css" id="custom-background-css"> body.custom-background { background-color: #f5f5f5; } </style> <!-- Jetpack Open Graph Tags --> <meta property="og:type" content="website" /> <meta 
property="og:title" content="dataset – CORE" />
<meta property="og:url" content="https://blog.core.ac.uk/category/dataset/" />
<meta property="og:site_name" content="CORE" />
<meta property="og:image" content="https://blog.core.ac.uk/wp-content/uploads/2023/11/cropped-favicon.png" />
<meta property="og:image:width" content="512" />
<meta property="og:image:height" content="512" />
<meta property="og:image:alt" content="" />
<meta property="og:locale" content="en_GB" />
<!-- End Jetpack Open Graph Tags -->
<link rel="icon" href="https://blog.core.ac.uk/wp-content/uploads/2023/11/cropped-favicon-32x32.png" sizes="32x32" />
<link rel="icon" href="https://blog.core.ac.uk/wp-content/uploads/2023/11/cropped-favicon-192x192.png" sizes="192x192" />
<link rel="apple-touch-icon" href="https://blog.core.ac.uk/wp-content/uploads/2023/11/cropped-favicon-180x180.png" />
<meta name="msapplication-TileImage" content="https://blog.core.ac.uk/wp-content/uploads/2023/11/cropped-favicon-270x270.png" />
<script>
  /*
   * Google Analytics (analytics.js) bootstrap with a cookie-based opt-out.
   *
   * Only block comments are used in this script. The page is emitted with
   * its whitespace collapsed, and a line comment would then swallow every
   * statement that follows it on the same line.
   *
   * NOTE(review): "UA-" IDs are Universal Analytics properties, which Google
   * stopped processing in 2023. Confirm whether this snippet should be
   * migrated or removed.
   */

  /* Set to the same value as the web property used on the site. */
  var gaProperty = 'UA-66779096-1';

  /* Name shared by the opt-out cookie and the window flag set below. */
  var disableStr = 'ga-disable-' + gaProperty;

  /* Opt-out function: stores a long-lived opt-out cookie and sets the flag on this page. */
  function gaOptout() {
    document.cookie = disableStr + '=true; expires=Thu, 31 Dec 2099 23:59:59 UTC; path=/';
    window[disableStr] = true;
  }

  /* Disable tracking if the opt-out cookie exists. */
  if (document.cookie.indexOf(disableStr + '=true') > -1) {
    window[disableStr] = true;
  }

  /* Now load GA over HTTPS. Tracking beacon will not be sent if user has opted out. */
  (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
  (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
  m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
  })(window,document,'script','https://www.google-analytics.com/analytics.js','ga');

  /* Reuse gaProperty so the tracker and the opt-out flag cannot drift apart. */
  ga('create', gaProperty, 'auto');
  ga('send', 'pageview');
</script>
</head>
<body class="archive category category-dataset category-58 custom-background">
<div id="page" class="hfeed site">
  <a class="skip-link screen-reader-text" href="#content">Skip to content</a>
  <div id="sidebar" class="sidebar">
    <header id="masthead" class="site-header" role="banner">
      <div class="site-branding">
        <p class="site-title">
          <a href="https://blog.core.ac.uk/" rel="home">
            <img class="lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%201%201'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/themes/twentyfifteen-child/images/core_logo.png" alt="CORE" />
          </a>
        </p>
        <button class="secondary-toggle">Menu and widgets</button>
      </div><!-- .site-branding -->
    </header><!-- .site-header -->
    <!--<div class="widget"> <form method="post" action="http://core.ac.uk/search"> <input type="text" class="search_bar defaultText defaultTextActive" placeholder="Search CORE" id="searchCriteria" name="searchCriteria" value="" size="20" style="font-size: 19px; padding-left: 5px; width: 475px;"> </form> </div> -->
    <div id="secondary" class="secondary">
      <div id="widget-area" class="widget-area" role="complementary">
        <aside id="recent-posts-2" class="widget widget_recent_entries">
          <h2 class="widget-title">Recent Posts</h2>
          <ul>
            <li>
              <a href="https://blog.core.ac.uk/2024/11/12/introducing-the-sdg-classification-module-for-the-core-dashboard/">Introducing the SDG Classification Module for the CORE Dashboard</a>
            </li>
            <li>
              <a
href="https://blog.core.ac.uk/2024/10/01/the-core-rights-retention-statement-tracker/">The CORE Rights Retention Statement tracker</a> </li> <li> <a href="https://blog.core.ac.uk/2024/09/19/core-board-of-supporters-meeting/">CORE Board of Supporters Meeting </a> </li> <li> <a href="https://blog.core.ac.uk/2024/06/12/a-review-of-core-at-open-repositories-2024/">A review of CORE at Open Repositories 2024</a> </li> <li> <a href="https://blog.core.ac.uk/2024/05/23/core-launches-reindexing-button-for-data-providers/">CORE launches reindexing button for data providers</a> </li> </ul> </aside><aside id="block-3" class="widget widget_block widget_search"><form role="search" method="get" action="https://blog.core.ac.uk/" class="wp-block-search__button-outside wp-block-search__text-button wp-block-search" ><label class="wp-block-search__label" for="wp-block-search__input-1" >Search</label><div class="wp-block-search__inside-wrapper " ><input class="wp-block-search__input" id="wp-block-search__input-1" placeholder="" value="" type="search" name="s" required /><button aria-label="Search" class="wp-block-search__button wp-element-button" type="submit" >Search</button></div></form></aside><aside id="recent-comments-2" class="widget widget_recent_comments"><h2 class="widget-title">Recent Comments</h2><ul id="recentcomments"><li class="recentcomments"><span class="comment-author-link"><a href="https://www.arl.org/day-in-review/day-in-review-january-16-18/" class="url" rel="ugc external nofollow">Day in Review (January 16–18) - Association of Research Libraries</a></span> on <a href="https://blog.core.ac.uk/2024/01/18/university-of-chicago-adopts-cores-article-deduplication-tool/#comment-120">University of Chicago adopts CORE’s article deduplication tool</a></li><li class="recentcomments"><span class="comment-author-link"><a href="https://www.arl.org/day-in-review/day-in-review-november-13-16/" class="url" rel="ugc external nofollow">Day in Review (November 13–16) - Association of 
Research Libraries</a></span> on <a href="https://blog.core.ac.uk/2023/11/07/sofair-the-open-university-to-coordinate-new-international-project-to-facilitate-the-reproducibility-of-research-studies/#comment-119">SoFAIR: The Open University to coordinate new international project to facilitate the reproducibility of research studies</a></li><li class="recentcomments"><span class="comment-author-link">Petr Knoth</span> on <a href="https://blog.core.ac.uk/2023/03/02/core-welcomes-10-new-members/#comment-113">CORE welcomes 10 new members</a></li><li class="recentcomments"><span class="comment-author-link"><a href="https://purl.org/g3om4c" class="url" rel="ugc external nofollow">George Macgregor</a></span> on <a href="https://blog.core.ac.uk/2023/03/02/core-welcomes-10-new-members/#comment-112">CORE welcomes 10 new members</a></li><li class="recentcomments"><span class="comment-author-link"><a href="https://lib.uct.ac.za/digitalservices" class="url" rel="ugc external nofollow">Niklas Zimmer</a></span> on <a href="https://blog.core.ac.uk/2022/11/07/1419/#comment-111">CORE to become an independent Open Access service from August 2023</a></li></ul></aside><aside id="archives-2" class="widget widget_archive"><h2 class="widget-title">Archives</h2> <ul> <li><a href='https://blog.core.ac.uk/2024/11/'>November 2024</a></li> <li><a href='https://blog.core.ac.uk/2024/10/'>October 2024</a></li> <li><a href='https://blog.core.ac.uk/2024/09/'>September 2024</a></li> <li><a href='https://blog.core.ac.uk/2024/06/'>June 2024</a></li> <li><a href='https://blog.core.ac.uk/2024/05/'>May 2024</a></li> <li><a href='https://blog.core.ac.uk/2024/04/'>April 2024</a></li> <li><a href='https://blog.core.ac.uk/2024/03/'>March 2024</a></li> <li><a href='https://blog.core.ac.uk/2024/02/'>February 2024</a></li> <li><a href='https://blog.core.ac.uk/2024/01/'>January 2024</a></li> <li><a href='https://blog.core.ac.uk/2023/12/'>December 2023</a></li> <li><a 
href='https://blog.core.ac.uk/2023/11/'>November 2023</a></li> <li><a href='https://blog.core.ac.uk/2023/10/'>October 2023</a></li> <li><a href='https://blog.core.ac.uk/2023/08/'>August 2023</a></li> <li><a href='https://blog.core.ac.uk/2023/07/'>July 2023</a></li> <li><a href='https://blog.core.ac.uk/2023/06/'>June 2023</a></li> <li><a href='https://blog.core.ac.uk/2023/04/'>April 2023</a></li> <li><a href='https://blog.core.ac.uk/2023/03/'>March 2023</a></li> <li><a href='https://blog.core.ac.uk/2022/11/'>November 2022</a></li> <li><a href='https://blog.core.ac.uk/2022/10/'>October 2022</a></li> <li><a href='https://blog.core.ac.uk/2022/09/'>September 2022</a></li> <li><a href='https://blog.core.ac.uk/2022/06/'>June 2022</a></li> <li><a href='https://blog.core.ac.uk/2022/05/'>May 2022</a></li> <li><a href='https://blog.core.ac.uk/2022/04/'>April 2022</a></li> <li><a href='https://blog.core.ac.uk/2022/03/'>March 2022</a></li> <li><a href='https://blog.core.ac.uk/2022/02/'>February 2022</a></li> <li><a href='https://blog.core.ac.uk/2022/01/'>January 2022</a></li> <li><a href='https://blog.core.ac.uk/2021/10/'>October 2021</a></li> <li><a href='https://blog.core.ac.uk/2021/09/'>September 2021</a></li> <li><a href='https://blog.core.ac.uk/2021/08/'>August 2021</a></li> <li><a href='https://blog.core.ac.uk/2021/07/'>July 2021</a></li> <li><a href='https://blog.core.ac.uk/2021/06/'>June 2021</a></li> <li><a href='https://blog.core.ac.uk/2021/04/'>April 2021</a></li> <li><a href='https://blog.core.ac.uk/2021/03/'>March 2021</a></li> <li><a href='https://blog.core.ac.uk/2021/02/'>February 2021</a></li> <li><a href='https://blog.core.ac.uk/2020/12/'>December 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/11/'>November 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/10/'>October 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/09/'>September 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/08/'>August 2020</a></li> <li><a 
href='https://blog.core.ac.uk/2020/07/'>July 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/06/'>June 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/05/'>May 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/04/'>April 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/03/'>March 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/02/'>February 2020</a></li> <li><a href='https://blog.core.ac.uk/2020/01/'>January 2020</a></li> <li><a href='https://blog.core.ac.uk/2019/12/'>December 2019</a></li> <li><a href='https://blog.core.ac.uk/2019/11/'>November 2019</a></li> <li><a href='https://blog.core.ac.uk/2019/10/'>October 2019</a></li> <li><a href='https://blog.core.ac.uk/2019/07/'>July 2019</a></li> <li><a href='https://blog.core.ac.uk/2018/12/'>December 2018</a></li> <li><a href='https://blog.core.ac.uk/2018/03/'>March 2018</a></li> <li><a href='https://blog.core.ac.uk/2017/12/'>December 2017</a></li> <li><a href='https://blog.core.ac.uk/2017/11/'>November 2017</a></li> <li><a href='https://blog.core.ac.uk/2017/10/'>October 2017</a></li> <li><a href='https://blog.core.ac.uk/2017/05/'>May 2017</a></li> <li><a href='https://blog.core.ac.uk/2017/02/'>February 2017</a></li> <li><a href='https://blog.core.ac.uk/2017/01/'>January 2017</a></li> <li><a href='https://blog.core.ac.uk/2016/12/'>December 2016</a></li> <li><a href='https://blog.core.ac.uk/2016/10/'>October 2016</a></li> <li><a href='https://blog.core.ac.uk/2016/07/'>July 2016</a></li> <li><a href='https://blog.core.ac.uk/2016/06/'>June 2016</a></li> <li><a href='https://blog.core.ac.uk/2016/04/'>April 2016</a></li> <li><a href='https://blog.core.ac.uk/2016/01/'>January 2016</a></li> <li><a href='https://blog.core.ac.uk/2015/12/'>December 2015</a></li> <li><a href='https://blog.core.ac.uk/2015/10/'>October 2015</a></li> <li><a href='https://blog.core.ac.uk/2015/09/'>September 2015</a></li> <li><a href='https://blog.core.ac.uk/2015/03/'>March 2015</a></li> <li><a 
href='https://blog.core.ac.uk/2014/03/'>March 2014</a></li> <li><a href='https://blog.core.ac.uk/2013/07/'>July 2013</a></li> <li><a href='https://blog.core.ac.uk/2013/06/'>June 2013</a></li> <li><a href='https://blog.core.ac.uk/2013/05/'>May 2013</a></li> <li><a href='https://blog.core.ac.uk/2012/11/'>November 2012</a></li> <li><a href='https://blog.core.ac.uk/2012/07/'>July 2012</a></li> <li><a href='https://blog.core.ac.uk/2012/06/'>June 2012</a></li> <li><a href='https://blog.core.ac.uk/2012/05/'>May 2012</a></li> <li><a href='https://blog.core.ac.uk/2012/04/'>April 2012</a></li> <li><a href='https://blog.core.ac.uk/2012/03/'>March 2012</a></li> <li><a href='https://blog.core.ac.uk/2012/02/'>February 2012</a></li> <li><a href='https://blog.core.ac.uk/2011/12/'>December 2011</a></li> <li><a href='https://blog.core.ac.uk/2011/09/'>September 2011</a></li> <li><a href='https://blog.core.ac.uk/2011/08/'>August 2011</a></li> <li><a href='https://blog.core.ac.uk/2011/07/'>July 2011</a></li> <li><a href='https://blog.core.ac.uk/2011/06/'>June 2011</a></li> <li><a href='https://blog.core.ac.uk/2011/05/'>May 2011</a></li> <li><a href='https://blog.core.ac.uk/2011/04/'>April 2011</a></li> <li><a href='https://blog.core.ac.uk/2011/03/'>March 2011</a></li> </ul> </aside><aside id="categories-2" class="widget widget_categories"><h2 class="widget-title">Categories</h2> <ul> <li class="cat-item cat-item-6"><a href="https://blog.core.ac.uk/category/aggregation/">aggregation</a> </li> <li class="cat-item cat-item-120"><a href="https://blog.core.ac.uk/category/ambassador/">ambassador</a> </li> <li class="cat-item cat-item-81"><a href="https://blog.core.ac.uk/category/api/">API</a> </li> <li class="cat-item cat-item-15"><a href="https://blog.core.ac.uk/category/conferences/">conferences</a> </li> <li class="cat-item cat-item-7"><a href="https://blog.core.ac.uk/category/core/">CORE</a> </li> <li class="cat-item cat-item-234"><a 
href="https://blog.core.ac.uk/category/core-membership/">CORE Membership</a> </li> <li class="cat-item cat-item-183"><a href="https://blog.core.ac.uk/category/coreupdate/">COREupdate</a> </li> <li class="cat-item cat-item-173"><a href="https://blog.core.ac.uk/category/dashboard/">dashboard</a> </li> <li class="cat-item cat-item-58 current-cat"><a aria-current="page" href="https://blog.core.ac.uk/category/dataset/">dataset</a> </li> <li class="cat-item cat-item-106"><a href="https://blog.core.ac.uk/category/discovery/">discovery</a> </li> <li class="cat-item cat-item-246"><a href="https://blog.core.ac.uk/category/events/">Events</a> </li> <li class="cat-item cat-item-86"><a href="https://blog.core.ac.uk/category/growth/">growth</a> </li> <li class="cat-item cat-item-5"><a href="https://blog.core.ac.uk/category/harvesting/">harvesting</a> </li> <li class="cat-item cat-item-240"><a href="https://blog.core.ac.uk/category/hype/">Hype</a> </li> <li class="cat-item cat-item-177"><a href="https://blog.core.ac.uk/category/integration/">Integration</a> </li> <li class="cat-item cat-item-241"><a href="https://blog.core.ac.uk/category/news/">News</a> </li> <li class="cat-item cat-item-112"><a href="https://blog.core.ac.uk/category/newsletter/">newsletter</a> </li> <li class="cat-item cat-item-223"><a href="https://blog.core.ac.uk/category/on-merrit/">ON-MERRIT</a> </li> <li class="cat-item cat-item-243"><a href="https://blog.core.ac.uk/category/projects/">Projects</a> </li> <li class="cat-item cat-item-51"><a href="https://blog.core.ac.uk/category/recommender/">recommender</a> </li> <li class="cat-item cat-item-4"><a href="https://blog.core.ac.uk/category/repositories/">repositories</a> </li> <li class="cat-item cat-item-82"><a href="https://blog.core.ac.uk/category/sdk/">SDK</a> </li> <li class="cat-item cat-item-203"><a href="https://blog.core.ac.uk/category/statistics/">statistics</a> </li> <li class="cat-item cat-item-1"><a 
href="https://blog.core.ac.uk/category/uncategorised/">Uncategorised</a> </li> <li class="cat-item cat-item-217"><a href="https://blog.core.ac.uk/category/webinar/">webinar</a> </li> </ul> </aside><aside id="meta-2" class="widget widget_meta"><h2 class="widget-title">Meta</h2> <ul> <li><a href="https://blog.core.ac.uk/core-admin/">Log in</a></li> <li><a href="https://blog.core.ac.uk/feed/">Entries feed</a></li> <li><a href="https://blog.core.ac.uk/comments/feed/">Comments feed</a></li> <li><a href="https://en-gb.wordpress.org/">WordPress.org</a></li> </ul> </aside> </div><!-- .widget-area --> </div><!-- .secondary --> </div><!-- .sidebar --> <div id="content" class="site-content"> <a href="http://core.ac.uk" class="content-link">← Back to the CORE Portal</a> <section id="primary" class="content-area"> <main id="main" class="site-main" role="main"> <header class="page-header"> <h1 class="page-title">Category: <span>dataset</span></h1> </header><!-- .page-header --> <article id="post-1535" class="post-1535 post type-post status-publish format-standard hentry category-api category-dataset category-newsletter"> <header class="entry-header"> <h2 class="entry-title"><a href="https://blog.core.ac.uk/2023/07/17/core-grobid-structured-text-from-34-million-scientific-documents-and-counting/" rel="bookmark">CORE + GROBID: Structured Text from 34 Million Scientific Documents (and counting)</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <!-- Begin :: Generated by Easy Custom Auto Excerpt --><div class="ecae" style=""> <p>We very recently surveyed our <a rel="noreferrer noopener" href="https://core.ac.uk/membership" data-type="URL" data-id="https://core.ac.uk/membership" target="_blank">CORE members</a> to ask what was most important to them and we received <a rel="noreferrer noopener" href="https://blog.core.ac.uk/2023/07/06/asking-core-members-what-matters-to-them/" data-type="URL" 
data-id="https://blog.core.ac.uk/2023/07/06/asking-core-members-what-matters-to-them/" target="_blank">wide-ranging feedback</a>. The CORE dashboard provides a range of tools for our data providers and their repository managers and users. Much of the feedback we received was regarding providing additional or enhanced tools for managing repository content via the dashboard. For example, metadata validation and enrichment tools were regarded as highly important. </p> <p>Interestingly however, what was most important was making repository content machine-readable. This is closely linked to identifying funding information and rights-retention strategies. Ensuring content is machine-readable allows for the extraction of far richer information from full-text documents than that available in the metadata alone. In the U.S., the recent <a rel="noreferrer noopener" href="https://www.whitehouse.gov/wp-content/uploads/2022/08/08-2022-OSTP-Public-Access-Memo.pdf" target="_blank">OSTP memo</a> on ‘<em>Ensuring Free, Immediate, and Equitable Access to Federally Funded Research</em>’ includes machine-readability as a required component of the archiving and deposition of federally funded research.<span class="ecae-button ecae-buttonskin-none" style="text-align:left" > <a class="ecae-link" href="https://blog.core.ac.uk/2023/07/17/core-grobid-structured-text-from-34-million-scientific-documents-and-counting/"><span>read more...</span></a></span></p></div><!-- End :: Generated by Easy Custom Auto Excerpt --> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2023/07/17/core-grobid-structured-text-from-34-million-scientific-documents-and-counting/" rel="bookmark"><time class="entry-date published" datetime="2023-07-17T15:54:03+01:00">17th July 2023</time><time class="updated" datetime="2023-07-18T14:24:55+01:00">18th July 2023</time></a></span><span class="byline"><span 
class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/davidpride/">David Pride</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/api/" rel="category tag">API</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/newsletter/" rel="category tag">newsletter</a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-1353" class="post-1353 post type-post status-publish format-standard hentry category-core category-dataset tag-core tag-data tag-dataset tag-research"> <header class="entry-header"> <h2 class="entry-title"><a href="https://blog.core.ac.uk/2022/02/21/using-open-access-research-in-our-battle-against-misinformation/" rel="bookmark">Using open access research in our battle against misinformation</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <!-- Begin :: Generated by Easy Custom Auto Excerpt --><div class="ecae" style=""> <p class="has-text-align-justify">Our society is facing significant challenges due to the widespread misinformation, in particular on social media, substantially influencing public opinion. As a result, we are seeing a lot of demand for innovative text processing methods to fact check and provide an automatic assessment of trustworthiness and credibility. Machine learning and natural language processing have started to be widely used to address this problem. 
</p> <p>While scientific papers have been traditionally seen as a source of mostly trustworthy information, their use within automated tools in the fight against misinformation, such as related to vaccine effectiveness or climate changes, has been rather limited.<span class="ecae-button ecae-buttonskin-none" style="text-align:left" > <a class="ecae-link" href="https://blog.core.ac.uk/2022/02/21/using-open-access-research-in-our-battle-against-misinformation/"><span>read more...</span></a></span></p></div><!-- End :: Generated by Easy Custom Auto Excerpt --> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2022/02/21/using-open-access-research-in-our-battle-against-misinformation/" rel="bookmark"><time class="entry-date published" datetime="2022-02-21T13:04:26+00:00">21st February 2022</time><time class="updated" datetime="2022-02-21T13:04:29+00:00">21st February 2022</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/admin/">CORE Admin</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://blog.core.ac.uk/tag/core/" rel="tag">core</a>, <a href="https://blog.core.ac.uk/tag/data/" rel="tag">data</a>, <a href="https://blog.core.ac.uk/tag/dataset/" rel="tag">dataset</a>, <a href="https://blog.core.ac.uk/tag/research/" rel="tag">research</a></span><span class="comments-link"><a href="https://blog.core.ac.uk/2022/02/21/using-open-access-research-in-our-battle-against-misinformation/#comments">1 Comment<span class="screen-reader-text"> on Using open 
access research in our battle against misinformation</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-1315" class="post-1315 post type-post status-publish format-standard hentry category-api category-core category-dataset category-newsletter tag-core tag-core-integration-api tag-coreapi tag-database tag-dataset tag-metadata tag-openacccess"> <header class="entry-header"> <h2 class="entry-title"><a href="https://blog.core.ac.uk/2021/10/15/partnership-announcement-cypris-and-core/" rel="bookmark">Partnership Announcement: Cypris and CORE</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <!-- Begin :: Generated by Easy Custom Auto Excerpt --><div class="ecae" style=""> <p class="has-text-align-justify"><strong>We’re delighted to announce a new partnership between CORE and </strong><a href="https://ipcypris.com/"><strong>Cypris</strong></a><strong>, a leading AI-driven, market intelligence platform that connects research & development (R&D) teams with innovation data and trends in their field.</strong></p> <figure class="wp-block-image size-large"><a href="https://blog.core.ac.uk/wp-content/uploads/2021/10/Cypris-and-CORE.jpg"><img fetchpriority="high" decoding="async" width="1024" height="586" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%201024%20586'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2021/10/Cypris-and-CORE-1024x586.jpg" alt="" class="wp-image-1316 lazy" data-srcset="https://blog.core.ac.uk/wp-content/uploads/2021/10/Cypris-and-CORE-1024x586.jpg 1024w, https://blog.core.ac.uk/wp-content/uploads/2021/10/Cypris-and-CORE-300x172.jpg 300w, https://blog.core.ac.uk/wp-content/uploads/2021/10/Cypris-and-CORE-768x440.jpg 768w, https://blog.core.ac.uk/wp-content/uploads/2021/10/Cypris-and-CORE.jpg 1100w" data-sizes="(max-width: 1024px) 100vw, 1024px" /></a></figure> <p class="has-text-align-justify">The partnership will provide Cypris with 
unlimited access to over 210 million open access articles to further enhance their platform and regularly add live market data to provide R&D teams with the most up-to-date research in their fields of interest.</p> <p>Continue reading this news on the <a href="https://research.jiscinvolve.org/wp/2021/10/15/partnership-announcement-cypris-and-core/" data-type="URL" data-id="https://research.jiscinvolve.org/wp/2021/10/15/partnership-announcement-cypris-and-core/">Jisc Research Blog.</a><span class="ecae-button ecae-buttonskin-none" style="text-align:left" > <a class="ecae-link" href="https://blog.core.ac.uk/2021/10/15/partnership-announcement-cypris-and-core/"><span>read more...</span></a></span></p></div><!-- End :: Generated by Easy Custom Auto Excerpt --> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2021/10/15/partnership-announcement-cypris-and-core/" rel="bookmark"><time class="entry-date published" datetime="2021-10-15T18:03:44+01:00">15th October 2021</time><time class="updated" datetime="2021-10-15T18:03:49+01:00">15th October 2021</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/admin/">CORE Admin</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/api/" rel="category tag">API</a>, <a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/newsletter/" rel="category tag">newsletter</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://blog.core.ac.uk/tag/core/" rel="tag">core</a>, <a href="https://blog.core.ac.uk/tag/core-integration-api/" rel="tag">core 
integration API</a>, <a href="https://blog.core.ac.uk/tag/coreapi/" rel="tag">coreAPI</a>, <a href="https://blog.core.ac.uk/tag/database/" rel="tag">database</a>, <a href="https://blog.core.ac.uk/tag/dataset/" rel="tag">dataset</a>, <a href="https://blog.core.ac.uk/tag/metadata/" rel="tag">metadata</a>, <a href="https://blog.core.ac.uk/tag/openacccess/" rel="tag">openacccess</a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-1239" class="post-1239 post type-post status-publish format-standard hentry category-core category-dataset category-integration tag-core tag-database tag-dataset tag-integration"> <header class="entry-header"> <h2 class="entry-title"><a href="https://blog.core.ac.uk/2021/04/09/flowcite-expands-its-knowledge-library-with-210-million-research-papers-from-core/" rel="bookmark">Flowcite Expands its Knowledge Library with 210 Million Research Papers from CORE</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <!-- Begin :: Generated by Easy Custom Auto Excerpt --><div class="ecae" style=""> <figure class="wp-block-image size-large"><a href="https://blog.core.ac.uk/wp-content/uploads/2021/04/23.png"><img decoding="async" width="868" height="321" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%20868%20321'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2021/04/23.png" alt="" class="wp-image-1240 lazy"/></a></figure> <p class="has-text-align-justify"><strong>Flowcite has teamed up with CORE, the world’s largest aggregator of open access research papers. The partnership will provide Flowcite users with free and unlimited access to millions of open access research papers from the CORE database.</strong></p> <p><em>“CORE is delighted to partner with Flowcite and progress our aligned goals to make open research content available to all. 
By connecting our innovative solutions we continue to evolve the way research is being completed and increase the discoverability and usage of all research outputs.”</em><strong> Dr Petr Knoth, CORE Founder.</strong><span class="ecae-button ecae-buttonskin-none" style="text-align:left" > <a class="ecae-link" href="https://blog.core.ac.uk/2021/04/09/flowcite-expands-its-knowledge-library-with-210-million-research-papers-from-core/"><span>read more...</span></a></span></p></div><!-- End :: Generated by Easy Custom Auto Excerpt --> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2021/04/09/flowcite-expands-its-knowledge-library-with-210-million-research-papers-from-core/" rel="bookmark"><time class="entry-date published" datetime="2021-04-09T10:25:27+01:00">9th April 2021</time><time class="updated" datetime="2021-04-09T10:25:31+01:00">9th April 2021</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/admin/">CORE Admin</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/integration/" rel="category tag">Integration</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://blog.core.ac.uk/tag/core/" rel="tag">core</a>, <a href="https://blog.core.ac.uk/tag/database/" rel="tag">database</a>, <a href="https://blog.core.ac.uk/tag/dataset/" rel="tag">dataset</a>, <a href="https://blog.core.ac.uk/tag/integration/" rel="tag">integration</a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-1001" class="post-1001 post type-post 
status-publish format-standard hentry category-aggregation category-core category-dataset category-growth category-harvesting tag-core tag-data tag-dataset tag-enrichment"> <header class="entry-header"> <h2 class="entry-title"><a href="https://blog.core.ac.uk/2020/02/25/core-raises-repository-data-quality-by-consolidating-information-from-external-datasets/" rel="bookmark">CORE raises repository data quality by consolidating information from external datasets</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <!-- Begin :: Generated by Easy Custom Auto Excerpt --><div class="ecae" style=""> <figure class="wp-block-image size-large"><img decoding="async" width="791" height="670" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%20791%20670'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2020/02/data-data-dat-ada.png" alt="" class="wp-image-1002 lazy"/></figure> <p> Read about our work on going beyond mirroring content from our data providers to improve data quality. In our latest <a href="https://scholarlycommunications.jiscinvolve.org/wp/2020/02/24/core-raises-repository-data-quality-by-consolidating-information-from-external-datasets/">blog post</a>, we present how we link <a href="https://core.ac.uk/data/">CORE data</a> to complementary scholarly sources and databases including <a href="https://www.crossref.org/">Crossref</a>, <a href="https://www.microsoft.com/en-us/research/project/microsoft-academic-graph/">MAG</a>, and <a href="https://orcid.org/">ORCID</a>. 
</p> </div><!-- End :: Generated by Easy Custom Auto Excerpt --> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2020/02/25/core-raises-repository-data-quality-by-consolidating-information-from-external-datasets/" rel="bookmark"><time class="entry-date published" datetime="2020-02-25T10:42:16+00:00">25th February 2020</time><time class="updated" datetime="2020-02-25T10:47:09+00:00">25th February 2020</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/admin/">CORE Admin</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/aggregation/" rel="category tag">aggregation</a>, <a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/growth/" rel="category tag">growth</a>, <a href="https://blog.core.ac.uk/category/harvesting/" rel="category tag">harvesting</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://blog.core.ac.uk/tag/core/" rel="tag">core</a>, <a href="https://blog.core.ac.uk/tag/data/" rel="tag">data</a>, <a href="https://blog.core.ac.uk/tag/dataset/" rel="tag">dataset</a>, <a href="https://blog.core.ac.uk/tag/enrichment/" rel="tag">enrichment</a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-646" class="post-646 post type-post status-publish format-standard hentry category-aggregation category-api category-core category-dataset category-growth category-harvesting category-recommender category-repositories tag-105 tag-statistics"> <header class="entry-header"> <h2 class="entry-title"><a 
href="https://blog.core.ac.uk/2018/12/18/core-becomes-the-worlds-largest-open-access-aggregator-or-how-about-them-stats-2018-edition/" rel="bookmark">CORE becomes the world’s largest open access aggregator (or how about them stats 2018 edition)</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p><!-- Begin :: Generated by Easy Custom Auto Excerpt --></p> <div class="ecae" style=""><p><span style="font-weight: 400;">This was another productive year for the CORE team; our content providers have increased, along with our metadata and full text records. This makes CORE the </span><a href="https://scholarlycommunications.jiscinvolve.org/wp/2018/06/01/core-becomes-the-worlds-largest-aggregator/"><span style="font-weight: 400;">world’s largest open access aggregator</span></a>. More specifically, over the last 3 months CORE had more than 25 million users, tripling our usage compared to 2017. According to <span class="ecae-button ecae-buttonskin-none" style="text-align:left" > <a class="ecae-link" href="https://blog.core.ac.uk/2018/12/18/core-becomes-the-worlds-largest-open-access-aggregator-or-how-about-them-stats-2018-edition/"><span>read more...</span></a></span></p> </div> <p><!-- End :: Generated by Easy Custom Auto Excerpt --></p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2018/12/18/core-becomes-the-worlds-largest-open-access-aggregator-or-how-about-them-stats-2018-edition/" rel="bookmark"><time class="entry-date published" datetime="2018-12-18T15:04:53+00:00">18th December 2018</time><time class="updated" datetime="2019-05-22T14:20:01+01:00">22nd May 2019</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/mcancellieri/">Matteo Cancellieri</a></span></span><span class="cat-links"><span 
class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/aggregation/" rel="category tag">aggregation</a>, <a href="https://blog.core.ac.uk/category/api/" rel="category tag">API</a>, <a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/growth/" rel="category tag">growth</a>, <a href="https://blog.core.ac.uk/category/harvesting/" rel="category tag">harvesting</a>, <a href="https://blog.core.ac.uk/category/recommender/" rel="category tag">recommender</a>, <a href="https://blog.core.ac.uk/category/repositories/" rel="category tag">repositories</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://blog.core.ac.uk/tag/2018/" rel="tag">2018</a>, <a href="https://blog.core.ac.uk/tag/statistics/" rel="tag">statistics</a></span><span class="comments-link"><a href="https://blog.core.ac.uk/2018/12/18/core-becomes-the-worlds-largest-open-access-aggregator-or-how-about-them-stats-2018-edition/#comments">1 Comment<span class="screen-reader-text"> on CORE becomes the world’s largest open access aggregator (or how about them stats 2018 edition)</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-630" class="post-630 post type-post status-publish format-standard hentry category-core category-dataset category-repositories tag-fast-sync tag-harvesting tag-open-access tag-repositories tag-resource-dumps"> <header class="entry-header"> <h2 class="entry-title"><a href="https://blog.core.ac.uk/2018/03/17/increasing-the-speed-of-harvesting-with-on-demand-resource-dumps/" rel="bookmark">Increasing the Speed of Harvesting with On Demand Resource Dumps</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p><!-- Begin :: Generated by Easy Custom Auto Excerpt --></p> <div class="ecae" style=""> <p>I am 
currently working with <a href="https://scholar.google.com/citations?user=nMRDlR8AAAAJ&hl=en">Martin Klein</a>, <a href="http://kmi.open.ac.uk/people/member/matteo-cancellieri">Matteo Cancellieri</a> and <a href="http://public.lanl.gov/herbertv/bio/">Herbert Van de Sompel</a> on a project funded by the <a href="https://eoscpilot.eu/">European Open Science Cloud Pilot</a> that aims to test and benchmark <a href="http://www.openarchives.org/rs/1.1/resourcesync">ResourceSync</a> against <a href="https://www.openarchives.org/OAI/openarchivesprotocol.html">OAI-PMH</a> in a range of scenarios. The objective is to perform a quantitative evaluation that could then be used as evidence to convince data providers to adopt ResourceSync. During this work, we have encountered a problem related to the scalability of ResourceSync and developed a solution to it in the form of an On Demand Resource Dump. The aim of this blog post is to explain the problem, how we arrived at the solution and how the solution works.</p> <div id="ez-toc-container" class="ez-toc-v2_0_46 counter-hierarchy ez-toc-counter ez-toc-grey ez-toc-container-direction"> <div class="ez-toc-title-container"> <p class="ez-toc-title">Highlights</p> <span class="ez-toc-title-toggle"></span></div> <nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class="ez-toc-link ez-toc-heading-1" href="https://blog.core.ac.uk/category/dataset/#The_problem" title="The problem">The problem</a></li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class="ez-toc-link ez-toc-heading-2" href="https://blog.core.ac.uk/category/dataset/#Can_Resource_Dumps_be_the_solution" title="Can Resource Dumps be the solution?">Can Resource Dumps be the solution?</a></li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class="ez-toc-link ez-toc-heading-3" href="https://blog.core.ac.uk/category/dataset/#On_Demand_Resource_Dumps" title="On Demand Resource Dumps">On Demand Resource Dumps</a><ul 
class='ez-toc-list-level-3'><li class='ez-toc-heading-level-3'><a class="ez-toc-link ez-toc-heading-4" href="https://blog.core.ac.uk/category/dataset/#Step_2_sending_a_POST_request_to_the_On_Demand_dump_endpoint" title="Step 2: sending a POST request to the On Demand dump endpoint">Step 2: sending a POST request to the On Demand dump endpoint</a></li></ul></li></ul></nav></div> <h2><span class="ez-toc-section" id="The_problem"></span>The problem<span class="ez-toc-section-end"></span></h2> <p>One of the scenarios we have been exploring deals with a situation where the resources to be synchronised are metadata files of a small data size (typically from a few bytes to several kilobytes). Coincidentally, this scenario is very common for metadata in repositories of academic manuscripts, research data (e.g. descriptions of images), cultural heritage, etc.</p> <p>The problem is related to the issue that while most OAI-PMH implementations typically deliver 100-1000 responses per one HTTP request, ResourceSync is designed in a way that requires resolving each resource individually. We have identified and confirmed by testing that for repositories with large numbers of metadata items, this can have a very significant impact on the performance of harvesting, as the overhead of the HTTP request is considerable compared to the size of the metadata record.</p> <p>More specifically, we have run tests over a sample of 357 repositories. The results of these tests show that while the speed of OAI-PMH harvesting ranges from 30-520 metadata records per second, depending largely on the repository platform, the speed of harvesting by ResourceSync is somewhere in the range of only 4 metadata records per second for harvesting the same content using existing ResourceSync client/server implementations and sequential downloading strategy. 
We are preparing a paper on this, so I am not going to disclose the exact details of the analysis at this stage.</p> <p>As ResourceSync has been created to overcome many of the problems of OAI-PMH, such as:</p> <ul> <li>being too flexible in terms of support for incremental harvesting, resulting in inconsistent implementations of this feature across data providers,</li> <li>some of its implementations being unstable and less suitable for exchanging large quantities of metadata and</li> <li>being only designed for metadata transfer, omitting the much needed support for content exchange</li> </ul> <p>it is important that ResourceSync performs well under all common scenarios, including the one we are dealing with.</p> <h2><span class="ez-toc-section" id="Can_Resource_Dumps_be_the_solution"></span>Can Resource Dumps be the solution?<span class="ez-toc-section-end"></span></h2> <p>An obvious option for solving the problem that is already offered by ResourceSync is the Resource Dump. While a Resource Dump can speed up harvesting to levels far exceeding those of OAI-PMH, it creates some considerable extra complexity on the side of the server. The key problem is that it creates the necessity to periodically package the data as a Resource Dump, which basically means running a batch process to produce a compressed (zip) file containing the resources.</p> <p>The number of Resource Dumps a source needs to maintain is equal to the number of Capability Lists it maintains times the size of the Resource Dump Index. The minimum practical operational size of a Resource Dump Index is 2. This is to ensure we don’t remove a dump currently being downloaded by a client during the creation of a new dump. 
As we have observed that a typical repository may contain about 250 OAI-PMH sets (Capability Lists in the ResourceSync terminology), this implies the need for significant data duplication and for the periodic creation of Resource Dumps if a source chooses to use Resource Dumps as part of the harvesting process.</p> <h2><span class="ez-toc-section" id="On_Demand_Resource_Dumps"></span>On Demand Resource Dumps<span class="ez-toc-section-end"></span></h2> <p>To deal with the problem, we suggest an extension of ResourceSync that will support the concept of an On Demand Resource Dump. An On Demand Resource Dump is a Resource Dump which is created, as the name suggests, whenever a client asks for it. More specifically, a client can scan through the list of resources presented in a Resource List or a Change List (without resolving them individually) and ask the source to package any set of the resources as a Resource Dump. This approach speeds up harvesting and saves processing on the side of both the source and the client. Our initial tests show that this enables ResourceSync to perform as well as OAI-PMH in the metadata-only harvesting scenario when requests are sent sequentially (the most extreme scenario for ResourceSync). However, as ResourceSync requests can be parallelised, as opposed to OAI-PMH (due to the reliance of OAI-PMH on the resumption token), this makes ResourceSync a clear winner.</p> <p>In the rest of this post, I will explain how this works and how it could be integrated with the ResourceSync specification.</p> <p class="p1"><span class="s1">There are basically 3 steps: </span></p> <ol> <li class="p1"><span class="s1">defining that the server supports an on-demand Resource Dump,</span></li> <li class="p1"><span class="s1">sending a POST request to the on-demand dump endpoint and</span></li> <li class="p1"><span class="s1">receiving a response from the server that 100% conforms to the Resource Dump specification.
</span></li> </ol> <p><span class="s1">I will first introduce steps 2 and 3 and then I will come back to step 1.</span></p> <h3 class="p1"><span class="ez-toc-section" id="Step_2_sending_a_POST_request_to_the_On_Demand_dump_endpoint"></span><span class="s1"><b>Step 2: sending a POST request to the On Demand dump endpoint</b></span><span class="ez-toc-section-end"></span></h3> <p class="p1"><span class="s1">We have defined an endpoint at <a href="https://core.ac.uk/datadump"><span class="s2">https://core.ac.uk/datadump</span></a>. You can POST it a list of resource identifiers (which can be discovered in a Resource List). In the example below, I am using curl to send it a list of resource identifiers in JSON which I want to get resolved. Obviously, the approach is not limited to JSON; it can be used for any resource listed in a Resource List regardless of its type. Try it by executing the code below in your terminal.</span></p> <p><span class="s3"><code>curl -d '["https://core.ac.uk/api-v2/articles/get/42138752","https://core.ac.uk/api-v2/articles/get/32050"]' -H "Content-Type: application/json" <a href="https://core.ac.uk/datadump"><span class="s2">https://core.ac.uk/datadump</span></a> -X POST &gt; on-demand-resource-dump.zip</code></span><span class="ecae-button ecae-buttonskin-none" style="text-align:left" > <a class="ecae-link" href="https://blog.core.ac.uk/2018/03/17/increasing-the-speed-of-harvesting-with-on-demand-resource-dumps/"><span>read more...</span></a></span></p> </div> <p><!-- End :: Generated by Easy Custom Auto Excerpt --></p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2018/03/17/increasing-the-speed-of-harvesting-with-on-demand-resource-dumps/" rel="bookmark"><time class="entry-date published"
datetime="2018-03-17T10:24:16+00:00">17th March 2018</time><time class="updated" datetime="2018-12-17T17:50:58+00:00">17th December 2018</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/petrknoth/">Petr Knoth</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/repositories/" rel="category tag">repositories</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://blog.core.ac.uk/tag/fast-sync/" rel="tag">fast sync</a>, <a href="https://blog.core.ac.uk/tag/harvesting/" rel="tag">harvesting</a>, <a href="https://blog.core.ac.uk/tag/open-access/" rel="tag">open access</a>, <a href="https://blog.core.ac.uk/tag/repositories/" rel="tag">repositories</a>, <a href="https://blog.core.ac.uk/tag/resource-dumps/" rel="tag">resource dumps</a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-602" class="post-602 post type-post status-publish format-standard hentry category-aggregation category-api category-core category-dataset category-growth category-harvesting category-recommender category-repositories tag-102 tag-statistics"> <header class="entry-header"> <h2 class="entry-title"><a href="https://blog.core.ac.uk/2017/12/21/cores-open-access-content-has-reached-the-moon-or-how-about-them-stats-2017-edition/" rel="bookmark">CORE’s Open Access content has reached the Moon! 
(or how about them stats 2017 edition)</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p><!-- Begin :: Generated by Easy Custom Auto Excerpt --></p> <div class="ecae" style="">For yet another year (see previous years <a href="https://blog.core.ac.uk/2016/12/19/cores-open-access-and-text-mining-services-2016-growth-or-how-about-them-stats-2016-edition/">2016</a>, <a href="https://blog.core.ac.uk/2015/12/14/how-about-them-stats/">2015</a>) CORE has been really productive; the number of our content providers has increased and we have now more open access full text and metadata records than ever.</p> <p><a href="https://blog.core.ac.uk/wp-content/uploads/2017/12/Untitled-1-03-2.png"><img decoding="async" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%204267%202134'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2017/12/Untitled-1-03-2.png" alt="" width="4267" height="2134" class="alignnone size-full wp-image-625 lazy" /></a></p> <p>Our <a href="https://core.ac.uk/services">services</a> are also growing steadily and we would like to thank the community for using the CORE <a href="https://core.ac.uk/services#api">API</a> and CORE <a href="https://core.ac.uk/services#dataset">Datasets</a>.</p> <p><a href="https://blog.core.ac.uk/wp-content/uploads/2017/12/Untitled-1-05-1.png"><img decoding="async" class="alignnone size-full wp-image-616 lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%204267%202134'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2017/12/Untitled-1-05-1.png" alt="" width="4267" height="2134" /></a></p> <p>We also offer other services, such as the CORE <a href="https://core.ac.uk/services#dashboard">Repositories Dashboard</a>, CORE <a href="https://core.ac.uk/services#connector">Publisher Connector</a> and the <a href="https://core.ac.uk/services#recommender">CORE Recommender</a>. 
We received <a href="https://blog.core.ac.uk/2017/10/31/implementing-the-core-recommender-in-strathprints-a-whitehat-improvement-to-promote-user-interaction/">great feedback</a> with regards to the CORE Recommender, with George Macgregor, Institutional Repository Manager at Strathclyde University, reporting:</p> <p><a href="https://blog.core.ac.uk/wp-content/uploads/2017/12/Untitled-1-04-2.png"><img decoding="async" class="alignnone size-full wp-image-622 lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%204267%202134'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2017/12/Untitled-1-04-2.png" alt="" width="4267" height="2134" /></a></p> <p>We are thrilled that this year CORE made it to the moon. Our next destination is Venus.</p> <p><a href="https://blog.core.ac.uk/wp-content/uploads/2017/12/Untitled-1-02.png"><img decoding="async" class="alignnone size-large wp-image-604 lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%20660%20330'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2017/12/Untitled-1-02.png" alt="" width="660" height="330" /></a></p> <p>The CORE Team wishes you Merry Christmas and a Prosperous New Year!</p> <p><a href="https://blog.core.ac.uk/wp-content/uploads/2017/12/coreteam.png"><img decoding="async" class="alignnone size-full wp-image-603 lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%202563%201523'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2017/12/coreteam.png" alt="" width="2563" height="1523" /></a></p> <p>* Note: Special thanks to Matteo Cancellieri for creating the graphics in this blog post.</p></div> <p><!-- End :: Generated by Easy Custom Auto Excerpt --></p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a 
href="https://blog.core.ac.uk/2017/12/21/cores-open-access-content-has-reached-the-moon-or-how-about-them-stats-2017-edition/" rel="bookmark"><time class="entry-date published" datetime="2017-12-21T14:50:04+00:00">21st December 2017</time><time class="updated" datetime="2017-12-21T15:02:28+00:00">21st December 2017</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/mcancellieri/">Matteo Cancellieri</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/aggregation/" rel="category tag">aggregation</a>, <a href="https://blog.core.ac.uk/category/api/" rel="category tag">API</a>, <a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/growth/" rel="category tag">growth</a>, <a href="https://blog.core.ac.uk/category/harvesting/" rel="category tag">harvesting</a>, <a href="https://blog.core.ac.uk/category/recommender/" rel="category tag">recommender</a>, <a href="https://blog.core.ac.uk/category/repositories/" rel="category tag">repositories</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://blog.core.ac.uk/tag/2017/" rel="tag">2017</a>, <a href="https://blog.core.ac.uk/tag/statistics/" rel="tag">statistics</a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-490" class="post-490 post type-post status-publish format-standard hentry category-aggregation category-core category-dataset category-growth category-harvesting category-repositories tag-full-text tag-metadata tag-statistics tag-tdm"> <header class="entry-header"> <h2 class="entry-title"><a 
href="https://blog.core.ac.uk/2017/02/03/core-now-offers-5-millions-of-open-access-full-text-research-papers/" rel="bookmark">CORE now offers 5 millions of open access full-text research papers</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p><!-- Begin :: Generated by Easy Custom Auto Excerpt --></p> <div class="ecae" style="">CORE is thrilled to announce that it currently provides 5 millions of open access full-text papers.</p> <figure id="attachment_491" aria-describedby="caption-attachment-491" style="width: 975px" class="wp-caption aligncenter"><a href="https://blog.core.ac.uk/wp-content/uploads/2017/02/Picture1.png"><img decoding="async" class="wp-image-491 size-full lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%20975%20506'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2017/02/Picture1.png" width="975" height="506" /></a><figcaption id="caption-attachment-491" class="wp-caption-text">CORE’s data providers from around the world</figcaption></figure> <p><span style="font-weight: 400;">“</span><i><span style="font-weight: 400;">In the last year, we have managed to scale up our harvesting process. This enabled us to significantly increase the amount of open access content we can offer to our users. With more and more open access content being made available by data providers, thanks to recent open access policies, CORE now also captures and provides access to a higher percentage of global research literature </span></i><span style="font-weight: 400;">”, says CORE’s founder, Dr Petr Knoth. </span></p> <p>With 66 million metadata records and 5 million full-text, from 102 countries, in 52 different languages, CORE becomes now the world’s largest full-text open access aggregator. 
CORE embraces the vibrant collections of both institutional and disciplinary repositories, while its large volume of scholarly outputs ranges from scientific research papers to grey literature, and from Master’s to Doctoral theses. In addition, it is a metasearch for all the open access peer-reviewed scientific journal articles published in open access journals. <span class="ecae-button ecae-buttonskin-none" style="text-align:left" > <a class="ecae-link" href="https://blog.core.ac.uk/2017/02/03/core-now-offers-5-millions-of-open-access-full-text-research-papers/"><span>read more...</span></a></span></p> </div> <p><!-- End :: Generated by Easy Custom Auto Excerpt --></p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2017/02/03/core-now-offers-5-millions-of-open-access-full-text-research-papers/" rel="bookmark"><time class="entry-date published" datetime="2017-02-03T10:15:03+00:00">3rd February 2017</time><time class="updated" datetime="2017-05-16T11:39:09+01:00">16th May 2017</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/admin/">CORE Admin</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/aggregation/" rel="category tag">aggregation</a>, <a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/growth/" rel="category tag">growth</a>, <a href="https://blog.core.ac.uk/category/harvesting/" rel="category tag">harvesting</a>, <a href="https://blog.core.ac.uk/category/repositories/" rel="category tag">repositories</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a
href="https://blog.core.ac.uk/tag/full-text/" rel="tag">full-text</a>, <a href="https://blog.core.ac.uk/tag/metadata/" rel="tag">metadata</a>, <a href="https://blog.core.ac.uk/tag/statistics/" rel="tag">statistics</a>, <a href="https://blog.core.ac.uk/tag/tdm/" rel="tag">tdm</a></span><span class="comments-link"><a href="https://blog.core.ac.uk/2017/02/03/core-now-offers-5-millions-of-open-access-full-text-research-papers/#comments">1 Comment<span class="screen-reader-text"> on CORE now offers 5 millions of open access full-text research papers</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <article id="post-457" class="post-457 post type-post status-publish format-standard hentry category-aggregation category-core category-dataset category-growth category-harvesting category-recommender category-repositories tag-open-access tag-statistics tag-text-mining"> <header class="entry-header"> <h2 class="entry-title"><a href="https://blog.core.ac.uk/2016/12/19/cores-open-access-and-text-mining-services-2016-growth-or-how-about-them-stats-2016-edition/" rel="bookmark">CORE’s open access and text mining services – 2016 growth (or, how about them stats – 2016 edition)</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p><!-- Begin :: Generated by Easy Custom Auto Excerpt --></p> <div class="ecae" style="">The past year has been productive for the CORE team; the number of harvested repositories and our open access content, both in metadata and full-text, has massively increased. 
(You can see last year’s blog post with our 2015 achievements in numbers <a href="https://blog.core.ac.uk/2015/12/">here</a>.)</p> <p><a href="https://blog.core.ac.uk/wp-content/uploads/2016/12/Asset-4.png"><img decoding="async" class="alignnone wp-image-476 size-full lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%20887%20445'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2016/12/Asset-4.png" width="887" height="445" /></a></p> <p>There was also progress with regards to our <a href="https://core.ac.uk/services">services</a>; the number of our API users was almost doubled in 2016, we have now about 200 registered CORE Dashboard users, and this past October we released a new version of our recommender and updated our dataset.</p> <p><a href="https://blog.core.ac.uk/wp-content/uploads/2016/12/Asset-2-1.png"><img decoding="async" class="alignnone wp-image-478 size-full lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%20887%20444'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2016/12/Asset-2-1.png" width="887" height="444" /></a></p> <p>Around this time of the year, the joyful Christmas spirit of the CORE team increases along with our numbers. Thus, we decided to recalculate how far are the CORE research outputs – if we had printed them – from reaching the moon (last year we made it to 1/3 of the way).</p> <p><a href="https://blog.core.ac.uk/wp-content/uploads/2016/12/Asset-1-1.png"><img decoding="async" class="alignnone wp-image-479 size-full lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%20887%20445'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2016/12/Asset-1-1.png" width="887" height="445" /></a></p> <p>We are thrilled to see that this year we got CORE even closer to the moon! 
We would also like to thank all our <a href="https://core.ac.uk/dataproviders">data providers</a>, who have helped us reach this goal.</p> <p>Fear not: we will never print all our research outputs; we believe that their mission is to be discoverable on the web as open access. Plus we love trees. <a href="https://blog.core.ac.uk/wp-content/uploads/2016/12/500px-Xmas_tree_animated.gif"><img decoding="async" class="wp-image-462 aligncenter lazy" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%2057%2057'%3E%3C/svg%3E" data-src="https://blog.core.ac.uk/wp-content/uploads/2016/12/500px-Xmas_tree_animated.gif" alt="" width="57" height="57" /></a></p> <p>Merry Christmas from the CORE Team!</p> <p>* Note: Special thanks to Matteo Cancellieri for creating the CORE graphics.</p> <p> </p></div> <p><!-- End :: Generated by Easy Custom Auto Excerpt --></p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://blog.core.ac.uk/2016/12/19/cores-open-access-and-text-mining-services-2016-growth-or-how-about-them-stats-2016-edition/" rel="bookmark"><time class="entry-date published" datetime="2016-12-19T12:36:12+00:00">19th December 2016</time><time class="updated" datetime="2017-05-16T11:39:57+01:00">16th May 2017</time></a></span><span class="byline"><span class="author vcard"><span class="screen-reader-text">Author </span><a class="url fn n" href="https://blog.core.ac.uk/author/nancypontika/">nancypontika</a></span></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://blog.core.ac.uk/category/aggregation/" rel="category tag">aggregation</a>, <a href="https://blog.core.ac.uk/category/core/" rel="category tag">CORE</a>, <a href="https://blog.core.ac.uk/category/dataset/" rel="category tag">dataset</a>, <a href="https://blog.core.ac.uk/category/growth/" rel="category tag">growth</a>, <a
href="https://blog.core.ac.uk/category/harvesting/" rel="category tag">harvesting</a>, <a href="https://blog.core.ac.uk/category/recommender/" rel="category tag">recommender</a>, <a href="https://blog.core.ac.uk/category/repositories/" rel="category tag">repositories</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://blog.core.ac.uk/tag/open-access/" rel="tag">open access</a>, <a href="https://blog.core.ac.uk/tag/statistics/" rel="tag">statistics</a>, <a href="https://blog.core.ac.uk/tag/text-mining/" rel="tag">text mining</a></span> </footer><!-- .entry-footer --> </article><!-- #post-## --> <nav class="navigation pagination" aria-label="Posts pagination"> <h2 class="screen-reader-text">Posts pagination</h2> <div class="nav-links"><span aria-current="page" class="page-numbers current"><span class="meta-nav screen-reader-text">Page </span>1</span> <a class="page-numbers" href="https://blog.core.ac.uk/category/dataset/page/2/"><span class="meta-nav screen-reader-text">Page </span>2</a> <a class="next page-numbers" href="https://blog.core.ac.uk/category/dataset/page/2/">Next page</a></div> </nav> </main><!-- .site-main --> </section><!-- .content-area --> </div><!-- .site-content --> <footer id="colophon" class="site-footer" role="contentinfo"> <div class="site-info"> <div class="license"> <p> <a rel="license" href="//creativecommons.org/licenses/by/4.0/" title="Creative Commons Attribution 4.0 International license"><img class="lazy" style="float:right;" src="data:image/svg+xml,%3Csvg%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%201%201'%3E%3C/svg%3E" data-src="//i.creativecommons.org/l/by/4.0/88x31.png" alt="License"></a> </p> <div style="display: inline;" xmlns:cc="http://creativecommons.org/ns#" about="http://creativecommons.org"> <p> <small> Except where otherwise noted, content on <span href="http://blog.core.ac.uk" property="cc:attributionName" rel="cc:attributionURL">this site</span> is licensed under a 
<a rel="license" href="//creativecommons.org/licenses/by/4.0/" class="subfoot"> Creative Commons Attribution 4.0 International license </a>. </small> </p> </div> </div> <a href="https://wordpress.org/">Proudly powered by WordPress</a> </div><!-- .site-info --> </footer><!-- .site-footer --> </div><!-- .site --> <script type='text/javascript'> /* <![CDATA[ */ r3f5x9JS=escape(document['referrer']); hf4N='b4ef26e8e995023596143e5b0f9e7a52'; hf4V='04dd9b696411828059b3f665e7ea6206'; jQuery(document).ready(function($){var e="#commentform, .comment-respond form, .comment-form, #lostpasswordform, #registerform, #loginform, #login_form, #wpss_contact_form";$(e).submit(function(){$("<input>").attr("type","hidden").attr("name","r3f5x9JS").attr("value",r3f5x9JS).appendTo(e);return true;});var h="form[method='post']";$(h).submit(function(){$("<input>").attr("type","hidden").attr("name",hf4N).attr("value",hf4V).appendTo(h);return true;});}); /* ]]> */ </script> <script async src="https://blog.core.ac.uk/wp-content/cache/minify/95d78.js"></script> <script type="text/javascript" id="twentyfifteen-script-js-extra"> /* <![CDATA[ */ var screenReaderText = {"expand":"<span class=\"screen-reader-text\">expand child menu<\/span>","collapse":"<span class=\"screen-reader-text\">collapse child menu<\/span>"}; /* ]]> */ </script> <script async src="https://blog.core.ac.uk/wp-content/cache/minify/3fe04.js"></script> <script type="text/javascript" id="ez-toc-js-js-extra"> /* <![CDATA[ */ var ezTOC = {"smooth_scroll":"1","scroll_offset":"30"}; /* ]]> */ </script> <script async src="https://blog.core.ac.uk/wp-content/cache/minify/0c713.js"></script> <script src='https://stats.wp.com/e-202447.js' defer></script> <script> _stq = window._stq || []; _stq.push([ 'view', {v:'ext',blog:'160721468',post:'0',tz:'0',srv:'blog.core.ac.uk',j:'1:11.9.3'} ]); _stq.push([ 'clickTrackerInit', '160721468', '0' ]); </script> 
<script>window.w3tc_lazyload=1,window.lazyLoadOptions={elements_selector:".lazy",callback_loaded:function(t){var e;try{e=new CustomEvent("w3tc_lazyload_loaded",{detail:{e:t}})}catch(a){(e=document.createEvent("CustomEvent")).initCustomEvent("w3tc_lazyload_loaded",!1,!1,{e:t})}window.dispatchEvent(e)}}</script><script async src="https://blog.core.ac.uk/wp-content/cache/minify/1615d.js"></script> </body> </html> <!-- Performance optimized by W3 Total Cache. Learn more: https://www.boldgrid.com/w3-total-cache/ Object Caching 91/412 objects using memcached Page Caching using apc (SSL caching disabled) Lazy Loading Minified using disk Database Caching 3/28 queries in 0.018 seconds using memcached Served from: blog.core.ac.uk @ 2024-11-24 06:36:35 by W3 Total Cache -->