CINXE.COM

wikidata – Andrew Gray

<!DOCTYPE html> <html lang="en-GB" class="no-js"> <head> <meta charset="UTF-8"> <meta name="viewport" content="width=device-width"> <link rel="profile" href="https://gmpg.org/xfn/11"> <link rel="pingback" href="https://www.generalist.org.uk/blog/xmlrpc.php"> <!-- html5.js is requested only by IE older than 9, via the conditional comment that follows. --> <!--[if lt IE 9]> <script src="https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/js/html5.js?ver=3.7.0"></script> <![endif]--> <!-- Replaces the "no-js" class on the root element with "js" as soon as scripting runs. --> <script>(function(html){html.className = html.className.replace(/\bno-js\b/,'js')})(document.documentElement);</script> <title>wikidata &#8211; Andrew Gray</title> <!-- Inline GeSHi colour rules for bash code samples; every selector is scoped under .bash. --> <style type="text/css"> /** * GeSHi Dynamically Generated Stylesheet * -------------------------------------- * Dynamically generated stylesheet for bash * CSS class: , CSS id: * GeSHi (C) 2004 - 2007 Nigel McNie, 2007 - 2014 Benny Baumann * (http://qbnz.com/highlighter/ and http://geshi.org/) * -------------------------------------- */ .bash .de1, .bash .de2 {} .bash {font-family:monospace;} .bash .imp {font-weight: bold; color: red;} .bash li, .bash .li1 {font-weight: normal; vertical-align:top;} .bash .ln {width:1px;text-align:right;margin:0;padding:0 2px;vertical-align:top;} .bash .li2 {font-weight: bold; vertical-align:top;} .bash .kw1 {color: #000000; font-weight: bold;} .bash .kw2 {color: #c20cb9; font-weight: bold;} .bash .kw3 {color: #7a0874; font-weight: bold;} .bash .co0 {color: #666666; font-style: italic;} .bash .co1 {color: #800000;} .bash .co2 {color: #cc0000; font-style: italic;} .bash .co3 {color: #000000; font-weight: bold;} .bash .co4 {color: #666666;} .bash .es1 {color: #000099; font-weight: bold;} .bash .es2 {color: #007800;} .bash .es3 {color: #007800;} .bash .es4 {color: #007800;} .bash .es5 {color: #780078;} .bash .es_h {color: #000099; font-weight: bold;} .bash .br0 {color: #7a0874; font-weight: bold;} .bash .sy0 {color: #000000; font-weight: bold;} .bash .st0 {color: #ff0000;} .bash .st_h {color: #ff0000;} .bash .nu0 {color: #000000;} .bash .re0 {color: #007800;} .bash .re1 {color: 
#007800;} .bash .re2 {color: #007800;} .bash .re4 {color: #007800;} .bash .re5 {color: #660033;} .bash .ln-xtra, .bash li.ln-xtra, .bash div.ln-xtra {background-color: #ffc;} .bash span.xtra { display:block; } </style> <meta name='robots' content='max-image-preview:large' /> <!-- RSS feeds: whole site, comments, and this tag archive. --> <link rel="alternate" type="application/rss+xml" title="Andrew Gray &raquo; Feed" href="https://www.generalist.org.uk/blog/feed/" /> <link rel="alternate" type="application/rss+xml" title="Andrew Gray &raquo; Comments Feed" href="https://www.generalist.org.uk/blog/comments/feed/" /> <link rel="alternate" type="application/rss+xml" title="Andrew Gray &raquo; wikidata Tag Feed" href="https://www.generalist.org.uk/blog/tags/wikidata/feed/" /> <!-- Emoji settings object handed to the loader function in this same script; the loader reads source.concatemoji, the other keys are presumably consumed by the emoji script it loads (not visible here). --> <script> window._wpemojiSettings = {"baseUrl":"https:\/\/s.w.org\/images\/core\/emoji\/14.0.0\/72x72\/","ext":".png","svgUrl":"https:\/\/s.w.org\/images\/core\/emoji\/14.0.0\/svg\/","svgExt":".svg","source":{"concatemoji":"https:\/\/www.generalist.org.uk\/blog\/wp-includes\/js\/wp-emoji-release.min.js?ver=6.4.5"}}; /*! 
This file is auto-generated */ /* Emoji support probe. Renders flag and emoji sequences on a canvas (inside a Worker with OffscreenCanvas when those APIs exist) and treats a sequence as supported when it draws differently from the same code points split by a zero-width space. Results are cached in sessionStorage under "wpEmojiSettingsSupports"; after DOMContentLoaded the concatemoji script (or twemoji + wpemoji) is loaded when anything is unsupported. The cache is honoured for 604800000 ms (one week) because the stored timestamp comes from Date#valueOf, which is in milliseconds. */ !function(i,n){var o,s,e;function c(e){try{var t={supportTests:e,timestamp:(new Date).valueOf()};sessionStorage.setItem(o,JSON.stringify(t))}catch(e){}}function p(e,t,n){e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(t,0,0);var t=new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data),r=(e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(n,0,0),new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data));return t.every(function(e,t){return e===r[t]})}function u(e,t,n){switch(t){case"flag":return n(e,"\ud83c\udff3\ufe0f\u200d\u26a7\ufe0f","\ud83c\udff3\ufe0f\u200b\u26a7\ufe0f")?!1:!n(e,"\ud83c\uddfa\ud83c\uddf3","\ud83c\uddfa\u200b\ud83c\uddf3")&&!n(e,"\ud83c\udff4\udb40\udc67\udb40\udc62\udb40\udc65\udb40\udc6e\udb40\udc67\udb40\udc7f","\ud83c\udff4\u200b\udb40\udc67\u200b\udb40\udc62\u200b\udb40\udc65\u200b\udb40\udc6e\u200b\udb40\udc67\u200b\udb40\udc7f");case"emoji":return!n(e,"\ud83e\udef1\ud83c\udffb\u200d\ud83e\udef2\ud83c\udfff","\ud83e\udef1\ud83c\udffb\u200b\ud83e\udef2\ud83c\udfff")}return!1}function f(e,t,n){var r="undefined"!=typeof WorkerGlobalScope&&self instanceof WorkerGlobalScope?new OffscreenCanvas(300,150):i.createElement("canvas"),a=r.getContext("2d",{willReadFrequently:!0}),o=(a.textBaseline="top",a.font="600 32px Arial",{});return e.forEach(function(e){o[e]=t(a,e,n)}),o}function t(e){var t=i.createElement("script");t.src=e,t.defer=!0,i.head.appendChild(t)}"undefined"!=typeof Promise&&(o="wpEmojiSettingsSupports",s=["flag","emoji"],n.supports={everything:!0,everythingExceptFlag:!0},e=new Promise(function(e){i.addEventListener("DOMContentLoaded",e,{once:!0})}),new Promise(function(t){var n=function(){try{var e=JSON.parse(sessionStorage.getItem(o));if("object"==typeof e&&"number"==typeof e.timestamp&&(new Date).valueOf()<e.timestamp+604800000&&"object"==typeof e.supportTests)return e.supportTests}catch(e){}return null}();if(!n){if("undefined"!=typeof 
Worker&&"undefined"!=typeof OffscreenCanvas&&"undefined"!=typeof URL&&URL.createObjectURL&&"undefined"!=typeof Blob)try{var e="postMessage("+f.toString()+"("+[JSON.stringify(s),u.toString(),p.toString()].join(",")+"));",r=new Blob([e],{type:"text/javascript"}),a=new Worker(URL.createObjectURL(r),{name:"wpTestEmojiSupports"});return void(a.onmessage=function(e){c(n=e.data),a.terminate(),t(n)})}catch(e){}c(n=f(s,u,p))}t(n)}).then(function(e){for(var t in e)n.supports[t]=e[t],n.supports.everything=n.supports.everything&&n.supports[t],"flag"!==t&&(n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&n.supports[t]);n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&!n.supports.flag,n.DOMReady=!1,n.readyCallback=function(){n.DOMReady=!0}}).then(function(){return e}).then(function(){var e;n.supports.everything||(n.readyCallback(),(e=n.source||{}).concatemoji?t(e.concatemoji):e.wpemoji&&e.twemoji&&(t(e.twemoji),t(e.wpemoji)))}))}((window,document),window._wpemojiSettings); </script> <style id='wp-emoji-styles-inline-css'> img.wp-smiley, img.emoji { display: inline !important; border: none !important; box-shadow: none !important; height: 1em !important; width: 1em !important; margin: 0 0.07em !important; vertical-align: -0.1em !important; background: none !important; padding: 0 !important; } </style> <link rel='stylesheet' id='wp-block-library-css' href='https://www.generalist.org.uk/blog/wp-includes/css/dist/block-library/style.min.css?ver=6.4.5' media='all' /> <style id='wp-block-library-theme-inline-css'> .wp-block-audio figcaption{color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-audio figcaption{color:hsla(0,0%,100%,.65)}.wp-block-audio{margin:0 0 1em}.wp-block-code{border:1px solid #ccc;border-radius:4px;font-family:Menlo,Consolas,monaco,monospace;padding:.8em 1em}.wp-block-embed figcaption{color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-embed 
figcaption{color:hsla(0,0%,100%,.65)}.wp-block-embed{margin:0 0 1em}.blocks-gallery-caption{color:#555;font-size:13px;text-align:center}.is-dark-theme .blocks-gallery-caption{color:hsla(0,0%,100%,.65)}.wp-block-image figcaption{color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-image figcaption{color:hsla(0,0%,100%,.65)}.wp-block-image{margin:0 0 1em}.wp-block-pullquote{border-bottom:4px solid;border-top:4px solid;color:currentColor;margin-bottom:1.75em}.wp-block-pullquote cite,.wp-block-pullquote footer,.wp-block-pullquote__citation{color:currentColor;font-size:.8125em;font-style:normal;text-transform:uppercase}.wp-block-quote{border-left:.25em solid;margin:0 0 1.75em;padding-left:1em}.wp-block-quote cite,.wp-block-quote footer{color:currentColor;font-size:.8125em;font-style:normal;position:relative}.wp-block-quote.has-text-align-right{border-left:none;border-right:.25em solid;padding-left:0;padding-right:1em}.wp-block-quote.has-text-align-center{border:none;padding-left:0}.wp-block-quote.is-large,.wp-block-quote.is-style-large,.wp-block-quote.is-style-plain{border:none}.wp-block-search .wp-block-search__label{font-weight:700}.wp-block-search__button{border:1px solid #ccc;padding:.375em .625em}:where(.wp-block-group.has-background){padding:1.25em 2.375em}.wp-block-separator.has-css-opacity{opacity:.4}.wp-block-separator{border:none;border-bottom:2px solid;margin-left:auto;margin-right:auto}.wp-block-separator.has-alpha-channel-opacity{opacity:1}.wp-block-separator:not(.is-style-wide):not(.is-style-dots){width:100px}.wp-block-separator.has-background:not(.is-style-dots){border-bottom:none;height:1px}.wp-block-separator.has-background:not(.is-style-wide):not(.is-style-dots){height:2px}.wp-block-table{margin:0 0 1em}.wp-block-table td,.wp-block-table th{word-break:normal}.wp-block-table figcaption{color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-table figcaption{color:hsla(0,0%,100%,.65)}.wp-block-video 
figcaption{color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-video figcaption{color:hsla(0,0%,100%,.65)}.wp-block-video{margin:0 0 1em}.wp-block-template-part.has-background{margin-bottom:0;margin-top:0;padding:1.25em 2.375em} </style> <style id='classic-theme-styles-inline-css'> /*! This file is auto-generated */ .wp-block-button__link{color:#fff;background-color:#32373c;border-radius:9999px;box-shadow:none;text-decoration:none;padding:calc(.667em + 2px) calc(1.333em + 2px);font-size:1.125em}.wp-block-file__button{background:#32373c;color:#fff;text-decoration:none} </style> <style id='global-styles-inline-css'> /* Declares the --wp--preset--* custom properties on body (colours, gradients, font sizes, spacing, shadows), then layout helpers (.is-layout-*) and the .has-* utility classes that apply those presets with !important. */ body{--wp--preset--color--black: #000000;--wp--preset--color--cyan-bluish-gray: #abb8c3;--wp--preset--color--white: #fff;--wp--preset--color--pale-pink: #f78da7;--wp--preset--color--vivid-red: #cf2e2e;--wp--preset--color--luminous-vivid-orange: #ff6900;--wp--preset--color--luminous-vivid-amber: #fcb900;--wp--preset--color--light-green-cyan: #7bdcb5;--wp--preset--color--vivid-green-cyan: #00d084;--wp--preset--color--pale-cyan-blue: #8ed1fc;--wp--preset--color--vivid-cyan-blue: #0693e3;--wp--preset--color--vivid-purple: #9b51e0;--wp--preset--color--dark-gray: #111;--wp--preset--color--light-gray: #f1f1f1;--wp--preset--color--yellow: #f4ca16;--wp--preset--color--dark-brown: #352712;--wp--preset--color--medium-pink: #e53b51;--wp--preset--color--light-pink: #ffe5d1;--wp--preset--color--dark-purple: #2e2256;--wp--preset--color--purple: #674970;--wp--preset--color--blue-gray: #22313f;--wp--preset--color--bright-blue: #55c3dc;--wp--preset--color--light-blue: #e9f2f9;--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple: linear-gradient(135deg,rgba(6,147,227,1) 0%,rgb(155,81,224) 100%);--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan: linear-gradient(135deg,rgb(122,220,180) 0%,rgb(0,208,130) 100%);--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange: linear-gradient(135deg,rgba(252,185,0,1) 0%,rgba(255,105,0,1) 
100%);--wp--preset--gradient--luminous-vivid-orange-to-vivid-red: linear-gradient(135deg,rgba(255,105,0,1) 0%,rgb(207,46,46) 100%);--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray: linear-gradient(135deg,rgb(238,238,238) 0%,rgb(169,184,195) 100%);--wp--preset--gradient--cool-to-warm-spectrum: linear-gradient(135deg,rgb(74,234,220) 0%,rgb(151,120,209) 20%,rgb(207,42,186) 40%,rgb(238,44,130) 60%,rgb(251,105,98) 80%,rgb(254,248,76) 100%);--wp--preset--gradient--blush-light-purple: linear-gradient(135deg,rgb(255,206,236) 0%,rgb(152,150,240) 100%);--wp--preset--gradient--blush-bordeaux: linear-gradient(135deg,rgb(254,205,165) 0%,rgb(254,45,45) 50%,rgb(107,0,62) 100%);--wp--preset--gradient--luminous-dusk: linear-gradient(135deg,rgb(255,203,112) 0%,rgb(199,81,192) 50%,rgb(65,88,208) 100%);--wp--preset--gradient--pale-ocean: linear-gradient(135deg,rgb(255,245,203) 0%,rgb(182,227,212) 50%,rgb(51,167,181) 100%);--wp--preset--gradient--electric-grass: linear-gradient(135deg,rgb(202,248,128) 0%,rgb(113,206,126) 100%);--wp--preset--gradient--midnight: linear-gradient(135deg,rgb(2,3,129) 0%,rgb(40,116,252) 100%);--wp--preset--gradient--dark-gray-gradient-gradient: linear-gradient(90deg, rgba(17,17,17,1) 0%, rgba(42,42,42,1) 100%);--wp--preset--gradient--light-gray-gradient: linear-gradient(90deg, rgba(241,241,241,1) 0%, rgba(215,215,215,1) 100%);--wp--preset--gradient--white-gradient: linear-gradient(90deg, rgba(255,255,255,1) 0%, rgba(230,230,230,1) 100%);--wp--preset--gradient--yellow-gradient: linear-gradient(90deg, rgba(244,202,22,1) 0%, rgba(205,168,10,1) 100%);--wp--preset--gradient--dark-brown-gradient: linear-gradient(90deg, rgba(53,39,18,1) 0%, rgba(91,67,31,1) 100%);--wp--preset--gradient--medium-pink-gradient: linear-gradient(90deg, rgba(229,59,81,1) 0%, rgba(209,28,51,1) 100%);--wp--preset--gradient--light-pink-gradient: linear-gradient(90deg, rgba(255,229,209,1) 0%, rgba(255,200,158,1) 100%);--wp--preset--gradient--dark-purple-gradient: 
linear-gradient(90deg, rgba(46,34,86,1) 0%, rgba(66,48,123,1) 100%);--wp--preset--gradient--purple-gradient: linear-gradient(90deg, rgba(103,73,112,1) 0%, rgba(131,93,143,1) 100%);--wp--preset--gradient--blue-gray-gradient: linear-gradient(90deg, rgba(34,49,63,1) 0%, rgba(52,75,96,1) 100%);--wp--preset--gradient--bright-blue-gradient: linear-gradient(90deg, rgba(85,195,220,1) 0%, rgba(43,180,211,1) 100%);--wp--preset--gradient--light-blue-gradient: linear-gradient(90deg, rgba(233,242,249,1) 0%, rgba(193,218,238,1) 100%);--wp--preset--font-size--small: 13px;--wp--preset--font-size--medium: 20px;--wp--preset--font-size--large: 36px;--wp--preset--font-size--x-large: 42px;--wp--preset--spacing--20: 0.44rem;--wp--preset--spacing--30: 0.67rem;--wp--preset--spacing--40: 1rem;--wp--preset--spacing--50: 1.5rem;--wp--preset--spacing--60: 2.25rem;--wp--preset--spacing--70: 3.38rem;--wp--preset--spacing--80: 5.06rem;--wp--preset--shadow--natural: 6px 6px 9px rgba(0, 0, 0, 0.2);--wp--preset--shadow--deep: 12px 12px 50px rgba(0, 0, 0, 0.4);--wp--preset--shadow--sharp: 6px 6px 0px rgba(0, 0, 0, 0.2);--wp--preset--shadow--outlined: 6px 6px 0px -3px rgba(255, 255, 255, 1), 6px 6px rgba(0, 0, 0, 1);--wp--preset--shadow--crisp: 6px 6px 0px rgba(0, 0, 0, 1);}:where(.is-layout-flex){gap: 0.5em;}:where(.is-layout-grid){gap: 0.5em;}body .is-layout-flow > .alignleft{float: left;margin-inline-start: 0;margin-inline-end: 2em;}body .is-layout-flow > .alignright{float: right;margin-inline-start: 2em;margin-inline-end: 0;}body .is-layout-flow > .aligncenter{margin-left: auto !important;margin-right: auto !important;}body .is-layout-constrained > .alignleft{float: left;margin-inline-start: 0;margin-inline-end: 2em;}body .is-layout-constrained > .alignright{float: right;margin-inline-start: 2em;margin-inline-end: 0;}body .is-layout-constrained > .aligncenter{margin-left: auto !important;margin-right: auto !important;}body .is-layout-constrained > 
:where(:not(.alignleft):not(.alignright):not(.alignfull)){max-width: var(--wp--style--global--content-size);margin-left: auto !important;margin-right: auto !important;}body .is-layout-constrained > .alignwide{max-width: var(--wp--style--global--wide-size);}body .is-layout-flex{display: flex;}body .is-layout-flex{flex-wrap: wrap;align-items: center;}body .is-layout-flex > *{margin: 0;}body .is-layout-grid{display: grid;}body .is-layout-grid > *{margin: 0;}:where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 2em;}:where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;}.has-black-color{color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-color{color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-color{color: var(--wp--preset--color--white) !important;}.has-pale-pink-color{color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-color{color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-color{color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-color{color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-color{color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-color{color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-color{color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-color{color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-color{color: var(--wp--preset--color--vivid-purple) !important;}.has-black-background-color{background-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-background-color{background-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-background-color{background-color: var(--wp--preset--color--white) 
!important;}.has-pale-pink-background-color{background-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-background-color{background-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-background-color{background-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-background-color{background-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-background-color{background-color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-background-color{background-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-background-color{background-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-background-color{background-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-background-color{background-color: var(--wp--preset--color--vivid-purple) !important;}.has-black-border-color{border-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-border-color{border-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-border-color{border-color: var(--wp--preset--color--white) !important;}.has-pale-pink-border-color{border-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-border-color{border-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-border-color{border-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-border-color{border-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-border-color{border-color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-border-color{border-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-border-color{border-color: var(--wp--preset--color--pale-cyan-blue) 
!important;}.has-vivid-cyan-blue-border-color{border-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-border-color{border-color: var(--wp--preset--color--vivid-purple) !important;}.has-vivid-cyan-blue-to-vivid-purple-gradient-background{background: var(--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple) !important;}.has-light-green-cyan-to-vivid-green-cyan-gradient-background{background: var(--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan) !important;}.has-luminous-vivid-amber-to-luminous-vivid-orange-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange) !important;}.has-luminous-vivid-orange-to-vivid-red-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-orange-to-vivid-red) !important;}.has-very-light-gray-to-cyan-bluish-gray-gradient-background{background: var(--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray) !important;}.has-cool-to-warm-spectrum-gradient-background{background: var(--wp--preset--gradient--cool-to-warm-spectrum) !important;}.has-blush-light-purple-gradient-background{background: var(--wp--preset--gradient--blush-light-purple) !important;}.has-blush-bordeaux-gradient-background{background: var(--wp--preset--gradient--blush-bordeaux) !important;}.has-luminous-dusk-gradient-background{background: var(--wp--preset--gradient--luminous-dusk) !important;}.has-pale-ocean-gradient-background{background: var(--wp--preset--gradient--pale-ocean) !important;}.has-electric-grass-gradient-background{background: var(--wp--preset--gradient--electric-grass) !important;}.has-midnight-gradient-background{background: var(--wp--preset--gradient--midnight) !important;}.has-small-font-size{font-size: var(--wp--preset--font-size--small) !important;}.has-medium-font-size{font-size: var(--wp--preset--font-size--medium) !important;}.has-large-font-size{font-size: var(--wp--preset--font-size--large) 
!important;}.has-x-large-font-size{font-size: var(--wp--preset--font-size--x-large) !important;} .wp-block-navigation a:where(:not(.wp-element-button)){color: inherit;} :where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;} :where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 2em;} .wp-block-pullquote{font-size: 1.5em;line-height: 1.6;} </style> <!-- Twenty Fifteen theme stylesheets (fonts, Genericons, main, blocks), overrides for IE older than 9 and 8 in conditional comments, the GeSHi highlight plugin stylesheet, then jQuery and jQuery Migrate. --> <link rel='stylesheet' id='twentyfifteen-fonts-css' href='https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/assets/fonts/noto-sans-plus-noto-serif-plus-inconsolata.css?ver=20230328' media='all' /> <link rel='stylesheet' id='genericons-css' href='https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/genericons/genericons.css?ver=20201026' media='all' /> <link rel='stylesheet' id='twentyfifteen-style-css' href='https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/style.css?ver=20230328' media='all' /> <link rel='stylesheet' id='twentyfifteen-block-style-css' href='https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/css/blocks.css?ver=20230122' media='all' /> <!--[if lt IE 9]> <link rel='stylesheet' id='twentyfifteen-ie-css' href='https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/css/ie.css?ver=20220908' media='all' /> <![endif]--> <!--[if lt IE 8]> <link rel='stylesheet' id='twentyfifteen-ie7-css' href='https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/css/ie7.css?ver=20141210' media='all' /> <![endif]--> <link rel='stylesheet' id='wpgeshi-wp-geshi-highlight-css' href='https://www.generalist.org.uk/blog/wp-content/plugins/wp-geshi-highlight/wp-geshi-highlight.css?ver=6.4.5' media='all' /> <script src="https://www.generalist.org.uk/blog/wp-includes/js/jquery/jquery.min.js?ver=3.7.1" id="jquery-core-js"></script> <script src="https://www.generalist.org.uk/blog/wp-includes/js/jquery/jquery-migrate.min.js?ver=3.4.1" 
id="jquery-migrate-js"></script> <link rel="https://api.w.org/" href="https://www.generalist.org.uk/blog/wp-json/" /><link rel="alternate" type="application/json" href="https://www.generalist.org.uk/blog/wp-json/wp/v2/tags/78" /><link rel="EditURI" type="application/rsd+xml" title="RSD" href="https://www.generalist.org.uk/blog/xmlrpc.php?rsd" /> <meta name="generator" content="WordPress 6.4.5" /> </head> <body class="archive tag tag-wikidata tag-78 wp-embed-responsive"> <div id="page" class="hfeed site"> <a class="skip-link screen-reader-text" href="#content"> Skip to content </a> <div id="sidebar" class="sidebar"> <header id="masthead" class="site-header"> <div class="site-branding"> <p class="site-title"><a href="https://www.generalist.org.uk/blog/" rel="home">Andrew Gray</a></p> <!-- Sidebar toggle; explicit type="button" so it can never act as a submit control. Its click behaviour is presumably attached by theme script (not visible here). --> <button class="secondary-toggle" type="button">Menu and widgets</button> </div><!-- .site-branding --> </header><!-- .site-header --> <div id="secondary" class="secondary"> <div id="widget-area" class="widget-area" role="complementary"> <!-- Recent Posts widget: each date is wrapped in a time element so it is machine-readable; the span.post-date styling hook is kept. --> <aside id="recent-posts-3" class="widget widget_recent_entries"> <h2 class="widget-title">Recent Posts</h2><nav aria-label="Recent Posts"> <ul> <li> <a href="https://www.generalist.org.uk/blog/2024/caffenol/">Caffenol</a> <span class="post-date"><time datetime="2024-01-11">January 11, 2024</time></span> </li> <li> <a href="https://www.generalist.org.uk/blog/2023/gender-and-blps-on-wikipedia-redux/">Gender and BLPs on Wikipedia, redux</a> <span class="post-date"><time datetime="2023-08-02">August 2, 2023</time></span> </li> <li> <a href="https://www.generalist.org.uk/blog/2023/on-chatgpt/">on chatGPT</a> <span class="post-date"><time datetime="2023-04-10">April 10, 2023</time></span> </li> <li> <a href="https://www.generalist.org.uk/blog/2021/lee-of-portrush-a-timeline/">Lee of Portrush: a timeline</a> <span class="post-date"><time datetime="2021-09-18">September 18, 2021</time></span> </li> <li> <a href="https://www.generalist.org.uk/blog/2020/industrial-library/">Industrial Library</a> <span class="post-date"><time datetime="2020-01-09">January 9, 2020</time></span> </li> </ul> </nav></aside><aside id="tag_cloud-3" class="widget 
widget_tag_cloud"><h2 class="widget-title">Tags</h2><nav aria-label="Tags"><div class="tagcloud"><ul class='wp-tag-cloud' role='list'> <!-- One link per tag. The inline font-size grows with the item count stated in each aria-label: 8pt for 1 item up to 22pt for 24 items. --> <li><a href="https://www.generalist.org.uk/blog/tags/administrivia/" class="tag-cloud-link tag-link-88 tag-link-position-1" style="font-size: 10.290909090909pt;" aria-label="administrivia (2 items)">administrivia</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/antarctica/" class="tag-cloud-link tag-link-72 tag-link-position-2" style="font-size: 10.290909090909pt;" aria-label="antarctica (2 items)">antarctica</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/archives/" class="tag-cloud-link tag-link-15 tag-link-position-3" style="font-size: 10.290909090909pt;" aria-label="archives (2 items)">archives</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/astronomy/" class="tag-cloud-link tag-link-18 tag-link-position-4" style="font-size: 11.818181818182pt;" aria-label="astronomy (3 items)">astronomy</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/books/" class="tag-cloud-link tag-link-9 tag-link-position-5" style="font-size: 16.272727272727pt;" aria-label="books (8 items)">books</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/british-library/" class="tag-cloud-link tag-link-63 tag-link-position-6" style="font-size: 10.290909090909pt;" aria-label="british library (2 items)">british library</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/campaigning/" class="tag-cloud-link tag-link-76 tag-link-position-7" style="font-size: 8pt;" aria-label="campaigning (1 item)">campaigning</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/canadian-collection/" class="tag-cloud-link tag-link-71 tag-link-position-8" style="font-size: 10.290909090909pt;" aria-label="canadian collection (2 items)">canadian collection</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/commonplace/" class="tag-cloud-link tag-link-56 tag-link-position-9" style="font-size: 
13.090909090909pt;" aria-label="commonplace (4 items)">commonplace</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/commons/" class="tag-cloud-link tag-link-75 tag-link-position-10" style="font-size: 10.290909090909pt;" aria-label="commons (2 items)">commons</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/data/" class="tag-cloud-link tag-link-81 tag-link-position-11" style="font-size: 15.636363636364pt;" aria-label="data (7 items)">data</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/digitisation/" class="tag-cloud-link tag-link-103 tag-link-position-12" style="font-size: 8pt;" aria-label="digitisation (1 item)">digitisation</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/economics/" class="tag-cloud-link tag-link-12 tag-link-position-13" style="font-size: 16.272727272727pt;" aria-label="economics (8 items)">economics</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/election/" class="tag-cloud-link tag-link-39 tag-link-position-14" style="font-size: 19.2pt;" aria-label="election (14 items)">election</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/finance/" class="tag-cloud-link tag-link-47 tag-link-position-15" style="font-size: 11.818181818182pt;" aria-label="finance (3 items)">finance</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/freedom-of-information/" class="tag-cloud-link tag-link-31 tag-link-position-16" style="font-size: 10.290909090909pt;" aria-label="freedom of information (2 items)">freedom of information</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/history/" class="tag-cloud-link tag-link-21 tag-link-position-17" style="font-size: 22pt;" aria-label="history (24 items)">history</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/idiocy/" class="tag-cloud-link tag-link-35 tag-link-position-18" style="font-size: 11.818181818182pt;" aria-label="idiocy (3 items)">idiocy</a></li> <li><a 
href="https://www.generalist.org.uk/blog/tags/internet/" class="tag-cloud-link tag-link-22 tag-link-position-19" style="font-size: 11.818181818182pt;" aria-label="internet (3 items)">internet</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/journalism/" class="tag-cloud-link tag-link-24 tag-link-position-20" style="font-size: 13.090909090909pt;" aria-label="journalism (4 items)">journalism</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/law/" class="tag-cloud-link tag-link-51 tag-link-position-21" style="font-size: 10.290909090909pt;" aria-label="law (2 items)">law</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/lee-of-portrush/" class="tag-cloud-link tag-link-95 tag-link-position-22" style="font-size: 10.290909090909pt;" aria-label="lee of portrush (2 items)">lee of portrush</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/legislation/" class="tag-cloud-link tag-link-79 tag-link-position-23" style="font-size: 8pt;" aria-label="legislation (1 item)">legislation</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/libraries/" class="tag-cloud-link tag-link-14 tag-link-position-24" style="font-size: 10.290909090909pt;" aria-label="libraries (2 items)">libraries</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/maps/" class="tag-cloud-link tag-link-50 tag-link-position-25" style="font-size: 10.290909090909pt;" aria-label="maps (2 items)">maps</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/media/" class="tag-cloud-link tag-link-23 tag-link-position-26" style="font-size: 10.290909090909pt;" aria-label="media (2 items)">media</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/mps/" class="tag-cloud-link tag-link-102 tag-link-position-27" style="font-size: 8pt;" aria-label="mps (1 item)">mps</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/open-access/" class="tag-cloud-link tag-link-77 tag-link-position-28" style="font-size: 10.290909090909pt;" 
aria-label="open access (2 items)">open access</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/oxford/" class="tag-cloud-link tag-link-20 tag-link-position-29" style="font-size: 11.818181818182pt;" aria-label="oxford (3 items)">oxford</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/parliament/" class="tag-cloud-link tag-link-100 tag-link-position-30" style="font-size: 10.290909090909pt;" aria-label="parliament (2 items)">parliament</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/photography/" class="tag-cloud-link tag-link-19 tag-link-position-31" style="font-size: 20.981818181818pt;" aria-label="photography (20 items)">photography</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/politics/" class="tag-cloud-link tag-link-8 tag-link-position-32" style="font-size: 21.236363636364pt;" aria-label="politics (21 items)">politics</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/publishing/" class="tag-cloud-link tag-link-27 tag-link-position-33" style="font-size: 16.909090909091pt;" aria-label="publishing (9 items)">publishing</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/recipes/" class="tag-cloud-link tag-link-6 tag-link-position-34" style="font-size: 13.090909090909pt;" aria-label="recipes (4 items)">recipes</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/remembrance/" class="tag-cloud-link tag-link-53 tag-link-position-35" style="font-size: 13.090909090909pt;" aria-label="remembrance (4 items)">remembrance</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/research/" class="tag-cloud-link tag-link-87 tag-link-position-36" style="font-size: 10.290909090909pt;" aria-label="research (2 items)">research</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/scotland/" class="tag-cloud-link tag-link-80 tag-link-position-37" style="font-size: 8pt;" aria-label="scotland (1 item)">scotland</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/security/" 
class="tag-cloud-link tag-link-28 tag-link-position-38" style="font-size: 10.290909090909pt;" aria-label="security (2 items)">security</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/software/" class="tag-cloud-link tag-link-46 tag-link-position-39" style="font-size: 10.290909090909pt;" aria-label="software (2 items)">software</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/statistics/" class="tag-cloud-link tag-link-25 tag-link-position-40" style="font-size: 16.909090909091pt;" aria-label="statistics (9 items)">statistics</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/travel/" class="tag-cloud-link tag-link-34 tag-link-position-41" style="font-size: 11.818181818182pt;" aria-label="travel (3 items)">travel</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/wikidata/" class="tag-cloud-link tag-link-78 tag-link-position-42" style="font-size: 16.272727272727pt;" aria-label="wikidata (8 items)">wikidata</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/wikimedia/" class="tag-cloud-link tag-link-74 tag-link-position-43" style="font-size: 13.090909090909pt;" aria-label="wikimedia (4 items)">wikimedia</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/wikipedia/" class="tag-cloud-link tag-link-26 tag-link-position-44" style="font-size: 21.745454545455pt;" aria-label="wikipedia (23 items)">wikipedia</a></li> <li><a href="https://www.generalist.org.uk/blog/tags/ww1/" class="tag-cloud-link tag-link-65 tag-link-position-45" style="font-size: 13.090909090909pt;" aria-label="ww1 (4 items)">ww1</a></li> </ul> </div> </nav></aside><!-- Archives widget: labelled month dropdown whose option values are archive URLs; navigation on change is presumably handled by a script outside this view. --><aside id="archives-3" class="widget widget_archive"><h2 class="widget-title">Archives</h2> <label class="screen-reader-text" for="archives-dropdown-3">Archives</label> <select id="archives-dropdown-3" name="archive-dropdown"> <option value="">Select Month</option> <option value='https://www.generalist.org.uk/blog/2024/01/'> January 2024 &nbsp;(1)</option> <option 
value='https://www.generalist.org.uk/blog/2023/08/'> August 2023 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2023/04/'> April 2023 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2021/09/'> September 2021 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2020/01/'> January 2020 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2019/05/'> May 2019 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2019/03/'> March 2019 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2019/02/'> February 2019 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2018/11/'> November 2018 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2018/10/'> October 2018 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2017/09/'> September 2017 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2017/01/'> January 2017 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2016/08/'> August 2016 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2016/04/'> April 2016 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2016/02/'> February 2016 &nbsp;(3)</option> <option value='https://www.generalist.org.uk/blog/2016/01/'> January 2016 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2015/12/'> December 2015 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2015/11/'> November 2015 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2015/10/'> October 2015 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2015/08/'> August 2015 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2015/02/'> February 2015 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2015/01/'> January 2015 &nbsp;(1)</option> <option 
value='https://www.generalist.org.uk/blog/2014/11/'> November 2014 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2014/10/'> October 2014 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2014/09/'> September 2014 &nbsp;(3)</option> <option value='https://www.generalist.org.uk/blog/2014/08/'> August 2014 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2013/12/'> December 2013 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2013/08/'> August 2013 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2013/06/'> June 2013 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2013/05/'> May 2013 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2013/04/'> April 2013 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2013/02/'> February 2013 &nbsp;(3)</option> <option value='https://www.generalist.org.uk/blog/2012/12/'> December 2012 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2012/11/'> November 2012 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2012/10/'> October 2012 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2012/02/'> February 2012 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2011/11/'> November 2011 &nbsp;(3)</option> <option value='https://www.generalist.org.uk/blog/2011/07/'> July 2011 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2011/06/'> June 2011 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2011/05/'> May 2011 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2011/02/'> February 2011 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2011/01/'> January 2011 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2010/12/'> December 2010 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2010/11/'> 
November 2010 &nbsp;(6)</option> <option value='https://www.generalist.org.uk/blog/2010/10/'> October 2010 &nbsp;(5)</option> <option value='https://www.generalist.org.uk/blog/2010/09/'> September 2010 &nbsp;(1)</option> <option value='https://www.generalist.org.uk/blog/2010/08/'> August 2010 &nbsp;(4)</option> <option value='https://www.generalist.org.uk/blog/2010/07/'> July 2010 &nbsp;(2)</option> <option value='https://www.generalist.org.uk/blog/2010/06/'> June 2010 &nbsp;(4)</option> <option value='https://www.generalist.org.uk/blog/2010/05/'> May 2010 &nbsp;(11)</option> <option value='https://www.generalist.org.uk/blog/2010/04/'> April 2010 &nbsp;(10)</option> <option value='https://www.generalist.org.uk/blog/2010/03/'> March 2010 &nbsp;(9)</option> <option value='https://www.generalist.org.uk/blog/2010/02/'> February 2010 &nbsp;(8)</option> <option value='https://www.generalist.org.uk/blog/2010/01/'> January 2010 &nbsp;(8)</option> <option value='https://www.generalist.org.uk/blog/2009/12/'> December 2009 &nbsp;(3)</option> <option value='https://www.generalist.org.uk/blog/2009/11/'> November 2009 &nbsp;(7)</option> </select> <script> (function() { var dropdown = document.getElementById( "archives-dropdown-3" ); function onSelectChange() { if ( dropdown.options[ dropdown.selectedIndex ].value !== '' ) { document.location.href = this.options[ this.selectedIndex ].value; } } dropdown.onchange = onSelectChange; })(); </script> </aside><aside id="block-6" class="widget widget_block"><h2 class="widget-title">Elsewhere</h2> <ul><li><a href="https://twitter.com/generalising" data-type="URL" data-id="https://twitter.com/generalising" target="_blank" rel="noreferrer noopener">Twitter</a></li><li><a href="https://mastodon.flooey.org/web/@generalising" data-type="URL" data-id="https://mastodon.flooey.org/web/@generalising" target="_blank" rel="me noreferrer noopener">Mastodon</a></li></ul></aside> </div><!-- .widget-area --> </div><!-- .secondary --> </div><!-- 
.sidebar --> <div id="content" class="site-content"> <section id="primary" class="content-area"> <main id="main" class="site-main"> <header class="page-header"> <h1 class="page-title">Tag: <span>wikidata</span></h1> </header><!-- .page-header --> <article id="post-1714" class="post-1714 post type-post status-publish format-standard hentry category-andrew tag-data tag-statistics tag-wikidata tag-wikipedia"> <header class="entry-header"> <h2 class="entry-title"><a href="https://www.generalist.org.uk/blog/2023/gender-and-blps-on-wikipedia-redux/" rel="bookmark">Gender and BLPs on Wikipedia, redux</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p>Back in 2019 I <a rel="noreferrer noopener" href="https://www.generalist.org.uk/blog/2019/gender-and-deletion-on-wikipedia/" target="_blank">generated some data</a> on how the English Wikipedia&#8217;s biographies of living people (BLPs) broke down by gender, and how that intersected with creation and deletion rates. The headline figures were that:</p> <ul> <li>There was a significant difference between the gender split for all biographies, at 17.8% women &#8211; and for biographies of living people (BLPs), 22.7%.</li> <li>In 2009, around 20% of <em>existing</em> BLPs were on women. As time went on, the average <em>share</em> of BLPs increased slowly, by perhaps a quarter of a percentage point per year.</li> <li>In 2009, around 20% of <em>newly created</em> BLPs were on women. 
In about 2012, this kicked up a gear, rising above the long term average &#8211; first to about 25%, peaking around 33% before falling back a little.</li> <li>BLP articles on women were more likely to be nominated for deletion <em>until about 2017</em>, when the effect disappeared.</li> </ul> <p>One thing that was raised during the subsequent discussion was that a lot of the skew by gender was potentially linked to subject area &#8211; I was able to identify that for athletes (defined broadly, all sports players) the articles were much more likely to be men. I didn&#8217;t investigate this too much, though. Last week, I was <a rel="noreferrer noopener" href="https://en.wikipedia.org/wiki/Wikipedia_talk:WikiProject_Women_in_Red#Topics_that_account_for_a_disproportionate_amount_of_the_gender_gap_in_biographies" target="_blank">reminded about this</a>, and I&#8217;ve been looking at the numbers again. It brought up two interesting divergences.</p> <h3 class="wp-block-heading">Please don&#8217;t make me read all this</h3> <p>Okay &#8211; but you&#8217;ll miss the graphs. In summary:</p> <p><em>English Wikipedia has more women in recent cohorts (about 25% of living people born since the seventies) and there are far more men among athletes. Since the athletes make up a staggeringly high number of articles among younger subjects, the gender split among non-athletes is much more balanced &#8211; a little under a third overall, but breaking 50% female among the younger cohorts.</em></p> <p>Still with me? Let&#8217;s start. Sorry about the spoilers.</p> <h3 class="wp-block-heading">Time and tide</h3> <p>The first phenomenon is very straightforward: while the overall percentage across all people is around 25% women, how that is <em>distributed</em> over time varies. 
In general, there is a steady rise until about the 1970s; <strong>for those born from the 1970s onwards, the generation who are currently in their active working lives, the level is relatively stable at around 25% women.</strong></p> <p>The exception is those born in the 1920s (where it sits at 26%) &#8211; this is presumably affected by the fact that at this point, female life expectancy is significantly higher than male, and so the proportion of women begins to rise as a result.</p> <figure class="wp-block-image size-full"><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-people-on-Wikipedia-female1.png"><img fetchpriority="high" decoding="async" width="600" height="371" src="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-people-on-Wikipedia-female1.png" alt="Graph showing the percentage of women among living people with English Wikipedia biographies, by decade of birth" class="wp-image-1730" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-people-on-Wikipedia-female1.png 600w, https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-people-on-Wikipedia-female1-300x186.png 300w" sizes="(max-width: 600px) 100vw, 600px" /></a></figure> <p>One surprising outcome, however, is that <strong>the share of living people with no recorded age (green) is much more female than the average</strong>. This is a <em>large</em> cohort &#8211; there are in fact slightly more women in it than in any individual decade. I believe that it skews young &#8211; in other words, were this information known, it would increase the share of women in recent decades &#8211; but it is hard to find a way to confirm this. This issue is discussed in more detail below.</p> <p>(Those born in the 2010s/20s and in the 1900s/10s are omitted &#8211; the four groups have a total of 175 articles, while the cohorts shown range from 5,000 to 170,000 &#8211; but the levels are around 50%. 
This is likely due to life expectancy in the oldest cohorts, and the fact that the people in the youngest cohorts are mostly notable at this point as being &#8220;the child of someone famous&#8221; &#8211; which you would broadly expect to be independent of gender.)</p> <p>The percentages shown here are of the total male + female articles, but it is also possible to calculate the share of people who have a recorded gender that is not male/female. These show a very striking rise over time, though it should be cautioned that the absolute numbers are small &#8211; the largest single cohort is the 1980s with 345 people out of 170,000.</p> <figure class="wp-block-image size-full"><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-people-on-Wikipedia-not-M_F.png"><img decoding="async" width="600" height="371" src="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-people-on-Wikipedia-not-M_F.png" alt="Graph showing the share of living people on English Wikipedia with a recorded gender other than male or female, by decade of birth" class="wp-image-1723" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-people-on-Wikipedia-not-M_F.png 600w, https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-people-on-Wikipedia-not-M_F-300x186.png 300w" sizes="(max-width: 600px) 100vw, 600px" /></a></figure> <h3 class="wp-block-heading">Sports by the numbers</h3> <p>The original question was to look at what the effect of athlete articles is on the overall totals. It turns out&#8230; very striking. 
</p> <figure class="wp-block-image size-full is-resized"><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Living-people-on-Wikipedia-by-sports-status.png"><img decoding="async" src="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Living-people-on-Wikipedia-by-sports-status.png" alt="Graph showing living people on English Wikipedia by decade of birth, split into athletes and non-athletes" class="wp-image-1726" width="600" height="371" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Living-people-on-Wikipedia-by-sports-status.png 600w, https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Living-people-on-Wikipedia-by-sports-status-300x186.png 300w" sizes="(max-width: 600px) 100vw, 600px" /></a></figure> <p>A few things are immediately apparent. The first is that <strong>the share of athletes is very substantial</strong> &#8211; it reflects only around a quarter of people born in the 1950s, but 85-90% of people born in the 1990s/2000s. </p> <p>The second is that <strong>those athletes are overwhelmingly men</strong> &#8211; among the 1950s cohort, only about 10% of those athletes are female, and even by recent years it is only around 20%. This means that if we look purely at the non-athlete articles, the gender split becomes a lot more balanced. 
</p> <figure class="wp-block-image size-full"><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-non-athletes-on-Wikipedia-female.png"><img loading="lazy" decoding="async" width="600" height="371" src="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-non-athletes-on-Wikipedia-female.png" alt="Graph showing the percentage of women among living non-athletes on English Wikipedia, by decade of birth" class="wp-image-1727" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-non-athletes-on-Wikipedia-female.png 600w, https://www.generalist.org.uk/blog/wp-content/uploads/2023/08/Gender-split-for-living-non-athletes-on-Wikipedia-female-300x186.png 300w" sizes="(max-width: 600px) 100vw, 600px" /></a></figure> <p>Across all articles, it is around 32% female. But <strong>among living non-athletes born since 1990, the gender balance is over 50% female.</strong></p> <p>This is a really amazing figure. I don&#8217;t think I ever particularly expected to see a gender analysis on Wikipedia that would break 50%. Granted, the absolute numbers involved are low &#8211; as is apparent from the previous graph, &#8220;non-athletes born in the 1990s&#8221; is around 22,000 people, and &#8220;born in the 2000s&#8221; is as low as 2,500 &#8211; but it&#8217;s a pretty solid trend and the total numbers for the earlier decades are definitely large enough for it to be no anomaly.</p> <p>(Eagle-eyed readers will note that these do not quite align with the numbers in the original linked discussion &#8211; those were a couple of points lower in recent decades. I have not quite worked out why, but I think this was an error in the earlier queries; possibly it was counting redirects?)</p> <p>One last detail to note: the &#8220;date missing&#8221; cohort comes out over 90% <em>non</em>-athletes. Presumably this is because their exact age is often significant and linked in to eg when they start professional sports, so it&#8217;s easily publicly available. 
</p> <h3 class="wp-block-heading">Methodology: the thousand word footnote</h3> <p>Feel free to let your eyes glaze over now.</p> <p>These numbers were constructed mostly using the <a rel="noreferrer noopener" href="https://petscan.wmflabs.org/" data-type="URL" data-id="https://petscan.wmflabs.org/" target="_blank">petscan</a> tool, and leveraging data from both English Wikipedia and Wikidata. From Wikipedia, we have a robust categorisation system for year/decade of birth, and for whether someone is a living person. From Wikidata, we have fairly comprehensive gender data, which Wikipedia doesn&#8217;t know about. (It also has dates of birth, but it is more efficient to use WP categories here). So it is straightforward to produce intersection queries like &#8220;all living people marked as 1920s births and marked as female&#8221; (<a href="https://petscan.wmflabs.org/?outlinks_any=&amp;namespace_conversion=keep&amp;cb_labels_any_l=1&amp;labels_no=&amp;search_wiki=&amp;common_wiki=auto&amp;show_soft_redirects=both&amp;depth=0&amp;sitelinks_no=&amp;show_redirects=no&amp;min_redlink_count=1&amp;categories=Living+people%0D%0A1920s+births%7C1&amp;sparql=select+*+where+%7B+%3Fitem+wdt%3AP21+wd%3AQ6581072+%7D&amp;output_compatability=catscan&amp;templates_any=&amp;active_tab=tab_other_sources&amp;langs_labels_no=&amp;maxlinks=&amp;sitelinks_yes=&amp;links_to_all=&amp;cb_labels_yes_l=1&amp;edits%5Bflagged%5D=both&amp;interface_language=en&amp;search_max_results=500&amp;templates_yes=&amp;format=html&amp;show_disambiguation_pages=no&amp;language=en&amp;referrer_name=&amp;negcats=&amp;project=wikipedia&amp;combination=subset&amp;ns%5B0%5D=1&amp;sortorder=ascending&amp;edits%5Bbots%5D=both&amp;min_sitelink_count=&amp;page_image=any&amp;max_age=&amp;edits%5Banons%5D=both&amp;cb_labels_no_l=1&amp;subpage_filter=either">report</a>). 
Note that this is crunching a lot of data &#8211; don&#8217;t be surprised if queries take a minute or two to run or occasionally time out.</p> <p>To my surprise, the report for &#8220;living people known to be female&#8221; initially produced a reliable figure, but one for &#8220;living people known to be male&#8221; produced a figure that was an undercount. (I could validate this by checking against some small categories where I could run a report listing the gender of every item). The root cause seemed to be a timeout in the Wikidata query &#8211; I was originally looking for <em>{ ?item wdt:P31 wd:Q5 . ?item wdt:P21 wd:Q6581097 }</em> &#8211; items known to be human with gender male. Tweaking this to be simply <em>{ ?item wdt:P21 wd:Q6581097 }</em> &#8211; items with gender male &#8211; produced a reliable figure. Similarly, we had the same issue when trying to get a total for all items with reported gender &#8211; simply <em>{ ?item wdt:P21 ?val }</em> works.</p> <p>Percentages are calculated as percentage of the number of articles identified as (male + female), rather than of all BLPs with a recorded gender value or simply of all BLPs. There are good arguments for either of the first two, but the former is simpler (some of my &#8220;any recorded gender value&#8221; queries timed out) and also consistent with the 2019 analysis. </p> <p>A thornier problem comes from the sports element. There are a number of potential ways we could determine &#8220;sportiness&#8221;. The easiest option would be to use Wikidata occupation and look for something that indicates their occupation is some form of athlete, or that indicates a sport being played. The problem is that this is too all-encompassing, and would give us people who <em>played</em> sports but for whom it is not their main claim to fame. An alternative is to use the Wikipedia article categorisation hierarchy, but this is very complex and deep, making the queries very difficult to work with. 
The category hierarchy includes a number of surprise crosslinks and loops, meaning that deep queries tend to get very confusing results, or just time out.</p> <p>The approach I eventually went with was to use Wikipedia&#8217;s infoboxes &#8211; the little standardised box on the top right of a page. There are a wide range of distinct infobox templates tailored to specific fields; each article usually only displays one, but can embed elements of others to bring in secondary data. If we look for articles using one of the 77(!) distinct sports infoboxes (<a rel="noreferrer noopener" href="https://petscan.wmflabs.org/?labels_any=&amp;labels_yes=&amp;regexp_filter=&amp;search_query=&amp;templates_no=&amp;manual_list=&amp;links_to_any=&amp;categories=Living+people&amp;output_limit=&amp;labels_no=&amp;ores_type=any&amp;edits%5Bflagged%5D=both&amp;outlinks_any=&amp;namespace_conversion=keep&amp;psid=25494250&amp;maxlinks=&amp;cb_labels_no_l=1&amp;templates_any=Infobox+F1+driver%0D%0AInfobox+professional+wrestler%0D%0AInfobox+tennis+biography%0D%0AInfobox+boxer%0D%0AInfobox+Canadian+Football+League+biography%0D%0AInfobox+figure+skater%0D%0AInfobox+snooker+player%0D%0AInfobox+Champ+Car+driver%0D%0AInfobox+sumo+wrestler%0D%0AInfobox+Gaelic+games+player%0D%0AInfobox+basketball+biography%0D%0AInfobox+ice+hockey+biography%0D%0AInfobox+college+coach%0D%0AInfobox+bodybuilder%0D%0AInfobox+British+Touring+Car+Championship+record%0D%0AInfobox+rugby+biography%0D%0AInfobox+rugby+league+biography%0D%0AInfobox+lacrosse+player%0D%0AInfobox+V8+Supercar+record%0D%0AInfobox+darts+player%0D%0AInfobox+NASCAR+driver%0D%0AInfobox+field+hockey+player%0D%0AInfobox+sports+announcer+details%0D%0AInfobox+volleyball+biography%0D%0AInfobox+NCAA+athlete%0D%0AInfobox+WRC+driver%0D%0AInfobox+Gaelic+games+manager%0D%0AInfobox+cyclist%0D%0AInfobox+badminton+player%0D%0AInfobox+alpine+ski+racer%0D%0AInfobox+go+player%0D%0AInfobox+baseball+biography%0D%0AInfobox+horseracing+personality%0D%0AInfobox+racing+driv
er%0D%0AInfobox+skier%0D%0AInfobox+Le+Mans+driver%0D%0AInfobox+chess+biography%0D%0AInfobox+speed+skater%0D%0AInfobox+speedway+rider%0D%0AInfobox+swimmer%0D%0AInfobox+NFL+biography%0D%0AInfobox+cricketer%0D%0AInfobox+martial+artist%0D%0AInfobox+amateur+wrestler%0D%0AInfobox+AFL+biography%0D%0AInfobox+college+football+player%0D%0AInfobox+table+tennis+player%0D%0AInfobox+Motocross+rider%0D%0AInfobox+motorcycle+rider%0D%0AInfobox+netball+biography%0D%0AInfobox+handball+biography%0D%0AInfobox+gymnast%0D%0AInfobox+sportsperson%0D%0AInfobox+climber%0D%0AInfobox+boxer+%28amateur%29%0D%0AInfobox+golfer%0D%0AInfobox+football+official%0D%0AInfobox+squash+player%0D%0AInfobox+surfer%0D%0AInfobox+professional+bowler%0D%0AInfobox+pelotari%0D%0AInfobox+curler%0D%0AInfobox+fencer%0D%0AInfobox+bullfighting+career%0D%0AInfobox+mountaineer%0D%0AInfobox+tennis+player+season%0D%0AInfobox+racing+driver+series+section%0D%0AInfobox+sailor%0D%0AInfobox+biathlete%0D%0AInfobox+sport+wrestler%0D%0AInfobox+football+biography%0D%0AInfobox+bandy+biography%0D%0AInfobox+checkers+biography%0D%0AInfobox+water+polo+biography%0D%0AInfobox+sportsperson%2FWikidata%0D%0AInfobox+pool+player%0D%0AInfobox+judoka&amp;templates_yes=&amp;sitelinks_no=&amp;cb_labels_any_l=1&amp;search_max_results=500&amp;source_combination=&amp;language=en&amp;sortby=none&amp;langs_labels_no=&amp;common_wiki_other=&amp;cb_labels_yes_l=1&amp;langs_labels_any=&amp;edits%5Banons%5D=both&amp;project=wikipedia&amp;links_to_all=&amp;depth=0&amp;referrer_name=&amp;wpiu=any&amp;negcats=&amp;combination=subset&amp;ns%5B0%5D=1&amp;min_sitelink_count=&amp;referrer_url=&amp;active_tab=tab_templates_n_links&amp;interface_language=en&amp;before=&amp;wikidata_prop_item_use=" target="_blank">report</a>), we can conclude they probably had a significant sporting career. 
An article that does not contain one can be inferred to not have a sporting background.</p> <p>But then we need to consider people with significant sports <em>and</em> non-sports careers. For example, the biographies of both <a rel="noreferrer noopener" href="https://en.wikipedia.org/wiki/Sebastian_Coe" data-type="URL" data-id="https://en.wikipedia.org/wiki/Sebastian_Coe" target="_blank">Seb Coe</a> and <a rel="noreferrer noopener" href="https://en.wikipedia.org/wiki/Tanni_Grey-Thompson" data-type="URL" data-id="https://en.wikipedia.org/wiki/Tanni_Grey-Thompson" target="_blank">Tanni Grey-Thompson</a> use the &#8220;infobox officeholder&#8221; to reflect their careers in Parliament being more recent, but it is set up to embed a sports infobox towards the end. This would entail them being counted as athletes by our infobox method. This is probably correct for <em>those</em> two, but there are no doubt people out there where we would draw the line differently. (To stay in the UK political theme: how about <a href="https://en.wikipedia.org/wiki/Henry_McLeish" data-type="URL" data-id="https://en.wikipedia.org/wiki/Henry_McLeish">Henry McLeish</a>? His athletic career on its own would probably <em>just</em> qualify for a Wikipedia biography, but it is, perhaps, a bit of a footnote compared to being First Minister&#8230;)</p> <p>So, here is another complication. How reliable is our assumption that an athlete has a sports infobox, and that non-athletes don&#8217;t? If it&#8217;s broadly true, great, our numbers hold up. If it&#8217;s not, and if it&#8217;s not in some kind of systematic way, there might be a more complex skew. I <em>believe</em> that for modern athletes, it&#8217;s reasonably safe to assume that infoboxes are nearly ubiquitous; there are groups of articles where they&#8217;re less common, but this isn&#8217;t one of them. 
However, I can&#8217;t say for sure; it&#8217;s not an area I&#8217;ve worked intensively in.</p> <p>Finally, we have the issue of dates. We&#8217;ve based the calculation on Wikipedia categories. Wikipedia birth/death categories are pretty reliably used where that data is known. However, about 150k (14%) of our BLP articles are marked &#8220;year of birth unknown&#8221;, and these are disproportionately female (35.4%). </p> <p>What effect do these factors have?</p> <p>Counting the stats as percentage of M+F rather than percentage of all people with recorded gender could be argued either way, but the numbers involved are quite low and do not change the overall pattern of the results.</p> <p>The infobox question is more complicated. It is possible that it means we are not picking up all athletes because they do not have infoboxes. On the other hand, it is possible that it means we are being more expansive in counting people as athletes because they have a &#8220;secondary&#8221; infobox along the line of Coe &amp; Grey-Thompson above. The problem there is defining where we draw the line, and what level of &#8220;other significance&#8221; stops someone being counted. That feels like a very subjective threshold and hard to test for automatically. It is certainly a more conservative test than a Wikidata-based one, at least.</p> <p>And for dates, hmm. We know that the articles that do not report an age are disproportionately female (35% vs the BLP average of 25%), but also that they are <em>even</em> more disproportionately &#8220;not athletes&#8221; (7% athletes vs the BLP average of 43%). There are also a lot of articles that don&#8217;t report an age; around 14% of all BLPs.</p> <p>This one probably introduces the biggest question mark here. 
Depending on how that 14% breaks down, it could change the totals for the year-by-year cohorts; but there&#8217;s not really much we can do at the moment to work that out.</p> <p>Anecdotally, I suspect that they are more likely to skew younger rather than being evenly distributed over time, but there is very little to go on here. However, I feel it is unlikely they would be distributed in such a way as to <em>counteract</em> the overall conclusions &#8211; this would require, for example, the female ones being predominantly shifted into older groups and the male ones into younger groups. It&#8217;s possible, but I don&#8217;t see an obvious mechanism to cause that.</p> <p><em>[Edit 4/8/23 &#8211; tweaked to confirm that these are English Wikipedia only figures, after a reminder from <a rel="noreferrer noopener" href="https://hildabastian.wordpress.com/2023/08/04/some-knowledge-gaps-are-no-coincidence/" data-type="URL" data-id="https://hildabastian.wordpress.com/2023/08/04/some-knowledge-gaps-are-no-coincidence/" target="_blank">Hilda</a>. 
I would be very interested in seeing similar data for other projects, but the methodology might be tricky to translate &#8211; eg French and German do not have an equivalent category for indexing living people, and different projects may have quite different approaches for applying infoboxes.]</em></p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://www.generalist.org.uk/blog/2023/gender-and-blps-on-wikipedia-redux/" rel="bookmark"><time class="entry-date published" datetime="2023-08-02T23:36:52+01:00">August 2, 2023</time><time class="updated" datetime="2023-08-04T18:14:40+01:00">August 4, 2023</time></a></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://www.generalist.org.uk/blog/authors/andrew/" rel="category tag">Andrew</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://www.generalist.org.uk/blog/tags/data/" rel="tag">data</a>, <a href="https://www.generalist.org.uk/blog/tags/statistics/" rel="tag">statistics</a>, <a href="https://www.generalist.org.uk/blog/tags/wikidata/" rel="tag">wikidata</a>, <a href="https://www.generalist.org.uk/blog/tags/wikipedia/" rel="tag">wikipedia</a></span><span class="comments-link"><a href="https://www.generalist.org.uk/blog/2023/gender-and-blps-on-wikipedia-redux/#comments">1 Comment<span class="screen-reader-text"> on Gender and BLPs on Wikipedia, redux</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-1714 --> <article id="post-1578" class="post-1578 post type-post status-publish format-standard hentry category-andrew tag-data tag-statistics tag-wikidata tag-wikipedia"> <header class="entry-header"> <h2 class="entry-title"><a href="https://www.generalist.org.uk/blog/2019/gender-and-deletion-on-wikipedia/" rel="bookmark">Gender and deletion on Wikipedia</a></h2> </header><!-- .entry-header --> <div 
class="entry-content"> <p>So, a really interesting question <a href="https://www.wikidata.org/wiki/Wikidata:Request_a_query#Question_about_BLPs">cropped up</a> this weekend:</p> <blockquote><p> I&#8217;m trying to find out how many biographies of living persons exist on the English Wikipedia, and what kind of data we have on them. In particular, I&#8217;m looking for the gender breakdown. I&#8217;d also like to know when they were created; average length; and whether they&#8217;ve been nominated for deletion.</p></blockquote> <p>This is, of course, something that&#8217;s being discussed a lot right now; there is a lot of emerging push-back against the <a href="https://www.nature.com/articles/d41586-018-05947-8">excellent work</a> being done to try and add more notable women to Wikipedia, and one particular deletion debate <a href="https://undark.org/2019/04/25/wikipedia-diversity-problem/">got a lot of attention</a> in the past few weeks, so it&#8217;s on everyone&#8217;s mind. And, instinctively, it seems plausible that there is a bias in the relative frequency of nomination for deletion &#8211; can we find if it&#8217;s there?</p> <p>My initial assumption was, huh, I don&#8217;t think we can do that with Wikidata. Then I went off and thought about it for a bit more, and realised we could get <i>most</i> of the way there with some inferences. Here&#8217;s the results, and how I got there. Thanks to <a href="https://www.wikidata.org/wiki/User:SlimVirgin">Sarah</a> for prompting the research!</p> <p>(If you want to get the tl;dr summary &#8211; yes, there is <b>some kind</b> of difference in the way older male vs female articles have been involved with the deletion process, but exactly what that indicates is not obvious without data I can&#8217;t get at. 
The difference seems to have <i>mostly</i> disappeared for articles created in the last couple of years.)</p> <h3>Statistics on the gender breakdown of BLPs</h3> <p>As of a snapshot of yesterday morning, 5 May 2019, the English Wikipedia had 906,720 articles identified as biographies of living people (BLPs for short). Of those, 697,402 were identified as male by Wikidata, 205,117 as female, 2464 had some other value for gender, 1220 didn&#8217;t have any value for gender (usually articles on <i>groups</i> of people, plus some not yet updated), and 517 simply didn&#8217;t have a connected Wikidata item (yet). Of those with known gender, it breaks down as 77.06% male, 22.67% female, and 0.27% some other value. (Because of the limits of the query, I didn&#8217;t try and break down those in any more detail.)</p> <p>This is, as noted, only articles about <i>living people</i>; across <a href="https://www.denelezh.org/gender-gap/?project=enwiki&amp;sort=label">all 1,626,232 biographies in the English Wikipedia</a> with a gender known to Wikidata, it&#8217;s about 17.83% female, 82.13% male, and 0.05% some other value. I&#8217;ll be sticking to data on living people throughout this post, but it&#8217;s interesting to compare the historic information.</p> <p>So, how has that changed over time?</p> <p><a title="Andrew Gray [CC BY-SA 3.0 (https://creativecommons.org/licenses/by-sa/3.0)], via Wikimedia Commons" href="https://commons.wikimedia.org/wiki/File:BLPs_by_gender_and_date_of_creation.png"><img decoding="async" alt="BLPs by gender and date of creation" src="https://upload.wikimedia.org/wikipedia/commons/4/42/BLPs_by_gender_and_date_of_creation.png" width="512"></a></p> <p>This graph shows all existing BLPs, broken down by gender and (approximately) when they were created. 
As can be seen, and as might be expected, the gap has closed a bit over time.</p> <p><a title="Andrew Gray [CC BY-SA 3.0 (https://creativecommons.org/licenses/by-sa/3.0)], via Wikimedia Commons" href="https://commons.wikimedia.org/wiki/File:Percentage_of_BLPs_which_are_female_over_time.png"><img decoding="async" alt="Percentage of BLPs which are female over time" src="https://upload.wikimedia.org/wikipedia/commons/c/c0/Percentage_of_BLPs_which_are_female_over_time.png" width="512"></a></p> <p>Looking at the ratio over time (expressed here as %age of total male+female), the relative share of female BLPs was ~20% in 2009. In late 2012, the rate of creation of female BLPs kicked up a gear, and from then on it&#8217;s been noticeably above the long-term average (almost hitting 33% in late 2017, but dropping back since then). This has driven the overall share steadily and continually upwards, now at 22.7% (as noted above).</p> <p>Now the second question, do the article lengths differ by gender? Indeed they do, by a small amount.</p> <p><a title="Andrew Gray [CC BY-SA 3.0 (https://creativecommons.org/licenses/by-sa/3.0)], via Wikimedia Commons" href="https://commons.wikimedia.org/wiki/File:BLPs_by_current_article_size_and_date_of_creation.png"><img decoding="async" alt="BLPs by current article size and date of creation" src="https://upload.wikimedia.org/wikipedia/commons/e/ea/BLPs_by_current_article_size_and_date_of_creation.png" width="512"></a></p> <p>Female BLPs created at any time since 2009 are slightly longer on average than male ones of similar age, with only a couple of brief exceptions; the gap may be widening over the past year but it&#8217;s maybe too soon to say for sure. Average difference is about 500 bytes or a little under 10% of mean article size &#8211; not dramatic but probably not trivial either. 
(Pre-2009 articles, not shown here, are about even on average)</p> <p>Note that this is raw bytesize &#8211; actual prose size will be smaller, particularly if an article is well-referenced; a single well-structured reference can be a few hundred characters. It&#8217;s also the <i>current</i> article size, not size at creation, hence why older articles tend to be longer &#8211; they&#8217;ve had more time to grow. It&#8217;s interesting to note that once they&#8217;re more than about five years old they seem to plateau in average length.</p> <p>Finally, the third question &#8211; have they been nominated for deletion? This was really interesting.</p> <p><a title="Andrew Gray [CC BY-SA 3.0 (https://creativecommons.org/licenses/by-sa/3.0)], via Wikimedia Commons" href="https://commons.wikimedia.org/wiki/File:Percentage_of_BLPs_which_have_previously_been_to_AFD,_by_date_of_creation_and_gender.png"><img decoding="async" alt="Percentage of BLPs which have previously been to AFD, by date of creation and gender" src="https://upload.wikimedia.org/wikipedia/commons/c/c2/Percentage_of_BLPs_which_have_previously_been_to_AFD%2C_by_date_of_creation_and_gender.png" width="512"></a></p> <p>So, first of all, some caveats. This only identifies articles which go through the structured &#8220;articles for deletion&#8221; (AFD) process &#8211; nomination, discussion, decision to keep or delete. (There are <a href="https://en.wikipedia.org/wiki/Wikipedia:Deletion_process">three deletion processes</a> on Wikipedia; the other two are more lightweight and do not show up in an easily traceable form). It also cannot specifically identify if <i>that exact page</i> was nominated for deletion, only that &#8220;an article with exactly the same page name has been nominated in the past&#8221; &#8211; but the odds are good they&#8217;re the same if there&#8217;s a match. 
It will miss out any where the article was renamed after the deletion discussion, and, most critically, <i>it will only see articles that survived deletion</i>. If they were deleted, I won&#8217;t be able to see them in this analysis, so there&#8217;s an obvious survivorship bias limiting what conclusions we can draw.</p> <p>Having said all that&#8230;</p> <p>Female BLPs created 2009-16 appear noticeably more likely than male BLPs of equivalent age to have been through a deletion discussion at some point in their lives (and, presumably, all have been kept). Since 2016, this has changed and the two groups are about even.</p> <p>Alongside this, there is a corresponding drop-off in the number of articles created since 2016 which have associated deletion discussions. My tentative hypothesis is that articles created in the last few years are generally less likely to be nominated for deletion, perhaps because the growing use of things like the draft namespace (and associated reviews) means that articles are more robust when first published. Conversely, though, it&#8217;s possible that nominations continue at the same rate, but the deletion process is just more rigorous now and a higher proportion of those which are nominated get deleted (and so disappear from our data). We can&#8217;t tell.</p> <p>(One possible explanation that we can tentatively dismiss is age &#8211; an article can be nominated at any point in its lifespan so you would tend to expect a slowly increasing share over time, but I would expect the majority of deletion nominations come in the first weeks and then it&#8217;s pretty much evenly distributed after that. As such, the drop-off seems far too rapid to be explained by <i>just</i> article age.)</p> <p>What we don&#8217;t know is what the overall <i>nomination for deletion</i> rate, including deleted articles, looks like. 
From our data, it could be that pre-2016 male and female articles are nominated at equal rates but more male articles are deleted; or it could be that pre-2016 male and female articles are equally likely to get deleted, but the female articles are nominated more frequently than they should be. Either of these would cause the imbalance. I think this is very much the missing piece of data and I&#8217;d love to see any suggestions for how we can work it out &#8211; perhaps something like trying to estimate gender from the names of deleted articles?</p> <p><b>Update:</b> Magnus has <a href="http://magnusmanske.de/wordpress/?p=613">run some numbers on deleted pages</a>, doing exactly this &#8211; inferring gender from pagenames. Of those which were probably a person, ~2/3 had an inferred gender, and 23% of those were female. This is a remarkably similar figure to the analysis here (~23% of current BLPs female; ~26% of all BLPs which have survived a deletion debate female)</p> <p><b>So in conclusion</b>&#8230;</p> <ul> <li>We know the gender breakdown: skewed male, but growing slowly more balanced over time, and better for living people than historical ones.</li> <li>We know the article lengths; slightly longer for women than men for recent articles, about equal for those created a long time ago.</li> <li>We know that there is <i>something</i> different about the way male and female biographies created before ~2017 experience the deletion process, but we don&#8217;t have clear data to indicate exactly what is going on, and there are multiple potential explanations.</li> <li>We also know that deletion activity seems to be more balanced for articles in both groups created from ~2017 onwards, and that these also have a lower frequency of involvement with the deletion process than might have been expected. It is not clear what the mechanism is here, or if the two factors are directly linked.</li> </ul> <h3>How can you extract this data? 
(Yes, this is very dull)</h3> <p>The first problem was generating the lists of articles and their metadata. The English Wikipedia category system lets us identify &#8220;living people&#8221;, but not gender; Wikidata lets us identify gender (property P21), but not reliably &#8220;living people&#8221;. However, we can creatively use the <a href="http://petscan.wmflabs.org/">petscan</a> tool to get the intersection of a SPARQL gender query + the category. Instructing it to explicitly use Wikipedia (&#8220;enwiki&#8221; in other sources &gt; manual list) and give output as a TSV &#8211; then waiting for about fifteen minutes &#8211; leaves you with a nice clean data dump. Thanks, <a href="http://magnusmanske.de/wordpress/">Magnus</a>!</p> <p>(It&#8217;s worth noting that you can get this data with any characteristic indexed by Wikidata, or any characteristic identifiable through the Wikipedia category schema, but you will need to run a new query for each aspect you want to analyse &#8211; the exported data just has article metadata, none of the Wikidata/category information)</p> <p>The exported files contain three things that are very useful to us: article title, pageid, and length. 
I normalised the files like so:</p> <div class="wp-geshi-highlight-wrap5"><div class="wp-geshi-highlight-wrap4"><div class="wp-geshi-highlight-wrap3"><div class="wp-geshi-highlight-wrap2"><div class="wp-geshi-highlight-wrap"><div class="wp-geshi-highlight"><div class="bash"><pre class="de1"><span class="kw2">grep</span> <span class="br0">&#91;</span><span class="nu0">0</span>-<span class="nu0">9</span><span class="br0">&#93;</span> enwiki_blp_women_from_list.tsv <span class="sy0">|</span> <span class="kw2">cut</span> <span class="re5">-f</span> <span class="nu0">2</span>,<span class="nu0">3</span>,<span class="nu0">5</span> <span class="sy0">&gt;</span> women-noheader.tsv</pre></div></div></div></div></div></div></div> <p>This drops the header line (it&#8217;s the only one with no numeric characters) and extracts only the three values we care about (and conveniently saves about 20MB).</p> <p>This gives us two of the things we want (age and size) but not deletion data. For that, we fall back on inference. Any article that is put through the AFD process gets a new subpage created at &#8220;Wikipedia:Articles for deletion/PAGENAME&#8221;. It is reasonable to infer that if an article has a corresponding AFD subpage, it&#8217;s <i>probably</i> about that specific article. This is not always true, of course &#8211; names get recycled, pages get moved &#8211; but it&#8217;s a reasonable working hypothesis and hopefully the errors are evenly distributed over time. I&#8217;ve racked my brains to see if I could anticipate a noticeable difference here by gender, as this could really complicate the results, but provisionally I think we&#8217;re okay to go with it.</p> <p>To find out if those subpages exist, we turn to <a href="https://dumps.wikimedia.org/enwiki/latest/">the enwiki dumps</a>. Specifically, we want &#8220;enwiki-latest-all-titles.gz&#8221; &#8211; which, as it suggests, is a simple file listing all page titles on the wiki. Extracted, it comes to about 1GB. 
From this, we can extract all the AFD subpages, as so:</p> <div class="wp-geshi-highlight-wrap5"><div class="wp-geshi-highlight-wrap4"><div class="wp-geshi-highlight-wrap3"><div class="wp-geshi-highlight-wrap2"><div class="wp-geshi-highlight-wrap"><div class="wp-geshi-highlight"><div class="bash"><pre class="de1"><span class="kw2">grep</span> <span class="st0">&quot;Articles_for_deletion/&quot;</span> enwiki-latest-all-titles <span class="sy0">|</span> <span class="kw2">cut</span> <span class="re5">-f</span> <span class="nu0">2</span> <span class="sy0">|</span> <span class="kw2">sort</span> <span class="sy0">|</span> <span class="kw2">uniq</span> <span class="sy0">|</span> <span class="kw2">cut</span> <span class="re5">-f</span> <span class="nu0">2</span> <span class="re5">-d</span> <span class="sy0">/</span> <span class="sy0">|</span> <span class="kw2">sort</span> <span class="sy0">|</span> <span class="kw2">uniq</span> <span class="sy0">&gt;</span> afds</pre></div></div></div></div></div></div></div> <p>This extracts all the AFD subpages, removes any duplicates (since eg talkpages are listed here as well), and sorts the list alphabetically. There are about 424,000 of them.</p> <p>Going back to our original list of articles, we want to bin them by age. To a first approximation, <tt>pageid</tt> is sequential with age &#8211; it&#8217;s assigned when the page is first created. There are some big caveats here; for example, a page being created as a redirect and later expanded will have the ID of its initial creation. Pages being deleted and recreated may get a new ID, pages which are merged may end up with either of the original IDs, and some complicated page moves may end up with the original IDs being lost. 
But, for the majority of pages, it&#8217;ll work out okay.</p> <p>To correlate pageID to age, I did a bit of speculative guessing to find an item created on 1 January and 1 July every year back to 2009 (eg <a href="https://en.wikipedia.org/w/index.php?curid=43190000&amp;action=info#Edit_history">pageid 43190000</a> was created at 11am on 1 July 2014). I could then use these to extract the articles corresponding to each period as so:</p> <div class="wp-geshi-highlight-wrap5"><div class="wp-geshi-highlight-wrap4"><div class="wp-geshi-highlight-wrap3"><div class="wp-geshi-highlight-wrap2"><div class="wp-geshi-highlight-wrap"><div class="wp-geshi-highlight"><div class="bash"><pre class="de1">...
<span class="kw2">awk</span> <span class="re5">-F</span> <span class="st_h">'\t'</span> <span class="st_h">'$2 &gt;= 41516000 &amp;&amp; $2 &lt; 43190000'</span> <span class="sy0">&lt;</span> men-noheader.tsv <span class="sy0">&gt;</span> bins<span class="sy0">/</span><span class="nu0">2014</span>-<span class="nu0">1</span>-M
<span class="kw2">awk</span> <span class="re5">-F</span> <span class="st_h">'\t'</span> <span class="st_h">'$2 &gt;= 43190000 &amp;&amp; $2 &lt; 44909000'</span> <span class="sy0">&lt;</span> men-noheader.tsv <span class="sy0">&gt;</span> bins<span class="sy0">/</span><span class="nu0">2014</span>-<span class="nu0">2</span>-M
...</pre></div></div></div></div></div></div></div> <p>This finds all items with a pageid (in column #2 of the file) between the specified values, and copies them into the relevant bin. 
Run once for men and once for women.</p> <p>Then we can run a short report, along these lines (the original had loops in it):</p> <div class="wp-geshi-highlight-wrap5"><div class="wp-geshi-highlight-wrap4"><div class="wp-geshi-highlight-wrap3"><div class="wp-geshi-highlight-wrap2"><div class="wp-geshi-highlight-wrap"><div class="wp-geshi-highlight"><div class="bash"><pre class="de1"> <span class="kw2">cut</span> <span class="re5">-f</span> <span class="nu0">1</span> bins<span class="sy0">/</span><span class="nu0">2014</span>-<span class="nu0">1</span>-M <span class="sy0">|</span> <span class="kw2">sort</span> <span class="sy0">&gt;</span> temp-M
<span class="kw3">echo</span> <span class="re5">-e</span> <span class="nu0">2014</span>-<span class="nu0">1</span>-M<span class="st0">&quot;<span class="es1">\t</span>M<span class="es1">\t</span>&quot;</span><span class="sy0">`</span><span class="kw2">cat</span> bins<span class="sy0">/</span><span class="nu0">2014</span>-<span class="nu0">1</span>-M <span class="sy0">|</span> <span class="kw2">wc</span> -l<span class="sy0">`</span><span class="st0">&quot;<span class="es1">\t</span>&quot;</span><span class="sy0">`</span><span class="kw2">awk</span> <span class="st_h">'{ total += $3; count++ } END { print total/count }'</span> bins<span class="sy0">/</span><span class="nu0">2014</span>-<span class="nu0">1</span>-M<span class="sy0">`</span><span class="st0">&quot;<span class="es1">\t</span>&quot;</span><span class="sy0">`</span><span class="kw2">comm</span> <span class="re5">-1</span> <span class="re5">-2</span> temp-M afds <span class="sy0">|</span> <span class="kw2">wc</span> -l<span class="sy0">`</span> <span class="sy0">&gt;</span><span class="sy0">&gt;</span> report.tsv</pre></div></div></div></div></div></div></div> <p>This adds a line to the file <tt>report.tsv</tt> with (in order) the name of the bin, the number of entries in it, the mean value of the <tt>length</tt> column, and a count of the number which 
also match names in the <tt>afds</tt> file. (The use of the <tt>temp-M</tt> file is to deal with the fact that the comm tool needs properly sorted input).</p> <p>After that, generating the data is lovely and straightforward &#8211; drop the report into a spreadsheet and play around with it.</p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://www.generalist.org.uk/blog/2019/gender-and-deletion-on-wikipedia/" rel="bookmark"><time class="entry-date published" datetime="2019-05-06T21:36:49+01:00">May 6, 2019</time><time class="updated" datetime="2022-08-14T22:07:02+01:00">August 14, 2022</time></a></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://www.generalist.org.uk/blog/authors/andrew/" rel="category tag">Andrew</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://www.generalist.org.uk/blog/tags/data/" rel="tag">data</a>, <a href="https://www.generalist.org.uk/blog/tags/statistics/" rel="tag">statistics</a>, <a href="https://www.generalist.org.uk/blog/tags/wikidata/" rel="tag">wikidata</a>, <a href="https://www.generalist.org.uk/blog/tags/wikipedia/" rel="tag">wikipedia</a></span><span class="comments-link"><a href="https://www.generalist.org.uk/blog/2019/gender-and-deletion-on-wikipedia/#comments">3 Comments<span class="screen-reader-text"> on Gender and deletion on Wikipedia</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-1578 --> <article id="post-1540" class="post-1540 post type-post status-publish format-gallery has-post-thumbnail hentry category-andrew tag-parliament tag-wikidata tag-wikipedia post_format-post-format-gallery"> <a class="post-thumbnail" href="https://www.generalist.org.uk/blog/2019/george-ernest-spero-the-vanishing-mp/" aria-hidden="true"> <img width="468" height="227" 
src="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/spero.png" class="attachment-post-thumbnail size-post-thumbnail wp-post-image" alt="George Ernest Spero, the vanishing MP" decoding="async" loading="lazy" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/spero.png 468w, https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/spero-300x146.png 300w" sizes="(max-width: 468px) 100vw, 468px" /> </a> <header class="entry-header"> <h2 class="entry-title"><a href="https://www.generalist.org.uk/blog/2019/george-ernest-spero-the-vanishing-mp/" rel="bookmark">George Ernest Spero, the vanishing MP</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p>As part of the ongoing <a href="https://www.wikidata.org/wiki/Wikidata:WikiProject_British_Politicians">Wikidata MPs project</a>, I&#8217;ve come across a number of oddities &#8211; MPs who may or may not have been the same person, people who essentially disappear after they leave office, and so on. Tracking these down can turn into quite a complex investigation.</p> <p>One such was George Ernest Spero, Liberal MP for Stoke Newington 1923-24, then Labour MP for Fulham West 1929-30. His career was cut short by his resignation in April 1930; shortly afterwards, he was declared bankrupt. Spero had already left the country for America, and nothing more was heard of him. The main ambiguity was when he died &#8211; various sources claimed either 1960 or 1976, but without it being clear which was more reliable, or any real details on what happened to him after 1930. 
In correspondence with Stephen Lees, who has been working on an incredibly useful comprehensive record of MPs&#8217; death-dates, I did some work on it last year and eventually confirmed the 1960 date; I&#8217;ve just rediscovered the notes from this and since it was an interesting little mystery, thought I&#8217;d post them.</p> <h4>George Spero, MP and businessman</h4> <p>So, let&#8217;s begin with what we know about him up to the point at which he vanished.</p> <p>George Ernest Spero was born in 1894. He began training at the Royal Dental Hospital in 1912, and served in the RNVR as a surgeon during the First World War. He had two brothers who also went into medicine; Samuel was a dentist in London (and apparently also went bankrupt, in 1933), while Leopold was a surgeon or physician (trained at St. Mary&#8217;s, RNVR towards the end of WWI, still in practice in the 1940s). All of this was reasonably straightforward to trace, although oddly George&#8217;s RNVR service records seem to be missing from the National Archives.</p> <p>After the war, he married Rina Ansley (nee Rina Ansbacher, born 14 March 1902) in 1922; her father was a wealthy German-born stockbroker, resident in Park Lane, who had naturalised in 1918. They had two daughters, Rachel Anne (b. 1923) and Betty Sheila (b. 1928). After his marriage, Spero went into politics in Leicester, where he seems to have been living, and stood for Parliament in the 1922 general election. 
The <em>Nottingham Journal</em> described him as for &#8220;the cause of free, unfettered Liberalism &#8230; Democratic in conviction, he stands for the abolition of class differences and for the co-operation of capital and labour.&#8221; However, while this was well-tailored to appeal to the generally left-wing voters of Leicester West, and his war record was well-regarded, the moderate vote was split between the Liberal and National Liberal candidates, with Labour taking the seat.</p> <p>The Conservative government held another election in 1923, aiming to strengthen a small majority (does this sound familiar?), and Spero &#8211; now back in London &#8211; contested Stoke Newington, then a safe Conservative seat, again as a left Liberal. With support from Labour, who did not contest the seat, Spero ran a successful campaign and unseated the sitting MP. He voted in support of the minority Labour government on a number of occasions, and was one of the small number of Liberal rebels who supported them in the final no-confidence vote. However, this was not enough to prevent Labour fielding a candidate against him in 1924; the Conservative candidate took 57% of the vote, with the rest split evenly between Labour and Liberal.</p> <p>Spero drifted from the Liberals into the Labour Party, probably a more natural home for his politics, joining it in 1925. By the time of the next general election, in May 1929, he had become the party&#8217;s candidate for Fulham West, winning it from the Conservatives with 45% of the vote.</p> <p>He was a moderately active Government backbencher for the next few months, including being sent as a visitor to Canada during the recess in September 1929, travelling with his wife. 
While overseas, she caused some minor amusement to the British papers after reporting the loss of a £6,000 pearl necklace &#8211; they were delighted to <a href="https://www.britishnewspaperarchive.co.uk/viewer/bl/0001480/19290928/068/0005" target="_blank" rel="noopener noreferrer">report this</a> alongside &#8220;socialist MP&#8221;. He was last recorded voting in Hansard in December, and did not appear in 1930. In February and March he was paired for votes, with a newspaper report in <a href="https://www.britishnewspaperarchive.co.uk/viewer/bl/0002026/19300307/034/0003" target="_blank" rel="noopener noreferrer">early March</a> stating that he had been advised to take a rest to avoid a complete nervous breakdown about the start of the year, and had gone to the South of France, but &#8220;hopes to return to Parliament before the month is out&#8221;. However, on 9th April he formally took the Chiltern Hundreds (it is interesting that <a href="https://www.britishnewspaperarchive.co.uk/viewer/bl/0000687/19300409/251/0004" target="_blank" rel="noopener noreferrer">a newspaper report</a> suggested his local party would choose whether to accept the resignation).</p> <p>However, <a href="https://www.britishnewspaperarchive.co.uk/viewer/bl/0000437/19300606/104/0007" target="_blank" rel="noopener noreferrer">things were moving quickly elsewhere</a>. A case was brought against him in the High Court for £10,000, arising from his sale of a radio company in 1928-29. During the court hearing, at the end of May, it was discovered that a personal cheque for £4000 given by Spero to guarantee the company&#8217;s debts had been presented to his bank in October 1929, but was not honoured. He had at this point claimed to be suing the company for £20,000, buying six months legal delay, sold his furniture, and &#8211; apparently &#8211; left the country for America. 
Bankruptcy proceedings followed later that year (where he was <a href="https://www.britishnewspaperarchive.co.uk/viewer/bl/0000321/19301007/003/0001" target="_blank" rel="noopener noreferrer">again stated</a> to be in America) and, unsurprisingly, his creditors seem to have received very little.</p> <p>At this point, the British trail and the historic record draw to a gentle close. But what happened to him?</p> <p>The National Portrait Gallery gave his death as 1960, while an entry in <i>The Palgrave Dictionary of Anglo-Jewish History</i> reported that they had traced his death to 1976 in Belgrade, Yugoslavia (where, as a citizen, it was registered with the US embassy). Unfortunately, it did not go into any detail about how they worked this out, and this just heightened the mystery &#8211; if it was true, how had a disgraced ex-MP ended up in Yugoslavia on a US passport three decades later? And, conversely, who was it had died in 1960?</p> <h4>George Spears, immigrant and doctor</h4> <p>We know that Spero went to America in 1929-30; that much seemed to be a matter of common agreement. Conveniently, the American census was carried out in April 1930, and the papers are available. On 18 April, he was living with his family in Riverside Drive, upper Manhattan; all the names and ages line up, and Spero is given as a medical doctor, actively working. 
Clearly they were reasonably well off, as they had a live-in maid, and it seems to be quite a nice area.</p> <p><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_19-51-52.png"><img loading="lazy" decoding="async" class="alignnone size-medium wp-image-1545" src="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_19-51-52-300x57.png" alt="" width="300" height="57" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_19-51-52-300x57.png 300w, https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_19-51-52.png 684w" sizes="(max-width: 300px) 100vw, 300px" /></a></p> <p>In 1937, he petitioned for American citizenship in California, noting that he had lived there since March 1933. As part of the process, he formally notified that he intended to change his name to <strong>George Ernest Spears</strong>. (He also gave his birthdate as 2 March 1894, of which more later).</p> <p><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_20-06-54.png"><img loading="lazy" decoding="async" class="alignnone size-medium wp-image-1546" src="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_20-06-54-300x49.png" alt="" width="300" height="49" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_20-06-54-300x49.png 300w, https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_20-06-54.png 717w" sizes="(max-width: 300px) 100vw, 300px" /></a></p> <p>While we can be reasonably confident these are the same man due to the names and dates of the family, the match is very neatly confirmed by the fact that the citizenship papers <em>have a photograph</em>, which can be compared to an <a href="https://www.britishnewspaperarchive.co.uk/viewer/bl/0001897/19211216/063/0003" target="_blank" rel="noopener noreferrer">older 
newspaper one</a>. There is fifteen years&#8217; difference, but we can see the similarities between the prospective MP of 27 and the older man of 43.</p> <p><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/spero.png"><img loading="lazy" decoding="async" class="alignnone size-medium wp-image-1549" src="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/spero-300x146.png" alt="" width="300" height="146" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/spero-300x146.png 300w, https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/spero.png 468w" sizes="(max-width: 300px) 100vw, 300px" /></a></p> <p>George Spears, with the same family, then reappears in the 1940 census, back in Riverside Drive. He is now apparently practicing as an optician, and doing well – income upwards of $6000. Finally, we find a draft record for him living in Huntington, Long Island at some point in 1942. Note his signature here, which is visibly the same hand as in 1937, except &#8220;E. Spears&#8221; not &#8220;Ernest Spero&#8221;.</p> <p><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_21-38-59.png"><img loading="lazy" decoding="async" class="alignnone size-medium wp-image-1550" src="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_21-38-59-300x86.png" alt="" width="300" height="86" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_21-38-59-300x86.png 300w, https://www.generalist.org.uk/blog/wp-content/uploads/2018/12/Screenshot_2018-12-05_21-38-59.png 462w" sizes="(max-width: 300px) 100vw, 300px" /></a></p> <p>It is possible he reverted to his old name for a while – there are occasional appearances of a Dr. George Spero, optometrist, in the New York phone books between the 1940s and late 1950s. 
Not enough detail to be sure either way, though.</p> <p>So at this point, we can trace Spero/Spears continuously from 1930 to 1942. And then nothing, until on 7 January 1960, George E. Spears, born 2 March 1894, died in California. Some time later, in June 1976, George Spero, born 11 April 1894, died in Belgrade, Yugoslavia, apparently a US citizen. Which one was our man?</p> <p>The former seemed more likely, but can we prove it? The death details come from an index, which gives a mother&#8217;s maiden name of &#8220;Robinson&#8221; &#8211; unfortunately the full certificate isn&#8217;t there and I did not feel up to trying to track down a paper Californian record to see what else it said.</p> <p>If we return to the UK, we can find George Spero in the 1901 census in Dover, with his parents Isidore Sol [Solomon], a &#8216;dental mechanic&#8217;, and Rachel, maiden name unknown. The family later moved to London, the parents naturalised, Isidore died in 1925 &#8211; and probate goes to &#8220;George Ernest Spero, physician&#8221;, which seems to confirm that this is definitely the right family and not a different George Spero. The 1901 census notes that two of the older children were born in Dublin, so we can trace them in the Irish records. Here we have an &#8220;Israel S Spero&#8221; marrying Rachel Robinson in 1884, and a subsequent child born to Solomon Israel Spero and Rachel Spero née Robinson. There are a few other Speros or Spiros appearing in Dublin, but none married around the right time, and none with such similar names. <em>If</em> Israel Solomon Spero is the same as Isidore Solomon Spero, this all ties up very neatly.</p> <p>It leaves open the mystery, however, of who died in Yugoslavia. It seems likely this was a completely different man (who had not changed his name), but I have completely failed to trace anything about him. 
A pity &#8211; it would have been nice to definitively close off that line of enquiry.</p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="entry-format"><span class="screen-reader-text">Format </span><a href="https://www.generalist.org.uk/blog/type/gallery/">Gallery</a></span><span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://www.generalist.org.uk/blog/2019/george-ernest-spero-the-vanishing-mp/" rel="bookmark"><time class="entry-date published" datetime="2019-03-17T15:04:10+00:00">March 17, 2019</time><time class="updated" datetime="2019-03-17T16:38:50+00:00">March 17, 2019</time></a></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://www.generalist.org.uk/blog/authors/andrew/" rel="category tag">Andrew</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://www.generalist.org.uk/blog/tags/parliament/" rel="tag">parliament</a>, <a href="https://www.generalist.org.uk/blog/tags/wikidata/" rel="tag">wikidata</a>, <a href="https://www.generalist.org.uk/blog/tags/wikipedia/" rel="tag">wikipedia</a></span><span class="comments-link"><a href="https://www.generalist.org.uk/blog/2019/george-ernest-spero-the-vanishing-mp/#comments">4 Comments<span class="screen-reader-text"> on George Ernest Spero, the vanishing MP</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-1540 --> <article id="post-1508" class="post-1508 post type-post status-publish format-standard hentry category-uncategorized tag-history tag-wikidata"> <header class="entry-header"> <h2 class="entry-title"><a href="https://www.generalist.org.uk/blog/2018/our-man-in-havana-or-q56761118/" rel="bookmark">Our man in Havana (or, Q56761118)</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p>Has it really been a year since I posted here? Oh, dear. Well. 
So, this Friday/Saturday I went to <a href="https://www.eventbrite.co.uk/e/who-was-our-man-in-havana-tickets-49384851420#">the FCO&#8217;s hackathon event</a> &#8211; wonderfully titled &#8220;Who Was Our Man In Havana?&#8221; &#8211; to have a play with a dataset of British diplomats.</p> <p>My goal was to try and synch this up with Wikidata in some way &#8211; there were obviously some overlaps with <a href="https://www.wikidata.org/wiki/Wikidata:WikiProject_British_Politicians">the MPs project</a>, but given how closely tied the diplomatic service has been into the establishment, it seemed likely there would be a lot of overlap. The objective of the event was to produce some kind of visualisation/interface, so after a bit of discussion with my team-mates we decided to get the data cleaned up, import some into Wikidata, and pull it out again in an enriched fashion.</p> <p>The data cleaning was a bit of a challenge. <a href="https://github.com/percevalve">Sev</a> and <a href="https://github.com/motatoes">Mohammed</a>, my team-mates, did excellent work hacking away at the XML and eventually produced a nice, elegantly-parsed version of the source data.</p> <p>I uploaded this into Magnus&#8217;s <a href="http://tools.wmflabs.org/mix-n-match/?">mix-and-match</a> tool, using a notional ID number which we could tie back to the records. Hammering away at mix-and-match that evening got me about 400 initial matches to work with. While I was doing this, Sev and Mohammed expanded the XML parsing to include all the positions held plus dates, tied back to the notional IDs in mix-and-match.</p> <p>On Saturday, I wrote a script to pull down the mix-and-match records, line them up with the expanded parsing data, and put that into a form that could be used for QuickStatements. 
Thankfully, someone had already established a clear data model for diplomatic positions, so I was able to build on that to work out how to handle the positions without having to invent it from scratch.</p> <p>The upload preparation was necessarily a messily manual process &#8211; I ended up compromising with <a href="https://github.com/generalist/fcohack">a script</a> generating a plain TSV which I could feed into a spreadsheet and then manually look up (eg) the relevant Wikidata IDs for positions. If I&#8217;d had more time we could have put together something which automatically looked up position IDs in a table and then produced a formatted sheet (or even sent it out through something like <a href="https://github.com/maxlath/wikidata-cli">wikidata-cli</a>), but I wanted a semi-manual approach for this stage so I could keep an eye on the data and check it was looking sensible. (Thanks at this point also to <a href="https://twitter.com/Tagishsimon">@tagishsimon</a>, who helped with the matching and updating on mix-and-match.) And then I started feeding it in, lump by lump. 
<a href="https://www.wikidata.org/wiki/Q7599600#P39">Behold, success</a>!</p> <p><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2018/10/Screenshot_2018-10-01_20-11-32.png"><img loading="lazy" decoding="async" src="https://www.generalist.org.uk/blog/wp-content/uploads/2018/10/Screenshot_2018-10-01_20-11-32.png" alt="" width="520" height="326" class="alignnone size-full wp-image-1515" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2018/10/Screenshot_2018-10-01_20-11-32.png 520w, https://www.generalist.org.uk/blog/wp-content/uploads/2018/10/Screenshot_2018-10-01_20-11-32-300x188.png 300w" sizes="(max-width: 520px) 100vw, 520px" /></a></p> <p>While I was doing this, Mohammed assembled a <a href="https://github.com/percevalve/fco_xml">front-end display</a>, which used vue.js to format and display a set of ambassadors drawn from <a href="https://query.wikidata.org/#%23%20Wikidata%20entries%20for%20British%20ambassadors%20and%20high%20commissioners%0A%23%20all%20people%20who%20held%20at%20least%20one%20such%20position%0A%23%20one%20line%20per%20position%20held%20%28so%20many%20people%20appear%20repeatedly%29%0A%23%20start%2Fend%20dates%20for%20that%20particular%20position%0A%0Aselect%20distinct%20%3Fperson%20%3FpersonLabel%20%3FpositionLabel%20%3Fstartyear%20%3Fendyear%20%3Fbirthyear%20%3Fdeathyear%20%3Fimage%20%3FotherpositionLabel%20%3Fotherstartyear%20%3Fotherendyear%20where%0A%7B%0A%20%20%7B%20%3Fposition%20wdt%3AP31%20wd%3AQ18115939%20.%20%7D%20union%20%7B%20%3Fposition%20wdt%3AP31%20wd%3AQ56760832%20%7D%20.%20%23%20position%20is%20UK%20ambassador%20or%20high%20commissioner%0A%20%20%20%20%0A%20%20%20%20%3Fperson%20p%3AP39%20%3FpositionStatement%20.%20%3FpositionStatement%20ps%3AP39%20%3Fposition%20.%20%23%20find%20positions%20they%20held%0A%20%20%20%20%3Fperson%20wdt%3AP18%20%3Fimage%20.%20%0A%20%20%20%20optional%20%7B%20%3FpositionStatement%20pq%3AP580%20%3Fstart%20.%20bind%28year%28%3Fstart%29%20as%20%3Fstartyear%29%20%7D%20%23%20id%20
start%20year%0A%20%20%20%20optional%20%7B%20%3FpositionStatement%20pq%3AP582%20%3Fend%20.%20bind%28year%28%3Fend%29%20as%20%3Fendyear%29%20%7D%20%23%20id%20end%20year%0A%20%20%20%20optional%20%7B%20%3Fperson%20wdt%3AP569%20%3Fborn%20.%20bind%28year%28%3Fborn%29%20as%20%3Fbirthyear%29%20%7D%20%23%20id%20start%20year%0A%20%20%20%20optional%20%7B%20%3Fperson%20wdt%3AP570%20%3Fdied%20.%20bind%28year%28%3Fdied%29%20as%20%3Fdeathyear%29%20%7D%20%23%20id%20end%20year%0A%20%20%20%20optional%20%7B%20%3Fperson%20p%3AP39%20%3FotherpositionStatement%20.%20%3FotherpositionStatement%20ps%3AP39%20%3Fotherposition%20.%20%0A%20%20%20%20%20%20%20%20%20%20%20%20%20%20filter%20not%20exists%20%7B%20%3Fotherposition%20wdt%3AP31%20wd%3AQ18115939%20.%20%7D%20%0A%20%20%20%20%20%20%20%20%20%20%20%20%20%20filter%20not%20exists%20%7B%20%3Fotherposition%20wdt%3AP31%20wd%3AQ56760832%20.%20%7D%20%0A%20%20%20%20%20%20%20%20%20%20%20%20%20%20filter%20not%20exists%20%7B%20%3FotherpositionStatement%20ps%3AP39%20wd%3AQ121998%20.%20%7D%0A%20%20%20%20%20%20%20%20%20%20%20%20%20%20optional%20%7B%20%3FotherpositionStatement%20pq%3AP580%20%3Fotherstart%20.%20bind%28year%28%3Fotherstart%29%20as%20%3Fotherstartyear%29%20%7D%0A%20%20%20%20%20%20%20%20%20%20%20%20%20%20optional%20%7B%20%3FotherpositionStatement%20pq%3AP580%20%3Fotherend%20.%20bind%28year%28%3Fotherend%29%20as%20%3Fotherendyear%29%20%7D%0A%20%20%20%20%20%20%20%20%20%20%20%20%20%7D%0A%0A%20%20SERVICE%20wikibase%3Alabel%20%7B%20bd%3AserviceParam%20wikibase%3Alanguage%20%22%5BAUTO_LANGUAGE%5D%2Cen%22.%20%7D%0A%7D">a Wikidata SPARQL query</a>. 
It concentrated on a couple of additional things to demonstrate the enrichment available from Wikidata &#8211; a picture and some notes of other non-ambassadorial positions they&#8217;d held.</p> <p>To go alongside this, as a demonstration of other linkages that weren&#8217;t exposed in our tool, I knocked up a couple of quick visualisations through the Wikidata query tool: a map of <a href="http://tinyurl.com/yd254e32">where British ambassadors to Argentina were born</a> (mainly the Home Counties and India!), or a chart of <a href="http://tinyurl.com/ya29gznt">where ambassadors/High Commissioners were educated</a> (Eton, perhaps unsurprisingly, making a good showing). It&#8217;s remarkable how useful the query service is for whipping up this kind of visualisation.</p> <p><a href="https://www.generalist.org.uk/blog/wp-content/uploads/2018/10/image1-e1538423190603.jpeg"><img loading="lazy" decoding="async" src="https://www.generalist.org.uk/blog/wp-content/uploads/2018/10/image1-e1538423190603-225x300.jpeg" alt="" width="225" height="300" class="alignright size-medium wp-image-1522" srcset="https://www.generalist.org.uk/blog/wp-content/uploads/2018/10/image1-e1538423190603-225x300.jpeg 225w, https://www.generalist.org.uk/blog/wp-content/uploads/2018/10/image1-e1538423190603-768x1024.jpeg 768w" sizes="(max-width: 225px) 100vw, 225px" /></a></p> <p>We presented this on Saturday afternoon and it went down well &#8211; we won a prize! A bottle of wine and &#8211; very appropriately &#8211; mugs with <a href="https://en.wikipedia.org/wiki/Palmerston_(cat)">the famed Foreign Office cat</a> on them. A great weekend, even if it did mean an unreasonably early Saturday start!</p> <p>So, some thoughts on the event in conclusion:</p> <ul> <li>It was very clear how well the range of skills worked at an event like this. 
I don&#8217;t think any of us could have produced the result on our own.</li> <li>A lot of time &#8211; not just our group, but everyone &#8211; was spent parsing and massaging the (oddly structured) XML. Had the main lists been available as a CSV/TSV, this might have been a lot quicker. I certainly wouldn&#8217;t have been able to get anywhere with it myself.</li> <li>On the data quality note, we were lucky that the names of records were more or less unique strings, but an ID number for each record inserted when the original XML was generated might have saved a bit of time.</li> <li>A handful of people could go from a flat file of names, positions, dates to about a thousand name-position pairs on Wikidata, some informative queries, and a prototype front-end viewer with a couple of days of work, and some of that could have been bypassed with cleaner initial data. This is really promising.</li> </ul> <p>And <a href="https://www.wikidata.org/wiki/Wikidata:WikiProject_British_Politicians/ambassadors">on the Wikidata side</a>, there are a few modelling questions this has thrown up:</p> <ul> <li>I took the decision not to change postings based on the diplomatic rank &#8211; eg someone who was officially the &#8220;Minister to Norway&#8221; (1905-1942) conceptually held the same post as someone who was &#8220;Ambassador to Norway&#8221; (1942-2018). If desired, we can represent the rank as a qualifier on the item (eg subject has role: &#8220;chargé d&#8217;affaires&#8221;). This seemed to make the most sense &#8211; &#8220;ambassadors with a small &#8216;a&#8217;&#8221;.</li> <li>The exception to this is High Commissioners, who are currently modelled parallel to Ambassadors &#8211; same hierarchy but in parallel. 
This lets us find all the HCs without simply treating them as &#8220;Ambassadors with a different job title&#8221;.<br /> <br />However, this may not be a perfect approach as some HCs changed to Ambassadors and back again (eg Zimbabwe) when a country leaves/rejoins the Commonwealth. At the moment these are modelled by picking one for a country and sticking to it, with the option of qualifiers as above, but a better approach might be needed in the long run.</li> <li>Dates as given are the dates of service. A few times &#8211; especially in the 19th century when journeys were more challenging &#8211; an ambassador was appointed but did not proceed overseas. These have been imported with no start-end dates, but this isn&#8217;t a great solution. Arguably they could have a start/end date in the same year and a qualifier to say they did not take up the post; alternatively, you could make a case that they should not be listed as ambassadors at all.</li> </ul> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://www.generalist.org.uk/blog/2018/our-man-in-havana-or-q56761118/" rel="bookmark"><time class="entry-date published" datetime="2018-10-01T20:47:43+01:00">October 1, 2018</time><time class="updated" datetime="2018-10-01T21:48:57+01:00">October 1, 2018</time></a></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://www.generalist.org.uk/blog/authors/uncategorized/" rel="category tag">Uncategorized</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://www.generalist.org.uk/blog/tags/history/" rel="tag">history</a>, <a href="https://www.generalist.org.uk/blog/tags/wikidata/" rel="tag">wikidata</a></span><span class="comments-link"><a href="https://www.generalist.org.uk/blog/2018/our-man-in-havana-or-q56761118/#respond">Leave a comment<span class="screen-reader-text"> on Our man in Havana 
(or, Q56761118)</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-1508 --> <article id="post-1433" class="post-1433 post type-post status-publish format-standard hentry category-andrew tag-wikidata tag-wikipedia"> <header class="entry-header"> <h2 class="entry-title"><a href="https://www.generalist.org.uk/blog/2016/history-of-parliament-and-wikidata-the-first-round-complete/" rel="bookmark">History of Parliament and Wikidata &#8211; the first round complete</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p>Back in January, I wrote up some things I was aiming to do this year, including:</p> <blockquote><p>Firstly, I’d like to clear off the History of Parliament work on Wikidata. I haven’t really written this up yet (maybe that’s step 1.1) but, in short, I’m trying to get every MP in the History of Parliament database listed and crossreferenced in Wikidata. At the moment, we have around 5200 of them listed, out of a total of 22200 – so we’re getting there. (Raw data here.) Finding the next couple of thousand who’re listed, and mass-creating the others, is definitely an achievable task.</p></blockquote> <p>Well, seven months later, here&#8217;s where it stands:</p> <ul> <li>9,372 of a total 21,400 (43.7%) History of Parliament entries have been matched to records for people in Wikidata. <li>These 9,372 entries represent 7,257 people &#8211; 80 have entries in three HoP volumes, and 1,964 in two volumes. (This suggests that, when complete, we will have about 16,500 people for those initial 21,400 entries &#8211; so maybe we&#8217;re actually over half-way there.) <li>These are crossreferenced to a lot of other identifiers. 1,937 of our 7,257 people (26.7%) are in the <i>Oxford Dictionary of National Biography</i>, 1,088 (15%) are in the National Portrait Gallery database, and 2,256 (31.1%) are linked to their speeches in the digital edition of Hansard. 
There is <a href="http://www.generalist.org.uk/wikidata/">a report generated each night</a> crosslinking various interesting identifiers. <li><i>Every</i> MP in the 1820-32 volume (1,367 of them) is now linked and identified, and the 1790-1820 volume is now around 85% complete. (This explains the high showing for Hansard, which covers 1805 onwards) <li>The metadata for these is still limited &#8211; a lot more importing work to do &#8211; but in some cases pretty decent; 94% of the 1820-32 entries have a date of death, for example. </ul> <p>Of course, there&#8217;s a lot more still to do &#8211; more metadata to add, more linkages to make, and so on. It still does not have any reasonable data linking MPs to constituencies, which is a major gap (but perhaps one that can be filled semi-automatically using the HoP/Hansard links and a clever script).</p> <p>But as a proof of concept, I&#8217;m very happy with it. Here&#8217;s some queries playing with the (1820-32) data:</p> <ul> <li>There are <a href="http://tinyurl.com/howvw8r">990 MPs with an article about them in at least one language/WM project</a>. Strikingly, ten of these <i>don&#8217;t</i> have an English Wikipedia article (yet). The most heavily written-about MP is &#8211; to my surprise &#8211; David Ricardo, with articles in 67 Wikipedias. (The next three are Peel, Palmerston, and Edward Bulwer-Lytton). <li>303 of the 1,367 MPs (22.1%) have a recorded link to at least one other person in Wikidata by a close family relationship (parent, child, spouse, sibling) &#8211; there are 803 links, to 547 unique people &#8211; 108 of whom are also in the 1820-32 MPs list, and 439 of whom are from elsewhere in Wikidata. (I expect this number to rise dramatically as more metadata goes in). 
<li>The longest-surviving pre-Reform MP (of the 94% indexed by deathdate, anyway) was John Savile, later Earl of Mexborough, who made it to August 1899&#8230; <li>Of <a href="http://tinyurl.com/zedvca9">the 360 with a place of education listed</a>, the most common is Eton (104), closely followed by Christ Church, Oxford (97) &#8211; there is, of course, substantial overlap between them. It&#8217;s impressive to see just how far we&#8217;ve come. No-one would ever expect to see anything like that for Parliament today, would we. <li>Of the 1,185 who&#8217;ve had first name indexed by Wikidata so far, the most popular is John (14.4%), then William (11.5%), Charles (7.5%), George (7.4%), and Henry (7.2%): <p><iframe loading="lazy" width="500" height="500" src="https://query.wikidata.org/embed.html#%23Popular%20names%20among%20MPs%0A%23defaultView%3ABubbleChart%0ASELECT%20%3Fname%20%3FnameLabel%20%3Fcount%20WHERE%20%7B%0A%20%20%7B%0A%20%20%20%20SELECT%20%3Fname%20%28COUNT%28%3Fperson%29%20AS%20%3Fcount%29%20WHERE%20%7B%0A%20%20%20%20%20%20%3Fperson%20wdt%3AP1614%20%3Fhop%20.%20%0A%20%20%20%20%20%20%3Fperson%20wdt%3AP735%20%3Fname.%0A%09%20%20FILTER%28STRSTARTS%28%3Fhop%2C%20%221820%22%29%29.%0A%20%20%20%20%7D%0A%20%20%20%20GROUP%20BY%20%3Fname%0A%20%20%7D%0A%20%20SERVICE%20wikibase%3Alabel%20%7B%20bd%3AserviceParam%20wikibase%3Alanguage%20%22en%22.%20%7D%0A%7D%0AORDER%20BY%20DESC%28%3Fcount%29%0ALIMIT%2050"></iframe></p> <li>A map of the (currently) 154 MPs whose place of death has been imported: <p><iframe loading="lazy" width="500" height="500" 
src="https://query.wikidata.org/embed.html#%23MPs%20in%20the%201820-32%20HoP%20with%20known%20deathplace%0ASELECT%20%3Fitem%20%3FitemLabel%20%3FdeathplaceLabel%20%3Fcoords%0AWHERE%20%0A%7B%0A%09%3Fitem%20wdt%3AP1614%20%3Fhop%20.%0A%20%20%20%20%3Fitem%20wdt%3AP20%20%3Fdeathplace%20.%0A%20%20%20%20%23FILTER%20NOT%20EXISTS%20%7B%20%3Fdeathplace%20wdt%3AP31%20wd%3AQ3336843%20.%20%7D%20%23%20these%20two%20omit%20country-level%20records%0A%20%20%20%20%23FILTER%20NOT%20EXISTS%20%7B%20%3Fdeathplace%20wdt%3AP31%20wd%3AQ6256%20.%20%7D%20%23%20these%20two%20omit%20country-level%20records%0A%20%20%20%20%3Fdeathplace%20wdt%3AP625%20%3Fcoords%20.%0A%20%20%20%20SERVICE%20wikibase%3Alabel%20%7B%20bd%3AserviceParam%20wikibase%3Alanguage%20%22en%22.%20%7D%0A%09FILTER%28STRSTARTS%28%3Fhop%2C%20%221820%22%29%29.%0A%7D%0A%23defaultView%3AMap"></iframe> </ul> <p>All these are of course provisional, but it makes me feel I&#8217;m definitely on the right track!</p> <hr> <p>So, you may be asking, what can I do to help? Why, thankyou, that&#8217;s very kind&#8230;</p> <ul> <li>First of all, <a href="http://www.generalist.org.uk/wikidata/hop-links.txt">this is the master list</a>, updated every night, of as-yet-unmatched HoP entries. Grab one, load it up, search Wikidata for a match, and add it (property <a href="https://www.wikidata.org/wiki/Property:P1614">P1614</a>). Bang, one more down, and we&#8217;re 0.01% closer to completion&#8230; <li>It&#8217;s not there? (About half to two thirds probably won&#8217;t be). You can create an item manually, or you can set it aside to create a batch of them later. I wrote a <a href="https://github.com/generalist/wikidata-hop/blob/master/hopcreate">fairly basic bash script</a> to take a spreadsheet of HoP identifiers and basic metadata and prepare it for bulk-item-creation on Wikidata. 
<li>Or you could help sanitise some of the metadata &#8211; here&#8217;s some interesting edge cases: <ul> <li><a href="http://tinyurl.com/hkcy25z">This list</a> is ~680 items who probably have a death date (the HoP slug ends in a number), but who don&#8217;t currently have one in Wikidata. <li><a href="http://tinyurl.com/ja9gclk">This list</a> is ~540 people who are titled &#8220;Honourable&#8221; &#8211; and so are almost certainly the sons of noblemen, themselves likely to be in Wikidata &#8211; but who don&#8217;t have a link to their father. <a href="http://tinyurl.com/zhsrt8c">This list</a> is the same, but for &#8220;Lord&#8221;, and <a href="http://tinyurl.com/hemhfg6">this list</a> has all the apparently fatherless men who were the 2nd through 9th holders of a title&#8230; </ul> </ul> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://www.generalist.org.uk/blog/2016/history-of-parliament-and-wikidata-the-first-round-complete/" rel="bookmark"><time class="entry-date published" datetime="2016-08-14T21:55:19+01:00">August 14, 2016</time><time class="updated" datetime="2016-08-14T22:49:01+01:00">August 14, 2016</time></a></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://www.generalist.org.uk/blog/authors/andrew/" rel="category tag">Andrew</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://www.generalist.org.uk/blog/tags/wikidata/" rel="tag">wikidata</a>, <a href="https://www.generalist.org.uk/blog/tags/wikipedia/" rel="tag">wikipedia</a></span><span class="comments-link"><a href="https://www.generalist.org.uk/blog/2016/history-of-parliament-and-wikidata-the-first-round-complete/#comments">3 Comments<span class="screen-reader-text"> on History of Parliament and Wikidata &#8211; the first round complete</span></a></span> </footer><!-- .entry-footer --> </article><!-- 
#post-1433 --> <article id="post-1161" class="post-1161 post type-post status-publish format-standard hentry category-andrew tag-wikidata tag-wikipedia"> <header class="entry-header"> <h2 class="entry-title"><a href="https://www.generalist.org.uk/blog/2014/wikidata-and-identifiers-part-2-the-matching-process/" rel="bookmark">Wikidata and identifiers &#8211; part 2, the matching process</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p>Yesterday, I wrote about the work we&#8217;re doing <a href="https://www.generalist.org.uk/blog/2014/wikidata-identifiers-and-the-odnb-where-next/">matching identifiers into Wikidata</a>. Today, the tools we use for it!</p> <h3>Mix-and-match</h3> <p>The main tool we&#8217;re using is a beautiful thing Magnus developed called <a href="http://tools.wmflabs.org/mix-n-match/?"><b>mix-and-match</b></a>. It imports all the identifiers with some core metadata &#8211; for the ODNB, for example, this was names and dates and the brief descriptive text &#8211; and sorts them into five groups:</p> <ul> <li><b>Manually matched</b> &#8211; these matches have been confirmed by a person (or imported from data already in Wikidata); <li><b>Automatic</b> &#8211; the system has guessed these are probably the same people but wants human confirmation; <li><b>Unmatched</b> &#8211; we have no idea who these identifiers match to; <li><b>No Wikidata</b> &#8211; we know there is <i>currently</i> no Wikidata match; <li><b>N/A</b> &#8211; this identifier shouldn&#8217;t match to a Wikidata entity (for example, it&#8217;s a placeholder, a subject Wikidata will never cover, or a cross-reference with its own entry). </ul> <p>The goal is to work through everything and move as much as possible to &#8220;manually matched&#8221;. Anything in this group can then be migrated over to Wikidata with a couple of clicks. 
Here&#8217;s the ODNB as it stands today:</p> <p><img decoding="async" src="https://upload.wikimedia.org/wikipedia/commons/thumb/7/71/Wikidata_mix-and-match_tool_screenshot_1.png/800px-Wikidata_mix-and-match_tool_screenshot_1.png"></p> <p>(Want to see what&#8217;s happening with the data? The <a href="http://tools.wmflabs.org/mix-n-match/?mode=rc&#038;ts=">recent changes</a> link will show you the last fifty edits to all the lists.)</p> <p>So, how do we do this? Firstly, you&#8217;ll need a Wikipedia account, and to log in to our &#8220;WiDaR&#8221; authentication tool. Follow the link on the top of the mix-and-match page (or, indeed, <a href="http://tools.wmflabs.org/widar/index.php?action=authorize">this one</a>), sign in with your Wikipedia account if requested, and you&#8217;ll be authorised. </p> <p>On to the matching itself. There&#8217;s two methods &#8211; manually, or in a semi-automated &#8220;game mode&#8221;.</p> <h3>How to match &#8211; manually</h3> <p>The first approach works line-by-line. Clicking on one of the entries &#8211; here, unmatched ODNB &#8211; brings up the first fifty entries in that set. Each one has options on the left hand side &#8211; to search Wikidata or English Wikipedia, either by the internal search or Google. On the right-hand side, there are three options &#8211; &#8220;set Q&#8221;, to provide it with a Wikidata ID (these are all of the form Q&#8212;&#8211;, and so we often call them &#8220;Q numbers&#8221;); &#8220;No WD&#8221;, to list it as not on Wikidata; &#8220;N/A&#8221;, to record that it&#8217;s not appropriate for Wikidata matching.</p> <p><img decoding="async" src="https://upload.wikimedia.org/wikipedia/commons/thumb/d/d0/Wikidata_mix-and-match_tool_screenshot_2.png/800px-Wikidata_mix-and-match_tool_screenshot_2.png"></p> <p>If you&#8217;ve found a match on Wikidata, the ID number should be clearly displayed at the top of that page. Click &#8220;set Q&#8221; and paste it in. 
If you&#8217;ve found a match via Wikipedia, you can click the &#8220;Wikidata&#8221; link in the left-hand sidebar to take you to the corresponding Wikidata page, and get the ID from there. </p> <p>After a moment, it&#8217;ll display a very rough-and-ready precis of what&#8217;s on Wikidata next to that line &#8211; </p> <p><img decoding="async" src="https://upload.wikimedia.org/wikipedia/commons/thumb/4/4d/Wikidata_mix-and-match_tool_screenshot_3.png/800px-Wikidata_mix-and-match_tool_screenshot_3.png"></p> <p>&#8211; which makes it easy to spot if you&#8217;ve accidentally pasted in the wrong code! Here, we&#8217;ve identified one person (with rather limited information, just gender and deathdate, currently in Wikidata), and marked another as definitely not found.</p> <p>If you&#8217;re using the automatically matched list, you&#8217;ll see something like this:</p> <p><img decoding="async" src="https://upload.wikimedia.org/wikipedia/commons/thumb/3/31/Wikidata_mix-and-match_tool_screenshot_4.png/800px-Wikidata_mix-and-match_tool_screenshot_4.png"></p> <p>&#8211; it&#8217;s already got the data from the possible matches but wants you to confirm. Clicking on the Q-number will take you to the provisional Wikidata match, and from there you can get to relevant Wikipedia articles if you need further confirmation. </p> <h3>How to match &#8211; game mode</h3> <p>We&#8217;ve also set up a &#8220;game mode&#8221;. This is suitable when we expect a high number of the unmatched entries to be connectable to Wikipedia articles; it gives you a random entry from the unmatched list, along with a handful of possible results from a Wikipedia search, and asks you to choose the correct one if it&#8217;s there. You can get it by clicking [G] next to the unmatched entries.</p> <p><a href="http://tools.wmflabs.org/mix-n-match/?mode=random&#038;catalog=16&#038;submode=unmatched">Here&#8217;s an example</a>, using the OpenPlaques database. 
</p> <p><img decoding="async" src="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f6/Wikidata_mix-and-match_tool_screenshot_5.png/800px-Wikidata_mix-and-match_tool_screenshot_5.png"></p> <p>In this one, it was pretty clear that their Roy Castle is the same as the first person listed here (remember him?), so we click the blue Q-number; it&#8217;s marked as matched, and the game generates a new entry. Alternatively, we could look him up elsewhere and paste the Q-number or Wikipedia URL in, then click the &#8220;set Q&#8221; button. If our subject&#8217;s not here &#8211; click &#8220;skip&#8221; and move on to the next one.</p> <h3>Finishing up</h3> <p>When you&#8217;ve finished matching, go back to the main screen and click the [Y] at the end of the list. This allows you to synchronise the work you&#8217;ve done with Wikidata &#8211; it will make the edits to Wikidata under your account. (There is also an option to import existing matches from Wikidata, but at the moment the mix-and-match database is a bit out of synch and this is best avoided&#8230;) There&#8217;s no need to do this if you&#8217;re feeling overly cautious, though &#8211; we&#8217;ll synchronise them soon enough. The same page will also report any cases where two distinct Wikidata entries have been matched to the same identifier, which (usually) shouldn&#8217;t happen.</p> <p>If you want a simple export of the matched data, you can click the [D] link for a TSV file (Q-number, identifier, identifier URL &#038; name if relevant), and some stats on how many matches to individual wikis are available with [S].</p> <h3>Brute force</h3> <p>Finally, if you have a lot of matched data, and you are confident it&#8217;s accurate without needing human confirmation, then you can adopt the brute-force method &#8211; <a href="http://tools.wmflabs.org/wikidata-todo/quick_statements.php?">QuickStatements</a>. 
This is the tool used for pushing data from mix-and-match to Wikidata, and can be used for any data import. Instructions are on that page &#8211; but if you&#8217;re going to use it, test it with a few individual items first to make sure it&#8217;s doing what you think, and please don&#8217;t be shy to ask for help&#8230;</p> <p>So, we&#8217;ve covered a) what we&#8217;re doing; and b) how we get the information into Wikidata. Next instalment, how to actually use these identifiers for your own purposes&#8230;</p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://www.generalist.org.uk/blog/2014/wikidata-and-identifiers-part-2-the-matching-process/" rel="bookmark"><time class="entry-date published" datetime="2014-11-27T19:39:36+00:00">November 27, 2014</time><time class="updated" datetime="2014-11-27T20:35:49+00:00">November 27, 2014</time></a></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://www.generalist.org.uk/blog/authors/andrew/" rel="category tag">Andrew</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://www.generalist.org.uk/blog/tags/wikidata/" rel="tag">wikidata</a>, <a href="https://www.generalist.org.uk/blog/tags/wikipedia/" rel="tag">wikipedia</a></span><span class="comments-link"><a href="https://www.generalist.org.uk/blog/2014/wikidata-and-identifiers-part-2-the-matching-process/#comments">10 Comments<span class="screen-reader-text"> on Wikidata and identifiers &#8211; part 2, the matching process</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-1161 --> <article id="post-1164" class="post-1164 post type-post status-publish format-standard hentry category-andrew tag-wikidata tag-wikipedia"> <header class="entry-header"> <h2 class="entry-title"><a href="https://www.generalist.org.uk/blog/2014/wikidata-identifiers-and-the-odnb-where-next/" 
rel="bookmark">Wikidata identifiers and the ODNB &#8211; where next?</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p>Wikidata, for those of you unfamiliar with it, is the backend we are developing for Wikipedia. At its simplest, it&#8217;s a spine linking together the same concept in different languages &#8211; so we can tell that a <a href="https://en.wikipedia.org/wiki/Coronation">coronation</a> in English matches <a href="https://az.wikipedia.org/wiki/Tacqoyma">Tacqoyma</a> in Azeri or <a href="https://uk.wikipedia.org/wiki/%D0%9A%D0%BE%D1%80%D0%BE%D0%BD%D0%B0%D1%86%D1%96%D1%8F">Коронація</a> in Ukrainian, or thirty-five other languages between. This all gets bundled up into a single data entry &#8211; the enigmatically named <a href="https://www.wikidata.org/wiki/Q209715">Q209715</a> &#8211; which then gets other properties attached. In this case, a coronation is a kind of (or subclass of, for you semanticians) &#8220;ceremony&#8221; (<a href="https://www.wikidata.org/wiki/Q2627975">Q2627975</a>), and is linked to a few external thesauruses. The system is fully multilingual, so we can express &#8220;coronation &#8211; subclass of &#8211; ceremony&#8221; in English as easily as &#8220;kroning &#8211; undergruppe af &#8211; ceremoni&#8221; in Danish.</p> <p>So far, so good.</p> <p>There has been a great deal of work around Wikipedia in recent years in connecting our rich-text articles to static authority control records &#8211; confirming that our <a href="https://en.wikipedia.org/wiki/George_Washington">George Washington</a> is the same as the one <a href="http://id.loc.gov/authorities/names/n86140996.html">the Library of Congress knows about</a>. During 2012-13, these were ingested from Wikipedia into Wikidata, and as of a year ago <a href="http://journal.code4lib.org/articles/8964">we had identified</a> around 420,000 Wikidata entities with authority control identifiers. 
Most of these were from VIAF, but around half had an identifier from the German GND database, another half from ISNI, and a little over a third LCCN identifiers. Many had all four (and more). We now support matching to a large number of library catalogue identifiers, but &#8211; speaking as a librarian &#8211; I&#8217;m aware this isn&#8217;t very exciting to anyone who doesn&#8217;t spend much of their time cataloguing&#8230;</p> <p>So, the next phase was to move beyond simply &#8220;authority&#8221; identifiers and move to ones that actually provide content. The main project that I&#8217;ve been working on (along with Charles Matthews and Magnus Manske, with the help of Jo Payne at OUP) is matching Wikidata to the <a href="http://www.oxforddnb.com/"><i>Oxford Dictionary of National Biography</i></a> &#8211; Wikipedia authors tend to hold the ODNB in high regard, and many of our articles already use it as a reference work. We&#8217;re currently about three-quarters of the way through, having identified around 40,000 ODNB entries who have been clearly matched to a Wikidata entity, and the rest should be finished some time in 2015. (You can see the tool <a href="http://tools.wmflabs.org/mix-n-match/?">here</a>, and how to use that will be a post for another day.) After that, I&#8217;ve been working on a project to make links between Wikidata and the <a href="http://www.historyofparliamentonline.org/">History of Parliament</a> (with the assistance of Matthew Kilburn and Paul Seaward) &#8211; looking forward to being able to announce some results from this soon.</p> <p>What does this mean? 
Well, for a first step, it means we can start making better links to a valuable resource on a more organised basis &#8211; for example, Robin Owain and I recently deployed an experimental tool on the Welsh Wikipedia that will generate ODNB links at the end of any article on a relevant subject (see, eg, <a href="https://cy.wikipedia.org/wiki/Dylan_Thomas#Dolenni_allanol">Dylan Thomas</a>). It means we can start making <a href="https://en.wikisource.org/wiki/Dictionary_of_National_Biography,_1885-1900">the Wikisource edition</a> of the (original) <i>Dictionary of National Biography</i> more visible. It means we can quickly generate worklists &#8211; you want suitable articles to work on? Well, we have all these interesting and undeniably notable biographies not yet covered in English (or Welsh, or German, or&#8230;)</p> <p>For the ODNB, it opens up the potential for linking to other interesting datasets (and that without having to pass through wikidata &#8211; all this can be exported). At the moment, we can identify matches to <a href="https://tools.wmflabs.org/wikidata-todo/beacon.php?prop=1415&#038;source=213">twelve thousand ISNIs</a>, <a href="https://tools.wmflabs.org/wikidata-todo/beacon.php?prop=1415&#038;source=214">twenty thousand VIAF identifiers</a>, and &#8211; unexpectedly &#8211; <a href="https://tools.wmflabs.org/wikidata-todo/beacon.php?prop=1415&#038;source=345">a thousand entries in IMDb</a>. (Ten of them are entries for &#8220;characters&#8221;, which opens up a marvellous conceptual can of worms, but let&#8217;s leave that aside&#8230;). </p> <p>And for third parties? Well, this is where it gets interesting. If you have ODNB links in your dataset, we can generate Wikipedia entries (probably less valuable, but in oh so many languages). We can generate images for you &#8211; Wikidata knows about openly licensed portraits for 214,000 people. Or we can crosswalk to whatever other project we support &#8211; YourPaintings links, perhaps? 
We can match <a href="https://tools.wmflabs.org/wikidata-todo/beacon.php?prop=1415&#038;source=1367">a thousand</a> of those. It can go backwards &#8211; we can take your existing VIAF links and give you ODNB entries. (Cataloguers, take note.)</p> <p>And, best of all, we can ingest that data &#8211; and once it&#8217;s in Wikidata, the next third party to come along can make the links directly to you, and every new dataset makes the existing ones more valuable. Right now, we have a lot of authority control data, but we&#8217;re lighter on serious content links. If you have a useful online project with permanent identifiers, and you&#8217;d like to start matching those up to Wikidata, please do <a href="../../contact-me/">get in touch</a> &#8211; this is really exciting work and we&#8217;d love to work with anyone wanting to help take it forward. </p> <hr> <p><b>Update</b>: Here&#8217;s part 2: <a href="https://www.generalist.org.uk/blog/2014/wikidata-and-identifiers-part-2-the-matching-process/">on how to use the mix-and-match tool</a>.</p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://www.generalist.org.uk/blog/2014/wikidata-identifiers-and-the-odnb-where-next/" rel="bookmark"><time class="entry-date published" datetime="2014-11-26T21:59:10+00:00">November 26, 2014</time><time class="updated" datetime="2014-11-27T19:41:44+00:00">November 27, 2014</time></a></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://www.generalist.org.uk/blog/authors/andrew/" rel="category tag">Andrew</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://www.generalist.org.uk/blog/tags/wikidata/" rel="tag">wikidata</a>, <a href="https://www.generalist.org.uk/blog/tags/wikipedia/" rel="tag">wikipedia</a></span><span class="comments-link"><a 
href="https://www.generalist.org.uk/blog/2014/wikidata-identifiers-and-the-odnb-where-next/#comments">4 Comments<span class="screen-reader-text"> on Wikidata identifiers and the ODNB &#8211; where next?</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-1164 --> <article id="post-1130" class="post-1130 post type-post status-publish format-standard hentry category-andrew tag-law tag-legislation tag-wikidata tag-wikimedia tag-wikipedia"> <header class="entry-header"> <h2 class="entry-title"><a href="https://www.generalist.org.uk/blog/2014/laws-on-wikidata/" rel="bookmark">Laws on Wikidata</a></h2> </header><!-- .entry-header --> <div class="entry-content"> <p>So, I had the day off, and decided to fiddle a little with Wikidata. After some experimenting, it now knows about:</p> <ul> <li><a href="http://tools.wmflabs.org/wikidata-todo/autolist.html?q=claim%5B31%3A4677783%5D">1516</a> Acts of the Parliament of the United Kingdom (1801-present) <li><a href="http://tools.wmflabs.org/wikidata-todo/autolist.html?q=claim%5B31%3A18009431%5D">194</a> Acts of the Parliament of Great Britain (1707-1800) <li><a href="http://tools.wmflabs.org/wikidata-todo/autolist.html?q=claim%5B31%3A18009587%5D">329</a> Acts of the Parliament of England (to 1707) <li><a href="http://tools.wmflabs.org/wikidata-todo/autolist.html?q=claim%5B31%3A18009569%5D">20</a> Acts of the Parliament of Scotland (to 1707) <li><a href="http://tools.wmflabs.org/wikidata-todo/autolist.html?q=claim%5B31%3A18009650%5D">19</a> Acts of the Parliament of Ireland (to 1800) </ul> <p>(Acts of the modern devolved parliaments for NI, Scotland, and Wales will follow.)</p> <p>Each has a specific &#8220;instance of&#8221; property &#8211; <a href="https://www.wikidata.org/wiki/Q18009569">Q18009569</a>, for example, is &#8220;act of the Parliament of Scotland&#8221; &#8211; and is set up as a subclass of the general &#8220;act of parliament&#8221;. 
At the moment, there&#8217;s detailed subclasses for the UK and Canada (which has a separate class for each province&#8217;s legislation) but nowhere else. Yet&#8230;</p> <p>These numbers are slightly fuzzy &#8211; it&#8217;s mainly based on Wikipedia articles and so there are a small handful of cases where the entry represents a particular clause (eg <a href="https://www.wikidata.org/wiki/Q7444697">Q7444697</a>, s.4 and s.10 of the Human Rights Act 1998), or cases where multiple statutes are treated in the same article (eg <a href="https://www.wikidata.org/wiki/Q1133144">Q1133144</a>, the Corn Laws), but these are relatively rare and, mostly, it&#8217;s a good direct correspondence. (I&#8217;ve been fairly careful to keep out oddities, but of course, some will creep in&#8230;)</p> <p>So where next? At the moment, these almost all reflect Wikipedia articles. Only <a href="http://tools.wmflabs.org/wikidata-todo/autolist.html?q=%28CLAIM%5B31%3A18009431%5D%20OR%20CLAIM%5B31%3A18009650%5D%20OR%20CLAIM%5B31%3A18009569%5D%20OR%20CLAIM%5B31%3A18009587%5D%20OR%20CLAIM%5B31%3A4677783%5D%29%20AND%20LINK%5Benwikisource%5D">34</a> have a link to (English) Wikisource, though I&#8217;d guess there&#8217;s about 200-250 statutes currently on there. Matching those up will definitely be valuable; for legislation currently in force and on the Statute Law Database, it would be good to be able to crosslink to there as well. 
</p> </div><!-- .entry-content --> <footer class="entry-footer"> <span class="posted-on"><span class="screen-reader-text">Posted on </span><a href="https://www.generalist.org.uk/blog/2014/laws-on-wikidata/" rel="bookmark"><time class="entry-date published updated" datetime="2014-09-09T20:17:23+01:00">September 9, 2014</time></a></span><span class="cat-links"><span class="screen-reader-text">Categories </span><a href="https://www.generalist.org.uk/blog/authors/andrew/" rel="category tag">Andrew</a></span><span class="tags-links"><span class="screen-reader-text">Tags </span><a href="https://www.generalist.org.uk/blog/tags/law/" rel="tag">law</a>, <a href="https://www.generalist.org.uk/blog/tags/legislation/" rel="tag">legislation</a>, <a href="https://www.generalist.org.uk/blog/tags/wikidata/" rel="tag">wikidata</a>, <a href="https://www.generalist.org.uk/blog/tags/wikimedia/" rel="tag">wikimedia</a>, <a href="https://www.generalist.org.uk/blog/tags/wikipedia/" rel="tag">wikipedia</a></span><span class="comments-link"><a href="https://www.generalist.org.uk/blog/2014/laws-on-wikidata/#comments">2 Comments<span class="screen-reader-text"> on Laws on Wikidata</span></a></span> </footer><!-- .entry-footer --> </article><!-- #post-1130 --> </main><!-- .site-main --> </section><!-- .content-area --> </div><!-- .site-content --> <footer id="colophon" class="site-footer"> <div class="site-info"> <a href="https://wordpress.org/" class="imprint"> Proudly powered by WordPress </a> </div><!-- .site-info --> </footer><!-- .site-footer --> </div><!-- .site --> <script src="https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/js/skip-link-focus-fix.js?ver=20141028" id="twentyfifteen-skip-link-focus-fix-js"></script> <script id="twentyfifteen-script-js-extra"> var screenReaderText = {"expand":"<span class=\"screen-reader-text\">expand child menu<\/span>","collapse":"<span class=\"screen-reader-text\">collapse child menu<\/span>"}; </script> <script 
src="https://www.generalist.org.uk/blog/wp-content/themes/twentyfifteen/js/functions.js?ver=20221101" id="twentyfifteen-script-js"></script> </body> </html>

Pages: 1 2 3 4 5 6 7 8 9 10