From 30a1f612ffc1144e66ac3c9e73bf791d049fb693 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Fri, 9 Aug 2019 09:57:26 +0300 Subject: [PATCH] Add notes for 2019-08-09 --- content/posts/2019-08.md | 14 ++++++++++++++ docs/2019-08/index.html | 25 ++++++++++++++++++++++--- docs/sitemap.xml | 10 +++++----- 3 files changed, 41 insertions(+), 8 deletions(-) diff --git a/content/posts/2019-08.md b/content/posts/2019-08.md index 50c3a08b4..4d23e55a5 100644 --- a/content/posts/2019-08.md +++ b/content/posts/2019-08.md @@ -120,4 +120,18 @@ proxy_set_header Host dev.ares.codeobia.com; - Though I am really wondering why this happened now, because the configuration has been working for months... - Improve the output of the suspicious characters check in [csv-metadata-quality](https://github.com/alanorth/csv-metadata-quality) script and tag version 0.2.0 +## 2019-08-09 + +- Looking at the 128 IITA records (20195TH.xls) that Sisay uploaded to DSpace Test last month: [IITA_July_29](https://dspacetest.cgiar.org/handle/10568/102361) + - The records are pretty clean because Sisay ran them through the csv-metadata-quality tool + - I fixed one incorrect country (MELBOURNE) + - I normalized all DOIs to be https://doi.org format + - This item is using the wrong Google Books link: https://dspacetest.cgiar.org/handle/10568/102593 + - The French abstract here has copy/paste errors: https://dspacetest.cgiar.org/handle/10568/102491 + - Validate and normalize affiliations against our 2019-04 list using reconcile-csv and OpenRefine: + - `$ lein run ~/src/git/DSpace/2019-04-08-affiliations.csv name id` + - I always forget how to copy the reconciled values in OpenRefine, but you need to make a new column and populate it using this GREL: `if(cell.recon.matched, cell.recon.match.name, value)` + - I asked Bosede to check about twenty-five invalid AGROVOC subjects identified by csv-metadata-quality script + - I still need to check the sponsors and then check for duplicates + diff --git 
a/docs/2019-08/index.html b/docs/2019-08/index.html index 2abff5b72..4fbfa4b65 100644 --- a/docs/2019-08/index.html +++ b/docs/2019-08/index.html @@ -27,7 +27,7 @@ Run system updates on DSpace Test (linode19) and reboot it - + @@ -59,9 +59,9 @@ Run system updates on DSpace Test (linode19) and reboot it "@type": "BlogPosting", "headline": "August, 2019", "url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-08\/", - "wordCount": "909", + "wordCount": "1043", "datePublished": "2019-08-03T12:39:51\x2b03:00", - "dateModified": "2019-08-08T18:10:44\x2b03:00", + "dateModified": "2019-08-09T01:42:13\x2b03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -282,6 +282,25 @@ $ ./generate-thumbnails.py -i /tmp/user-upload2.csv -w --url-field-name url -d |
  • Improve the output of the suspicious characters check in csv-metadata-quality script and tag version 0.2.0

  • +

    2019-08-09

    + + + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index 4c84ce9f4..9456dbc4e 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,30 +4,30 @@ https://alanorth.github.io/cgspace-notes/2019-08/ - 2019-08-08T18:10:44+03:00 + 2019-08-09T01:42:13+03:00 https://alanorth.github.io/cgspace-notes/ - 2019-08-08T18:10:44+03:00 + 2019-08-09T01:42:13+03:00 0 https://alanorth.github.io/cgspace-notes/tags/notes/ - 2019-08-08T18:10:44+03:00 + 2019-08-09T01:42:13+03:00 0 https://alanorth.github.io/cgspace-notes/posts/ - 2019-08-08T18:10:44+03:00 + 2019-08-09T01:42:13+03:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2019-08-08T18:10:44+03:00 + 2019-08-09T01:42:13+03:00 0