From a37eaf795eb1ebe8f9dba737f7299b3591ad124c Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Mon, 25 Sep 2017 00:38:30 +0300 Subject: [PATCH] Update notes for 2017-09-24 --- content/post/2017-09.md | 10 ++++++++++ public/2017-09/index.html | 17 ++++++++++++++--- public/robots.txt | 2 +- public/sitemap.xml | 18 +++++++++--------- 4 files changed, 34 insertions(+), 13 deletions(-) diff --git a/content/post/2017-09.md b/content/post/2017-09.md index c2700dcb7..f522894c0 100644 --- a/content/post/2017-09.md +++ b/content/post/2017-09.md @@ -463,3 +463,13 @@ $ schedtool -D -e ionice -c2 -n7 nice -n19 dspace filter-media -f -i 10947/1 -p - Peter asked if we could map all the items of type `Journal Article` in [ILRI Archive](https://cgspace.cgiar.org/handle/10568/2703) to [ILRI articles in journals and newsletters](https://cgspace.cgiar.org/handle/10568/3) - It is easy to do via CSV using OpenRefine but I noticed that on CGSpace ~1,000 of the expected 2,500 are already mapped, while on DSpace Test they were not - I've asked Peter if he knows what's going on (or who mapped them) +- Turns out he had already mapped some, but requested that I finish the rest +- With this GREL in OpenRefine I can find items that are mapped, ie they have `10568/3||` or `10568/3$` in their `collection` field: + +``` +isNotNull(value.match(/.+?10568\/3(\|\|.+|$)/)) +``` + +- Peter also made a lot of changes to the data in the Archives collections while I was attempting to import the changes, so we were essentially competing for PostgreSQL and Solr connections +- I ended up having to kill the import and wait until he was done +- I exported a clean CSV and applied the changes from that one, which was a hundred or two less than I thought there should be (at least compared to the current state of DSpace Test, which is a few months old) diff --git a/public/2017-09/index.html b/public/2017-09/index.html index 0cdf0c4cc..49c7d91dd 100644 --- a/public/2017-09/index.html +++ b/public/2017-09/index.html @@ 
-25,7 +25,7 @@ Ask Sisay to clean up the WLE approvers a bit, as Marianne’s user account - + @@ -61,9 +61,9 @@ Ask Sisay to clean up the WLE approvers a bit, as Marianne’s user account "@type": "BlogPosting", "headline": "September, 2017", "url": "https://alanorth.github.io/cgspace-notes/2017-09/", - "wordCount": "3456", + "wordCount": "3580", "datePublished": "2017-09-07T16:54:52+07:00", - "dateModified": "2017-09-24T11:43:57+03:00", + "dateModified": "2017-09-24T17:10:15+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -649,6 +649,17 @@ DELETE 207
  • Peter asked if we could map all the items of type Journal Article in ILRI Archive to ILRI articles in journals and newsletters
  • It is easy to do via CSV using OpenRefine, but I noticed that on CGSpace ~1,000 of the expected 2,500 are already mapped, while on DSpace Test they are not
  • I’ve asked Peter if he knows what’s going on (or who mapped them)
  • +
  • Turns out he had already mapped some, but requested that I finish the rest
  • +
  • With this GREL in OpenRefine I can find items that are mapped, i.e. they have 10568/3|| or 10568/3$ in their collection field:
  • + + +
    isNotNull(value.match(/.+?10568\/3(\|\|.+|$)/))
    +
    + + diff --git a/public/robots.txt b/public/robots.txt index bb802e51c..defa6419a 100644 --- a/public/robots.txt +++ b/public/robots.txt @@ -27,7 +27,7 @@ Disallow: /cgspace-notes/2015-12/ Disallow: /cgspace-notes/2015-11/ Disallow: /cgspace-notes/ Disallow: /cgspace-notes/categories/ -Disallow: /cgspace-notes/tags/notes/ Disallow: /cgspace-notes/categories/notes/ +Disallow: /cgspace-notes/tags/notes/ Disallow: /cgspace-notes/post/ Disallow: /cgspace-notes/tags/ diff --git a/public/sitemap.xml b/public/sitemap.xml index c65dd07bc..c4524ebcb 100644 --- a/public/sitemap.xml +++ b/public/sitemap.xml @@ -9,7 +9,7 @@ https://alanorth.github.io/cgspace-notes/2017-09/ - 2017-09-24T11:43:57+03:00 + 2017-09-24T17:10:15+03:00 @@ -133,27 +133,27 @@ 0 - - https://alanorth.github.io/cgspace-notes/tags/notes/ - 2017-09-24T11:43:57+03:00 - 0 - - https://alanorth.github.io/cgspace-notes/categories/notes/ 2017-09-19T22:23:37+03:00 0 + + https://alanorth.github.io/cgspace-notes/tags/notes/ + 2017-09-24T17:10:15+03:00 + 0 + + https://alanorth.github.io/cgspace-notes/post/ - 2017-09-24T11:43:57+03:00 + 2017-09-24T17:10:15+03:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2017-09-24T11:43:57+03:00 + 2017-09-24T17:10:15+03:00 0