From 32830944c29ed31e24ba91984b3b6cca2b202a6c Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Fri, 17 May 2019 18:46:13 +0300 Subject: [PATCH] Add notes for 2019-05-17 --- content/posts/2019-05.md | 20 ++++++++++++++++++++ docs/2019-05/index.html | 28 +++++++++++++++++++++++++--- docs/sitemap.xml | 10 +++++----- 3 files changed, 50 insertions(+), 8 deletions(-) diff --git a/content/posts/2019-05.md b/content/posts/2019-05.md index adce99e47..6796519b4 100644 --- a/content/posts/2019-05.md +++ b/content/posts/2019-05.md @@ -364,4 +364,24 @@ COPY 995 - Fork the [ICARDA AReS v1 repository](https://github.com/icarda-git/AReS) to [ILRI's GitHub](https://github.com/ilri/AReS) and give access to CodeObia guys - The plan is that we develop the v2 code here +## 2019-05-17 + +- Peter sent me a bunch of fixes for investors from yesterday +- I did a quick check in Open Refine (trim and collapse whitespace, clean smart quotes, etc) and then applied them on CGSpace: + +``` +$ ./fix-metadata-values.py -i /tmp/2019-05-16-fix-306-Investors.csv -db dspace -u dspace -p 'fuuu' -f dc.description.sponsorship -m 29 -t correct -d +$ ./delete-metadata-values.py -i /tmp/2019-05-16-delete-297-Investors.csv -db dspace -u dspace -p 'fuuu' -m 29 -f dc.description.sponsorship -d +``` + +- Then I started a full Discovery re-indexing: + +``` +$ export JAVA_OPTS="-Dfile.encoding=UTF-8 -Xmx1024m" +$ time schedtool -B -e ionice -c2 -n7 nice -n19 dspace index-discovery -b +``` + +- I was going to make a new controlled vocabulary of the top 100 terms after these corrections, but I noticed a bunch of duplicates and variations when I sorted them alphabetically +- Instead, I exported a new list and asked Peter to look at it again + diff --git a/docs/2019-05/index.html b/docs/2019-05/index.html index 52577d32a..5c71d75d4 100644 --- a/docs/2019-05/index.html +++ b/docs/2019-05/index.html @@ -28,7 +28,7 @@ But after this I tried to delete the item from the XMLUI and it is still present - + @@ -61,9 +61,9 @@ But 
after this I tried to delete the item from the XMLUI and it is still present "@type": "BlogPosting", "headline": "May, 2019", "url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-05\/", - "wordCount": "2541", + "wordCount": "2674", "datePublished": "2019-05-01T07:37:43\x2b03:00", - "dateModified": "2019-05-16T00:12:50\x2b03:00", + "dateModified": "2019-05-16T18:26:49\x2b03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -581,6 +581,28 @@ COPY 995 +

2019-05-17

+ + + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index d7b15a412..98ba74478 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,30 +4,30 @@ https://alanorth.github.io/cgspace-notes/ - 2019-05-16T00:12:50+03:00 + 2019-05-16T18:26:49+03:00 0 https://alanorth.github.io/cgspace-notes/2019-05/ - 2019-05-16T00:12:50+03:00 + 2019-05-16T18:26:49+03:00 https://alanorth.github.io/cgspace-notes/tags/notes/ - 2019-05-16T00:12:50+03:00 + 2019-05-16T18:26:49+03:00 0 https://alanorth.github.io/cgspace-notes/posts/ - 2019-05-16T00:12:50+03:00 + 2019-05-16T18:26:49+03:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2019-05-16T00:12:50+03:00 + 2019-05-16T18:26:49+03:00 0