From 9d0f0cbfde1da7685479260fe86c67d23fbca5e5 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Thu, 10 Sep 2020 12:18:03 +0300 Subject: [PATCH] Add notes for 2020-09-10 --- content/posts/2020-09.md | 44 +++++++++++++++++++ docs/2020-09/index.html | 58 +++++++++++++++++++++++-- docs/categories/index.html | 2 +- docs/categories/notes/index.html | 2 +- docs/categories/notes/page/2/index.html | 2 +- docs/categories/notes/page/3/index.html | 2 +- docs/categories/notes/page/4/index.html | 2 +- docs/index.html | 2 +- docs/page/2/index.html | 2 +- docs/page/3/index.html | 2 +- docs/page/4/index.html | 2 +- docs/page/5/index.html | 2 +- docs/page/6/index.html | 2 +- docs/page/7/index.html | 2 +- docs/posts/index.html | 2 +- docs/posts/page/2/index.html | 2 +- docs/posts/page/3/index.html | 2 +- docs/posts/page/4/index.html | 2 +- docs/posts/page/5/index.html | 2 +- docs/posts/page/6/index.html | 2 +- docs/posts/page/7/index.html | 2 +- docs/sitemap.xml | 10 ++--- 22 files changed, 123 insertions(+), 27 deletions(-) diff --git a/content/posts/2020-09.md b/content/posts/2020-09.md index 6f3ce4530..269d15c93 100644 --- a/content/posts/2020-09.md +++ b/content/posts/2020-09.md @@ -146,5 +146,49 @@ https://cgspace.cgiar.org/bitstream/handle/10568/82745/Characteristics-Silage.JP - So they end up getting rate limited due to the XMLUI rate limits - I told them to use the REST API bitstream retrieve links, because we don't have any rate limits there +## 2020-09-09 + +- Wire up the systemd service/timer for the CGSpace Country Code Tagger curation task in the [Ansible infrastructure scripts](https://github.com/ilri/rmg-ansible-public) + - ~~For now it won't work on DSpace 6 because the curation task invocation needs to be slightly different (minus the `-l` parameter) and for some reason the task isn't working on DSpace Test (version 6) right now~~ + - I added DSpace 6 support to the playbook templates... +- Run system updates on DSpace Test (linode26), re-deploy the DSpace 6 test branch, and reboot the server + - After rebooting I deleted old copies of the cgspace-java-helpers JAR in the DSpace lib directory and then the curation worked + - To my great surprise the curation worked (and completed, albeit a few times slower) on my local DSpace 6 environment as well: + +``` +$ ~/dspace63/bin/dspace curate -t countrycodetagger -i all -s object +``` + +## 2020-09-10 + +- I checked the country code tagger on CGSpace and DSpace Test and it ran fine from the systemd timer last night... w00t +- I started looking at Peter's changes to the CGSpace regions that were proposed in 2020-07 + - The changes will be: + +``` +$ cat 2020-09-10-fix-cgspace-regions.csv +cg.coverage.region,correct +EAST AFRICA,EASTERN AFRICA +WEST AFRICA,WESTERN AFRICA +SOUTHEAST ASIA,SOUTHEASTERN ASIA +SOUTH ASIA,SOUTHERN ASIA +AFRICA SOUTH OF SAHARA,SUB-SAHARAN AFRICA +NORTH AFRICA,NORTHERN AFRICA +WEST ASIA,WESTERN ASIA +SOUTHWEST ASIA,SOUTHWESTERN ASIA +$ ./fix-metadata-values.py -i 2020-09-10-fix-cgspace-regions.csv -db dspace -u dspace -p 'fuuu' -f cg.coverage.region -t 'correct' -m 227 -d -n +Connected to database. +Would fix 12227 occurences of: EAST AFRICA +Would fix 7996 occurences of: WEST AFRICA +Would fix 3515 occurences of: SOUTHEAST ASIA +Would fix 3443 occurences of: SOUTH ASIA +Would fix 1134 occurences of: AFRICA SOUTH OF SAHARA +Would fix 357 occurences of: NORTH AFRICA +Would fix 81 occurences of: WEST ASIA +Would fix 3 occurences of: SOUTHWEST ASIA +``` + +- I think we need to wait for the web team, though, as they need to update their mappings + - Not to mention that we'll need to give WLE and CCAFS time to update their harvesters as well... hmmm diff --git a/docs/2020-09/index.html b/docs/2020-09/index.html index b2252c1d9..689ebc992 100644 --- a/docs/2020-09/index.html +++ b/docs/2020-09/index.html @@ -25,7 +25,7 @@ I filed an issue on OpenRXV to make some minor edits to the admin UI: https://gi - + @@ -55,9 +55,9 @@ I filed an issue on OpenRXV to make some minor edits to the admin UI: https://gi "@type": "BlogPosting", "headline": "September, 2020", "url": "https://alanorth.github.io/cgspace-notes/2020-09/", - "wordCount": "838", + "wordCount": "1159", "datePublished": "2020-09-02T15:35:54+03:00", - "dateModified": "2020-09-04T13:32:16+03:00", + "dateModified": "2020-09-08T12:10:08+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -290,6 +290,58 @@ dspace=# UPDATE metadatavalue SET text_value = regexp_replace(text_value, '^http +

2020-09-09

+ +
$ ~/dspace63/bin/dspace curate -t countrycodetagger -i all -s object
+

2020-09-10

+ +
$ cat 2020-09-10-fix-cgspace-regions.csv
+cg.coverage.region,correct
+EAST AFRICA,EASTERN AFRICA
+WEST AFRICA,WESTERN AFRICA
+SOUTHEAST ASIA,SOUTHEASTERN ASIA
+SOUTH ASIA,SOUTHERN ASIA
+AFRICA SOUTH OF SAHARA,SUB-SAHARAN AFRICA
+NORTH AFRICA,NORTHERN AFRICA
+WEST ASIA,WESTERN ASIA
+SOUTHWEST ASIA,SOUTHWESTERN ASIA
+$ ./fix-metadata-values.py -i 2020-09-10-fix-cgspace-regions.csv -db dspace -u dspace -p 'fuuu' -f cg.coverage.region -t 'correct' -m 227 -d -n
+Connected to database.
+Would fix 12227 occurences of: EAST AFRICA
+Would fix 7996 occurences of: WEST AFRICA
+Would fix 3515 occurences of: SOUTHEAST ASIA
+Would fix 3443 occurences of: SOUTH ASIA
+Would fix 1134 occurences of: AFRICA SOUTH OF SAHARA
+Would fix 357 occurences of: NORTH AFRICA
+Would fix 81 occurences of: WEST ASIA
+Would fix 3 occurences of: SOUTHWEST ASIA
+
diff --git a/docs/categories/index.html b/docs/categories/index.html index 385d67b6f..aabfc2696 100644 --- a/docs/categories/index.html +++ b/docs/categories/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/categories/notes/index.html b/docs/categories/notes/index.html index 3ea90f530..e6e165943 100644 --- a/docs/categories/notes/index.html +++ b/docs/categories/notes/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/categories/notes/page/2/index.html b/docs/categories/notes/page/2/index.html index 1986d103e..cda11b758 100644 --- a/docs/categories/notes/page/2/index.html +++ b/docs/categories/notes/page/2/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/categories/notes/page/3/index.html b/docs/categories/notes/page/3/index.html index c7008fb2c..fb7d1e958 100644 --- a/docs/categories/notes/page/3/index.html +++ b/docs/categories/notes/page/3/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/categories/notes/page/4/index.html b/docs/categories/notes/page/4/index.html index ac66f6f71..0c35d83a0 100644 --- a/docs/categories/notes/page/4/index.html +++ b/docs/categories/notes/page/4/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/index.html b/docs/index.html index 4def53b1a..d73b3b694 100644 --- a/docs/index.html +++ b/docs/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/2/index.html b/docs/page/2/index.html index 398bfc53c..997b1e26f 100644 --- a/docs/page/2/index.html +++ b/docs/page/2/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/3/index.html b/docs/page/3/index.html index 0a9c468cf..6cc3e17c6 100644 --- a/docs/page/3/index.html +++ b/docs/page/3/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/4/index.html b/docs/page/4/index.html index 81954c635..a04f5364c 100644 --- a/docs/page/4/index.html +++ b/docs/page/4/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/5/index.html b/docs/page/5/index.html index 89a0fc966..b1c4ef3d7 100644 --- a/docs/page/5/index.html +++ b/docs/page/5/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/6/index.html b/docs/page/6/index.html index 9fddab172..47f08cd4f 100644 --- a/docs/page/6/index.html +++ b/docs/page/6/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/7/index.html b/docs/page/7/index.html index dac75be69..63b3479ab 100644 --- a/docs/page/7/index.html +++ b/docs/page/7/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/index.html b/docs/posts/index.html index 2b1d96fea..38c138346 100644 --- a/docs/posts/index.html +++ b/docs/posts/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/2/index.html b/docs/posts/page/2/index.html index e30e766da..ad1435bfa 100644 --- a/docs/posts/page/2/index.html +++ b/docs/posts/page/2/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/3/index.html b/docs/posts/page/3/index.html index 8e53a430e..fd95db1b4 100644 --- a/docs/posts/page/3/index.html +++ b/docs/posts/page/3/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/4/index.html b/docs/posts/page/4/index.html index 93548e6fc..5e0221cb4 100644 --- a/docs/posts/page/4/index.html +++ b/docs/posts/page/4/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/5/index.html b/docs/posts/page/5/index.html index 495559fd0..0be45e701 100644 --- a/docs/posts/page/5/index.html +++ b/docs/posts/page/5/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/6/index.html b/docs/posts/page/6/index.html index 759cdd7fe..479bb77a4 100644 --- a/docs/posts/page/6/index.html +++ b/docs/posts/page/6/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/7/index.html b/docs/posts/page/7/index.html index 0e570a794..c348ac379 100644 --- a/docs/posts/page/7/index.html +++ b/docs/posts/page/7/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index 32ccc3f4c..3b90c9ffa 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,27 +4,27 @@ https://alanorth.github.io/cgspace-notes/categories/ - 2020-09-04T13:32:16+03:00 + 2020-09-08T12:10:08+03:00 https://alanorth.github.io/cgspace-notes/ - 2020-09-04T13:32:16+03:00 + 2020-09-08T12:10:08+03:00 https://alanorth.github.io/cgspace-notes/categories/notes/ - 2020-09-04T13:32:16+03:00 + 2020-09-08T12:10:08+03:00 https://alanorth.github.io/cgspace-notes/posts/ - 2020-09-04T13:32:16+03:00 + 2020-09-08T12:10:08+03:00 https://alanorth.github.io/cgspace-notes/2020-09/ - 2020-09-04T13:32:16+03:00 + 2020-09-08T12:10:08+03:00