diff --git a/content/posts/2019-05.md b/content/posts/2019-05.md index b820bdfd6..53f3724b2 100644 --- a/content/posts/2019-05.md +++ b/content/posts/2019-05.md @@ -418,4 +418,29 @@ $ ./delete-metadata-values.py -i /tmp/2019-05-17-delete-14-Investors.csv -db dsp $ dspace import -a -e me@cgiar.org -m 2019-05-25-AfricaRice.map -s /tmp/SimpleArchiveFormat ``` +## 2019-05-27 + +- Peter sent me over two thousand corrections for the authors on CGSpace that I had dumped last month + - I proofed them for whitespace and invalid special characters in OpenRefine and then applied them on CGSpace and DSpace Test: + +``` +$ ./fix-metadata-values.py -i /tmp/2019-05-27-fix-2472-Authors.csv -db dspace -u dspace -p 'fuuu' -f dc.contributor.author -m 3 -t corrections -d +``` + +- Then start a full Discovery re-indexing on each server: + +``` +$ export JAVA_OPTS="-Dfile.encoding=UTF-8 -Xmx1024m" +$ time schedtool -B -e ionice -c2 -n7 nice -n19 dspace index-discovery -b +``` + +- Export new list of all authors from CGSpace database to send to Peter: + +``` +dspace=# \copy (select distinct text_value, count(*) as count from metadatavalue where metadata_field_id = (select metadata_field_id from metadatafieldregistry where element = 'contributor' and qualifier = 'author') AND resource_type_id = 2 group by text_value order by count desc) to /tmp/2019-05-27-all-authors.csv with csv header; +COPY 64871 +``` + +- Run all system updates on DSpace Test (linode19) and reboot it + diff --git a/docs/2019-04/index.html b/docs/2019-04/index.html index f58798fdb..5e89298bf 100644 --- a/docs/2019-04/index.html +++ b/docs/2019-04/index.html @@ -38,7 +38,7 @@ $ ./delete-metadata-values.py -i /tmp/2019-02-21-delete-1-region.csv -db dspace - + @@ -81,9 +81,9 @@ $ ./delete-metadata-values.py -i /tmp/2019-02-21-delete-1-region.csv -db dspace "@type": "BlogPosting", "headline": "April, 2019", "url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-04\/", - "wordCount": "6800", + "wordCount": "6799", "datePublished": "2019-04-01T09:00:43\x2b03:00", - "dateModified": "2019-04-30T11:39:09\x2b03:00", + "dateModified": "2019-05-27T12:04:14\x2b03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -1339,7 +1339,7 @@ item_id | submitter_id | in_archive | withdrawn | last_modified | o diff --git a/docs/2019-05/index.html b/docs/2019-05/index.html index 54e253618..97c86488d 100644 --- a/docs/2019-05/index.html +++ b/docs/2019-05/index.html @@ -28,7 +28,7 @@ But after this I tried to delete the item from the XMLUI and it is still present - + @@ -61,9 +61,9 @@ But after this I tried to delete the item from the XMLUI and it is still present "@type": "BlogPosting", "headline": "May, 2019", "url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-05\/", - "wordCount": "2874", + "wordCount": "3023", "datePublished": "2019-05-01T07:37:43\x2b03:00", - "dateModified": "2019-05-24T12:27:22\x2b03:00", + "dateModified": "2019-05-25T14:17:27\x2b03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -649,6 +649,33 @@ $ ./delete-metadata-values.py -i /tmp/2019-05-17-delete-14-Investors.csv -db dsp +

2019-05-27

+ + + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index 9dfa572db..f03471dfb 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,36 +4,36 @@ https://alanorth.github.io/cgspace-notes/ - 2019-05-24T12:27:22+03:00 + 2019-05-27T12:04:14+03:00 0 https://alanorth.github.io/cgspace-notes/2019-05/ - 2019-05-24T12:27:22+03:00 + 2019-05-25T14:17:27+03:00 https://alanorth.github.io/cgspace-notes/tags/notes/ - 2019-05-24T12:27:22+03:00 + 2019-05-27T12:04:14+03:00 0 https://alanorth.github.io/cgspace-notes/posts/ - 2019-05-24T12:27:22+03:00 + 2019-05-27T12:04:14+03:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2019-05-24T12:27:22+03:00 + 2019-05-27T12:04:14+03:00 0 https://alanorth.github.io/cgspace-notes/2019-04/ - 2019-04-30T11:39:09+03:00 + 2019-05-27T12:04:14+03:00