From 0fafc7a6264bbd5986c5ac222e3ad7c9bbb2e8a9 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Wed, 30 May 2018 14:48:10 -0700 Subject: [PATCH] Update notes --- content/posts/2018-05.md | 9 +++++++++ docs/2018-05/index.html | 16 +++++++++++++--- docs/sitemap.xml | 10 +++++----- 3 files changed, 27 insertions(+), 8 deletions(-) diff --git a/content/posts/2018-05.md b/content/posts/2018-05.md index c7b50e3c0..aa08acfb0 100644 --- a/content/posts/2018-05.md +++ b/content/posts/2018-05.md @@ -356,3 +356,12 @@ dspace=# select email, netid from eperson where email not like '%cgiar.org%' and - It might be possible to adjust some things, but eventually we'll need a larger VPS instance - For some reason there are no JVM stats in Munin, ugh - Run all system updates on DSpace Test and reboot it +- I generated a list of CIFOR duplicates from the `CIFOR_May_9` collection using the Atmire MQM module and then dumped the HTML source so I could process it for sending to Vika +- I used grep to filter all relevant handle lines from the HTML source then used sed to insert a newline before each "Item1" line (as the duplicates are grouped like Item1, Item2, Item3 for each set of duplicates): + +``` +$ grep -E 'aspect.duplicatechecker.DuplicateResults.field.del_handle_[0-9]{1,3}_Item' ~/Desktop/https\ _dspacetest.cgiar.org_atmire_metadata-quality_duplicate-checker.html > ~/cifor-duplicates.txt +$ sed 's/.*Item1.*/\n&/g' ~/cifor-duplicates.txt > ~/cifor-duplicates-cleaned.txt +``` + +- I told Vika to look through the list manually and indicate which ones are indeed duplicates that we should delete, and which ones to map to CIFOR's collection diff --git a/docs/2018-05/index.html b/docs/2018-05/index.html index 0c268e30f..c0b4b058a 100644 --- a/docs/2018-05/index.html +++ b/docs/2018-05/index.html @@ -27,7 +27,7 @@ Also, I switched it to use OpenJDK instead of Oracle Java, as well as re-worked - + @@ -65,9 +65,9 @@ Also, I switched it to use OpenJDK instead of Oracle Java, as well as 
re-worked "@type": "BlogPosting", "headline": "May, 2018", "url": "https://alanorth.github.io/cgspace-notes/2018-05/", - "wordCount": "3024", + "wordCount": "3135", "datePublished": "2018-05-01T16:43:54+03:00", - "dateModified": "2018-05-30T09:05:40-07:00", + "dateModified": "2018-05-30T10:50:55-07:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -555,6 +555,16 @@ $ ./bin/post -c countries ~/src/git/DSpace/2018-05-10-countries.csv
  • It might be possible to adjust some things, but eventually we’ll need a larger VPS instance
  • For some reason there are no JVM stats in Munin, ugh
  • Run all system updates on DSpace Test and reboot it
  • +
  • I generated a list of CIFOR duplicates from the CIFOR_May_9 collection using the Atmire MQM module, then dumped the HTML source so I could process it before sending it to Vika
  • +
  • I used grep to filter all relevant handle lines from the HTML source, then used sed to insert a blank line before each “Item1” line (the duplicates are grouped as Item1, Item2, Item3 within each set of duplicates, so this separates the sets):
  • + + +
    $ grep -E 'aspect.duplicatechecker.DuplicateResults.field.del_handle_[0-9]{1,3}_Item' ~/Desktop/https\ _dspacetest.cgiar.org_atmire_metadata-quality_duplicate-checker.html > ~/cifor-duplicates.txt
    +$ sed 's/.*Item1.*/\n&/g' ~/cifor-duplicates.txt > ~/cifor-duplicates-cleaned.txt
    +
    + + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index abc6ab005..44eb28bf8 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,7 +4,7 @@ https://alanorth.github.io/cgspace-notes/2018-05/ - 2018-05-30T09:05:40-07:00 + 2018-05-30T10:50:55-07:00 @@ -164,7 +164,7 @@ https://alanorth.github.io/cgspace-notes/ - 2018-05-30T09:05:40-07:00 + 2018-05-30T10:50:55-07:00 0 @@ -175,7 +175,7 @@ https://alanorth.github.io/cgspace-notes/tags/notes/ - 2018-05-30T09:05:40-07:00 + 2018-05-30T10:50:55-07:00 0 @@ -187,13 +187,13 @@ https://alanorth.github.io/cgspace-notes/posts/ - 2018-05-30T09:05:40-07:00 + 2018-05-30T10:50:55-07:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2018-05-30T09:05:40-07:00 + 2018-05-30T10:50:55-07:00 0