From e478850def7b86da685f93f10a478d485f5b3dc5 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Mon, 30 May 2022 16:00:02 +0300 Subject: [PATCH] Add notes for 2022-05-30 --- content/posts/2022-05.md | 21 ++++++++++++++++++++ docs/2022-05/index.html | 26 ++++++++++++++++++++++--- docs/categories/index.html | 2 +- docs/categories/notes/index.html | 2 +- docs/categories/notes/page/2/index.html | 2 +- docs/categories/notes/page/3/index.html | 2 +- docs/categories/notes/page/4/index.html | 2 +- docs/categories/notes/page/5/index.html | 2 +- docs/categories/notes/page/6/index.html | 2 +- docs/index.html | 2 +- docs/page/2/index.html | 2 +- docs/page/3/index.html | 2 +- docs/page/4/index.html | 2 +- docs/page/5/index.html | 2 +- docs/page/6/index.html | 2 +- docs/page/7/index.html | 2 +- docs/page/8/index.html | 2 +- docs/page/9/index.html | 2 +- docs/posts/index.html | 2 +- docs/posts/page/2/index.html | 2 +- docs/posts/page/3/index.html | 2 +- docs/posts/page/4/index.html | 2 +- docs/posts/page/5/index.html | 2 +- docs/posts/page/6/index.html | 2 +- docs/posts/page/7/index.html | 2 +- docs/posts/page/8/index.html | 2 +- docs/posts/page/9/index.html | 2 +- docs/sitemap.xml | 10 +++++----- 28 files changed, 74 insertions(+), 33 deletions(-) diff --git a/content/posts/2022-05.md b/content/posts/2022-05.md index f2736da06..e39354821 100644 --- a/content/posts/2022-05.md +++ b/content/posts/2022-05.md @@ -232,4 +232,25 @@ Would fix 34 occurences of: Martha Lilia Del Río Duque: 0000-0002-0879-0292 - Start a harvest on AReS +## 2022-05-30 + +- Help IITA with some collection authorization issues on CGSpace +- Finally looking into Peter's Altmetric export from 2022-02 + - We want to try to compare some of the information about open access status with that in CGSpace + - I created a new column for all items that have CGSpace handles using this GREL: + +```console +"https://hdl.handle.net/" + value.match(/.*?(10568\/\d+).*?/)[0] +``` + +- With that I can do a join on the CGSpace 
metadata and perhaps clean up some items + +```console +$ ./bin/dspace metadata-export -f 2022-05-30-cgspace.csv +$ csvcut -c 'id,dc.identifier.uri[en_US],dcterms.accessRights[en_US],dcterms.license[en_US]' 2022-05-30-cgspace.csv | sed '1 s/dc\.identifier\.uri\[en_US\]/dc.identifier.uri/' > /tmp/cgspace.csv +$ csvjoin -c 'dc.identifier.uri' ~/Downloads/2022-05-30-Altmetric-Research-Outputs-CGSpace.csv /tmp/cgspace.csv > /tmp/cgspace-altmetric.csv +``` + +- Examining the data in OpenRefine, I spot-checked a few records where Altmetric and CGSpace disagree, and in most cases I found Altmetric to be wrong... + diff --git a/docs/2022-05/index.html b/docs/2022-05/index.html index 794005c3f..1772bf9b3 100644 --- a/docs/2022-05/index.html +++ b/docs/2022-05/index.html @@ -35,7 +35,7 @@ I purged 93,974 hits from these IPs using my check-spider-ip-hits.sh script - + @@ -76,9 +76,9 @@ I purged 93,974 hits from these IPs using my check-spider-ip-hits.sh script "@type": "BlogPosting", "headline": "May, 2022", "url": "https://alanorth.github.io/cgspace-notes/2022-05/", - "wordCount": "1552", + "wordCount": "1673", "datePublished": "2022-05-04T09:13:39+03:00", - "dateModified": "2022-05-27T16:46:18+03:00", + "dateModified": "2022-05-28T18:25:00+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -404,6 +404,26 @@ I purged 93,974 hits from these IPs using my check-spider-ip-hits.sh script +

2022-05-30

+ +
"https://hdl.handle.net/" + value.match(/.*?(10568\/\d+).*?/)[0]
+
+
$ ./bin/dspace metadata-export -f 2022-05-30-cgspace.csv
+$ csvcut -c 'id,dc.identifier.uri[en_US],dcterms.accessRights[en_US],dcterms.license[en_US]' 2022-05-30-cgspace.csv | sed '1 s/dc\.identifier\.uri\[en_US\]/dc.identifier.uri/' > /tmp/cgspace.csv
+$ csvjoin -c 'dc.identifier.uri' ~/Downloads/2022-05-30-Altmetric-Research-Outputs-CGSpace.csv /tmp/cgspace.csv > /tmp/cgspace-altmetric.csv
+
diff --git a/docs/categories/index.html b/docs/categories/index.html index cbab3132a..50e1bd1e1 100644 --- a/docs/categories/index.html +++ b/docs/categories/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/index.html b/docs/categories/notes/index.html index a46eb24b4..b55f1c363 100644 --- a/docs/categories/notes/index.html +++ b/docs/categories/notes/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/2/index.html b/docs/categories/notes/page/2/index.html index f61bad5d3..93fee745b 100644 --- a/docs/categories/notes/page/2/index.html +++ b/docs/categories/notes/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/3/index.html b/docs/categories/notes/page/3/index.html index 735e7f53c..7c9d35330 100644 --- a/docs/categories/notes/page/3/index.html +++ b/docs/categories/notes/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/4/index.html b/docs/categories/notes/page/4/index.html index 0895caedf..c6f8ab110 100644 --- a/docs/categories/notes/page/4/index.html +++ b/docs/categories/notes/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/5/index.html b/docs/categories/notes/page/5/index.html index 42de63c45..b4752f2b0 100644 --- a/docs/categories/notes/page/5/index.html +++ b/docs/categories/notes/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/6/index.html b/docs/categories/notes/page/6/index.html index 375dd4b9a..10faca58f 100644 --- a/docs/categories/notes/page/6/index.html +++ b/docs/categories/notes/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/index.html b/docs/index.html index c1c43c031..be03b0731 100644 --- a/docs/index.html +++ b/docs/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/2/index.html b/docs/page/2/index.html index ac81588ea..360be40e6 100644 --- a/docs/page/2/index.html +++ b/docs/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/3/index.html 
b/docs/page/3/index.html index 9e004bc13..f43a6e210 100644 --- a/docs/page/3/index.html +++ b/docs/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/4/index.html b/docs/page/4/index.html index 7388604f7..01128d030 100644 --- a/docs/page/4/index.html +++ b/docs/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/5/index.html b/docs/page/5/index.html index 09194bbe8..8ebd2b0fb 100644 --- a/docs/page/5/index.html +++ b/docs/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/6/index.html b/docs/page/6/index.html index 096694ff2..763fb0324 100644 --- a/docs/page/6/index.html +++ b/docs/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/7/index.html b/docs/page/7/index.html index 93cae2117..298877f2f 100644 --- a/docs/page/7/index.html +++ b/docs/page/7/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/8/index.html b/docs/page/8/index.html index 7584d8b0f..5ffb789bf 100644 --- a/docs/page/8/index.html +++ b/docs/page/8/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/9/index.html b/docs/page/9/index.html index 5f354c5b8..496cd2ae0 100644 --- a/docs/page/9/index.html +++ b/docs/page/9/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/index.html b/docs/posts/index.html index e28eb2e0c..3e1f6cffc 100644 --- a/docs/posts/index.html +++ b/docs/posts/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/2/index.html b/docs/posts/page/2/index.html index 5c6072331..eadee9c1f 100644 --- a/docs/posts/page/2/index.html +++ b/docs/posts/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/3/index.html b/docs/posts/page/3/index.html index 9a123c2dd..25defce2a 100644 --- a/docs/posts/page/3/index.html +++ b/docs/posts/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/4/index.html b/docs/posts/page/4/index.html index ea666cfc9..31f6babd5 100644 --- a/docs/posts/page/4/index.html +++ b/docs/posts/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/5/index.html 
b/docs/posts/page/5/index.html index 193af1c1e..8d45af10b 100644 --- a/docs/posts/page/5/index.html +++ b/docs/posts/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/6/index.html b/docs/posts/page/6/index.html index 86ae75498..a543b01f0 100644 --- a/docs/posts/page/6/index.html +++ b/docs/posts/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/7/index.html b/docs/posts/page/7/index.html index 724e7778f..070cdf1bf 100644 --- a/docs/posts/page/7/index.html +++ b/docs/posts/page/7/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/8/index.html b/docs/posts/page/8/index.html index 62fb95f30..e1579bebc 100644 --- a/docs/posts/page/8/index.html +++ b/docs/posts/page/8/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/9/index.html b/docs/posts/page/9/index.html index d0efc00cd..3c99fb121 100644 --- a/docs/posts/page/9/index.html +++ b/docs/posts/page/9/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index 0b4d34500..61108c163 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -3,19 +3,19 @@ xmlns:xhtml="http://www.w3.org/1999/xhtml"> https://alanorth.github.io/cgspace-notes/categories/ - 2022-05-27T16:46:18+03:00 + 2022-05-28T18:25:00+03:00 https://alanorth.github.io/cgspace-notes/ - 2022-05-27T16:46:18+03:00 + 2022-05-28T18:25:00+03:00 https://alanorth.github.io/cgspace-notes/2022-05/ - 2022-05-27T16:46:18+03:00 + 2022-05-28T18:25:00+03:00 https://alanorth.github.io/cgspace-notes/categories/notes/ - 2022-05-27T16:46:18+03:00 + 2022-05-28T18:25:00+03:00 https://alanorth.github.io/cgspace-notes/posts/ - 2022-05-27T16:46:18+03:00 + 2022-05-28T18:25:00+03:00 https://alanorth.github.io/cgspace-notes/2022-04/ 2022-05-04T11:09:45+03:00