From 64d5b998f916afc3f9250c0adc1b5a0b395e6bc1 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Tue, 23 Aug 2022 12:14:14 -0700 Subject: [PATCH] Add notes for 2022-08-23 --- content/posts/2022-08.md | 39 ++++++++++++++++++++ docs/2022-08/index.html | 47 +++++++++++++++++++++++-- docs/categories/index.html | 2 +- docs/categories/notes/index.html | 2 +- docs/categories/notes/page/2/index.html | 2 +- docs/categories/notes/page/3/index.html | 2 +- docs/categories/notes/page/4/index.html | 2 +- docs/categories/notes/page/5/index.html | 2 +- docs/categories/notes/page/6/index.html | 2 +- docs/categories/notes/page/7/index.html | 2 +- docs/index.html | 2 +- docs/page/2/index.html | 2 +- docs/page/3/index.html | 2 +- docs/page/4/index.html | 2 +- docs/page/5/index.html | 2 +- docs/page/6/index.html | 2 +- docs/page/7/index.html | 2 +- docs/page/8/index.html | 2 +- docs/page/9/index.html | 2 +- docs/posts/index.html | 2 +- docs/posts/page/2/index.html | 2 +- docs/posts/page/3/index.html | 2 +- docs/posts/page/4/index.html | 2 +- docs/posts/page/5/index.html | 2 +- docs/posts/page/6/index.html | 2 +- docs/posts/page/7/index.html | 2 +- docs/posts/page/8/index.html | 2 +- docs/posts/page/9/index.html | 2 +- docs/sitemap.xml | 10 +++--- 29 files changed, 114 insertions(+), 34 deletions(-) diff --git a/content/posts/2022-08.md b/content/posts/2022-08.md index 92a68fe31..ea59f423a 100644 --- a/content/posts/2022-08.md +++ b/content/posts/2022-08.md @@ -209,4 +209,43 @@ return "||".join(res) - Then I finished adding the `dcterms.relation` and CRP metadata flagged by Peter on the Gender presentations - I'm waiting for him to send me the PDFs and then I will upload them to DSpace Test +## 2022-08-21 + +- Start indexing on AReS +- The load on CGSpace was around 5.0 today, and now that I started the harvesting it's over 10 for an hour now, sigh... + - I'm going to try an experiment to block Googlebot, bingbot, and Yandex for a week to see if the load goes down + +## 2022-08-22 + +- I tried to re-generate the SAF bundle for the MARLO Innovations after improving the AGROVOC subjects and the v3 PDFs, but six are missing from the v3 zip that are present in the original zip: + - ProjectInnovationSummary-WLE-P500-I78.pdf + - ProjectInnovationSummary-WLE-P452-I699.pdf + - ProjectInnovationSummary-WLE-P518-I696.pdf + - ProjectInnovationSummary-WLE-P442-I740.pdf + - ProjectInnovationSummary-WLE-P516-I647.pdf + - ProjectInnovationSummary-WLE-P438-I585.pdf +- I downloaded them manually using the URLs in the original CSV +- I also uploaded a new version of the MELIAs to DSpace Test + +## 2022-08-23 + +- Checking the number of items on CGSpace so we can keep an eye on the 100,000 number: + +```console +dspace=# SELECT COUNT(uuid) FROM item WHERE in_archive='t'; + count +------- + 95716 +(1 row) +``` + +- If I check OAI I see more, but perhaps that counts mapped items multiple times +- Peter said the 303 Gender PPTs were good to go, so I updated the collection mappings and IDs in OpenRefine and then uploaded them to CGSpace: + +```console +$ dspace import --add --eperson=fuu@fuu.com --source /tmp/SimpleArchiveFormat --mapfile=./2022-08-23-gender-ppts.map +``` + +- I created a [GitHub issue for OpenRXV compatibility issues with DSpace 7](https://github.com/ilri/OpenRXV/issues/133) + diff --git a/docs/2022-08/index.html b/docs/2022-08/index.html index 3c2e4398c..b3667b9eb 100644 --- a/docs/2022-08/index.html +++ b/docs/2022-08/index.html @@ -14,7 +14,7 @@ Our request to add CC-BY-3.0-IGO to SPDX was approved a few weeks ago - + @@ -34,9 +34,9 @@ Our request to add CC-BY-3.0-IGO to SPDX was approved a few weeks ago "@type": "BlogPosting", "headline": "August, 2022", "url": "https://alanorth.github.io/cgspace-notes/2022-08/", - "wordCount": "1862", + "wordCount": "2068", "datePublished": "2022-08-01T10:22:36+03:00", - "dateModified": "2022-08-19T21:55:36-07:00", + "dateModified": "2022-08-20T22:37:35-07:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -354,6 +354,47 @@ Our request to add CC-BY-3.0-IGO to SPDX was approved a few weeks ago +

2022-08-21

+ +

2022-08-22

+ +

2022-08-23

+ +
dspace=# SELECT COUNT(uuid) FROM item WHERE in_archive='t';
+ count 
+-------
+ 95716
+(1 row)
+
+
$ dspace import --add --eperson=fuu@fuu.com --source /tmp/SimpleArchiveFormat --mapfile=./2022-08-23-gender-ppts.map
+
diff --git a/docs/categories/index.html b/docs/categories/index.html index 6a2d772e3..03e01d14e 100644 --- a/docs/categories/index.html +++ b/docs/categories/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/index.html b/docs/categories/notes/index.html index b3c914fdf..1b02125ea 100644 --- a/docs/categories/notes/index.html +++ b/docs/categories/notes/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/2/index.html b/docs/categories/notes/page/2/index.html index 6f09d7636..53ba87018 100644 --- a/docs/categories/notes/page/2/index.html +++ b/docs/categories/notes/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/3/index.html b/docs/categories/notes/page/3/index.html index 0850149ac..9dd09ec79 100644 --- a/docs/categories/notes/page/3/index.html +++ b/docs/categories/notes/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/4/index.html b/docs/categories/notes/page/4/index.html index 59126843b..c66cb372d 100644 --- a/docs/categories/notes/page/4/index.html +++ b/docs/categories/notes/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/5/index.html b/docs/categories/notes/page/5/index.html index 8b37d429d..102cca294 100644 --- a/docs/categories/notes/page/5/index.html +++ b/docs/categories/notes/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/6/index.html b/docs/categories/notes/page/6/index.html index af13dac32..3ee93ed35 100644 --- a/docs/categories/notes/page/6/index.html +++ b/docs/categories/notes/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/7/index.html b/docs/categories/notes/page/7/index.html index 5c17ec54c..59d45cf7d 100644 --- a/docs/categories/notes/page/7/index.html +++ b/docs/categories/notes/page/7/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/index.html b/docs/index.html index 5c048ec24..e3f9bf770 100644 --- a/docs/index.html +++ b/docs/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/2/index.html b/docs/page/2/index.html index 90f96ae8f..80d907d58 100644 --- a/docs/page/2/index.html +++ b/docs/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/3/index.html b/docs/page/3/index.html index 10d76b476..e0add7fa5 100644 --- a/docs/page/3/index.html +++ b/docs/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/4/index.html b/docs/page/4/index.html index 5dd27bd2c..3309e40ca 100644 --- a/docs/page/4/index.html +++ b/docs/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/5/index.html b/docs/page/5/index.html index a2d8cb213..373f751ea 100644 --- a/docs/page/5/index.html +++ b/docs/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/6/index.html b/docs/page/6/index.html index 5f7cf63b1..6df6025f9 100644 --- a/docs/page/6/index.html +++ b/docs/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/7/index.html b/docs/page/7/index.html index ad3155e2f..878b859e0 100644 --- a/docs/page/7/index.html +++ b/docs/page/7/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/8/index.html b/docs/page/8/index.html index eef5951d4..e9bf18a8a 100644 --- a/docs/page/8/index.html +++ b/docs/page/8/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/9/index.html b/docs/page/9/index.html index 57d04a6fe..6bfd5235b 100644 --- a/docs/page/9/index.html +++ b/docs/page/9/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/index.html b/docs/posts/index.html index 0d33652fa..450903703 100644 --- a/docs/posts/index.html +++ b/docs/posts/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/2/index.html b/docs/posts/page/2/index.html index 5778bb4ea..5d446685e 100644 --- a/docs/posts/page/2/index.html +++ b/docs/posts/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/3/index.html b/docs/posts/page/3/index.html index c9c1fee45..18b10e3c3 100644 --- a/docs/posts/page/3/index.html +++ b/docs/posts/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/4/index.html b/docs/posts/page/4/index.html index a26f92a55..838630c09 100644 --- a/docs/posts/page/4/index.html +++ b/docs/posts/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/5/index.html b/docs/posts/page/5/index.html index b0ba8623b..bc03bd5ff 100644 --- a/docs/posts/page/5/index.html +++ b/docs/posts/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/6/index.html b/docs/posts/page/6/index.html index b6fb856e6..fd5fc5b02 100644 --- a/docs/posts/page/6/index.html +++ b/docs/posts/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/7/index.html b/docs/posts/page/7/index.html index 0c2a1d522..30bdc2fe4 100644 --- a/docs/posts/page/7/index.html +++ b/docs/posts/page/7/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/8/index.html b/docs/posts/page/8/index.html index 743562ce0..dbaee2c65 100644 --- a/docs/posts/page/8/index.html +++ b/docs/posts/page/8/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/9/index.html b/docs/posts/page/9/index.html index 632b6a85f..5d75b7206 100644 --- a/docs/posts/page/9/index.html +++ b/docs/posts/page/9/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index e08ea14df..1c36ce00f 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -3,19 +3,19 @@ xmlns:xhtml="http://www.w3.org/1999/xhtml"> https://alanorth.github.io/cgspace-notes/2022-08/ - 2022-08-19T21:55:36-07:00 + 2022-08-20T22:37:35-07:00 https://alanorth.github.io/cgspace-notes/categories/ - 2022-08-19T21:55:36-07:00 + 2022-08-20T22:37:35-07:00 https://alanorth.github.io/cgspace-notes/ - 2022-08-19T21:55:36-07:00 + 2022-08-20T22:37:35-07:00 https://alanorth.github.io/cgspace-notes/categories/notes/ - 2022-08-19T21:55:36-07:00 + 2022-08-20T22:37:35-07:00 https://alanorth.github.io/cgspace-notes/posts/ - 2022-08-19T21:55:36-07:00 + 2022-08-20T22:37:35-07:00 https://alanorth.github.io/cgspace-notes/2022-07/ 2022-07-31T15:49:35+03:00