From 8c8e87828ec1828f4bbf1078c189c9f5beef7eb4 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Thu, 23 Jul 2020 12:32:11 +0300 Subject: [PATCH] Add notes for 2020-07-23 --- content/posts/2020-07.md | 22 ++++++++++++++++++++ docs/2020-07/index.html | 27 ++++++++++++++++++++++--- docs/categories/index.html | 2 +- docs/categories/notes/index.html | 2 +- docs/categories/notes/page/2/index.html | 2 +- docs/categories/notes/page/3/index.html | 2 +- docs/categories/notes/page/4/index.html | 2 +- docs/index.html | 2 +- docs/page/2/index.html | 2 +- docs/page/3/index.html | 2 +- docs/page/4/index.html | 2 +- docs/page/5/index.html | 2 +- docs/page/6/index.html | 2 +- docs/posts/index.html | 2 +- docs/posts/page/2/index.html | 2 +- docs/posts/page/3/index.html | 2 +- docs/posts/page/4/index.html | 2 +- docs/posts/page/5/index.html | 2 +- docs/posts/page/6/index.html | 2 +- docs/sitemap.xml | 10 ++++----- 20 files changed, 68 insertions(+), 25 deletions(-) diff --git a/content/posts/2020-07.md b/content/posts/2020-07.md index c17812ba9..1e7e34142 100644 --- a/content/posts/2020-07.md +++ b/content/posts/2020-07.md @@ -648,5 +648,27 @@ OpenRXV harvesting bot; https://github.com/ilri/OpenRXV - [COUNTER_Robots_list.json: Remove anchors from okhttp](https://github.com/atmire/COUNTER-Robots/pull/33) - I will update the agent patterns on the CGSpace `5_x-prod` and 6.x branches - Make some changes to the Bootstrap CSS and HTML configuration to improve readability and style on the CG Core v2 metadata reference guide and send a pull request to Marie ([#29](https://github.com/AgriculturalSemantics/cg-core/pull/29)) +- The `solr-upgrade-statistics-6x` tool keeps crashing due to memory issues when processing 2018 stats + - I reduced the number of records per batch from 10,000 to 5,000 and increased the memory to 3072 and it still crashes... + - I reduced the number of records per batch to 1,000 and it works, but still took like twenty minutes before it even started! 
+ - Eventually after processing a few million records it crashed with this error: + +``` +Exception: Error while creating field 'p_group_id{type=uuid,properties=indexed,stored,multiValued}' from value '10' +org.apache.solr.client.solrj.impl.HttpSolrServer$RemoteSolrException: Error while creating field 'p_group_id{type=uuid,properties=indexed,stored,multiValued}' from value '10' +``` + +- There were four records so I deleted them: + +``` +$ curl -s "http://localhost:8081/solr/statistics-2018/update?softCommit=true" -H "Content-Type: text/xml" --data-binary '<delete><query>id:10</query></delete>' +``` + +- Meeting with Moayad and Peter and Abenet to discuss the latest AReS changes + +## 2020-07-23 + +- I closed all issues in the [OpenRXV](https://github.com/ilri/OpenRXV/issues) and [AReS](https://github.com/ilri/AReS/issues) GitHub repositories with screenshots so that Moayad can use them for his invoice +- The statistics-2018 core always crashes with the same error even after I deleted the "id:10" records... diff --git a/docs/2020-07/index.html b/docs/2020-07/index.html index 75857aa12..bfebbaad2 100644 --- a/docs/2020-07/index.html +++ b/docs/2020-07/index.html @@ -20,7 +20,7 @@ Since I was restarting Tomcat anyways I decided to redeploy the latest changes f - + @@ -45,9 +45,9 @@ Since I was restarting Tomcat anyways I decided to redeploy the latest changes f "@type": "BlogPosting", "headline": "July, 2020", "url": "https://alanorth.github.io/cgspace-notes/2020-07/", - "wordCount": "4195", + "wordCount": "4352", "datePublished": "2020-07-01T10:53:54+03:00", - "dateModified": "2020-07-21T13:44:52+03:00", + "dateModified": "2020-07-22T11:00:40+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -782,6 +782,27 @@ $ chrt -b 0 dspace solr-upgrade-statistics-6x -n 1000000 -i statistics-2018
  • I will update the agent patterns on the CGSpace 5_x-prod and 6.x branches
  • Make some changes to the Bootstrap CSS and HTML configuration to improve readability and style on the CG Core v2 metadata reference guide and send a pull request to Marie (#29)
  • +
  • The solr-upgrade-statistics-6x tool keeps crashing due to memory issues when processing 2018 stats + +
  • + +
    Exception: Error while creating field 'p_group_id{type=uuid,properties=indexed,stored,multiValued}' from value '10'
    +org.apache.solr.client.solrj.impl.HttpSolrServer$RemoteSolrException: Error while creating field 'p_group_id{type=uuid,properties=indexed,stored,multiValued}' from value '10'
    +
    +
    $ curl -s "http://localhost:8081/solr/statistics-2018/update?softCommit=true" -H "Content-Type: text/xml" --data-binary '<delete><query>id:10</query></delete>'
    +
    +

    2020-07-23

    + diff --git a/docs/categories/index.html b/docs/categories/index.html index 303182b3b..2609cbd4e 100644 --- a/docs/categories/index.html +++ b/docs/categories/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/categories/notes/index.html b/docs/categories/notes/index.html index 51a1bad50..755f2cf17 100644 --- a/docs/categories/notes/index.html +++ b/docs/categories/notes/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/categories/notes/page/2/index.html b/docs/categories/notes/page/2/index.html index c17323b22..860dbbf10 100644 --- a/docs/categories/notes/page/2/index.html +++ b/docs/categories/notes/page/2/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/categories/notes/page/3/index.html b/docs/categories/notes/page/3/index.html index 3e36722cc..3cb2fb86d 100644 --- a/docs/categories/notes/page/3/index.html +++ b/docs/categories/notes/page/3/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/categories/notes/page/4/index.html b/docs/categories/notes/page/4/index.html index 943b91383..9a754cc64 100644 --- a/docs/categories/notes/page/4/index.html +++ b/docs/categories/notes/page/4/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/index.html b/docs/index.html index 5102f828c..9765272a0 100644 --- a/docs/index.html +++ b/docs/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/2/index.html b/docs/page/2/index.html index b7a7c2fc0..cd35110dc 100644 --- a/docs/page/2/index.html +++ b/docs/page/2/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/3/index.html b/docs/page/3/index.html index 1d4e07f69..8e2b37b15 100644 --- a/docs/page/3/index.html +++ b/docs/page/3/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/4/index.html b/docs/page/4/index.html index 3104c1a85..8e5ba23f2 100644 --- a/docs/page/4/index.html +++ b/docs/page/4/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/page/5/index.html b/docs/page/5/index.html index c8e73f88b..971a53d46 100644 --- a/docs/page/5/index.html +++ b/docs/page/5/index.html @@ -9,7 +9,7 @@ - + diff --git 
a/docs/page/6/index.html b/docs/page/6/index.html index 8393f58c0..b17857550 100644 --- a/docs/page/6/index.html +++ b/docs/page/6/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/index.html b/docs/posts/index.html index 5bf31541c..dcdc61176 100644 --- a/docs/posts/index.html +++ b/docs/posts/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/2/index.html b/docs/posts/page/2/index.html index 79e92274b..4601855f6 100644 --- a/docs/posts/page/2/index.html +++ b/docs/posts/page/2/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/3/index.html b/docs/posts/page/3/index.html index 95560a4e8..15908d569 100644 --- a/docs/posts/page/3/index.html +++ b/docs/posts/page/3/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/4/index.html b/docs/posts/page/4/index.html index edc965d4c..a43552cb2 100644 --- a/docs/posts/page/4/index.html +++ b/docs/posts/page/4/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/5/index.html b/docs/posts/page/5/index.html index 1fc3c8e9d..3b65a9424 100644 --- a/docs/posts/page/5/index.html +++ b/docs/posts/page/5/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/posts/page/6/index.html b/docs/posts/page/6/index.html index 26f179c86..8e3fe5797 100644 --- a/docs/posts/page/6/index.html +++ b/docs/posts/page/6/index.html @@ -9,7 +9,7 @@ - + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index f1b25b710..16cd3811b 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,27 +4,27 @@ https://alanorth.github.io/cgspace-notes/categories/ - 2020-07-21T13:44:52+03:00 + 2020-07-22T11:00:40+03:00 https://alanorth.github.io/cgspace-notes/ - 2020-07-21T13:44:52+03:00 + 2020-07-22T11:00:40+03:00 https://alanorth.github.io/cgspace-notes/2020-07/ - 2020-07-21T13:44:52+03:00 + 2020-07-22T11:00:40+03:00 https://alanorth.github.io/cgspace-notes/categories/notes/ - 2020-07-21T13:44:52+03:00 + 2020-07-22T11:00:40+03:00 https://alanorth.github.io/cgspace-notes/posts/ - 2020-07-21T13:44:52+03:00 + 2020-07-22T11:00:40+03:00