diff --git a/content/posts/2023-03.md b/content/posts/2023-03.md index 41c710040..8cdcc0fc9 100644 --- a/content/posts/2023-03.md +++ b/content/posts/2023-03.md @@ -455,4 +455,41 @@ $ psql dspace < /tmp/reindex.sql - After playing with WebP at Q82 and Q92, I see it has lower ssimulacra2 scores than JPEG Q92 for the dozen test files - Could it just be something with ImageMagick? +## 2023-03-22 + +- I updated csv-metadata-quality to use pandas 2.0.0rc1 and everything seems to work...? + - So the issues with nulls (isna) when I tried the first release candidate a few weeks ago were resolved? +- Meeting with Jawoo and others about a "ChatGPT-like" thing for CGIAR data using CGSpace documents and metadata + +## 2023-03-23 + +- Add a missing IFPRI ORCID identifier to CGSpace and tag his items on CGSpace +- A super unscientific comparison between csv-metadata-quality's pytest regimen using Pandas 1.5.3 and Pandas 2.0.0rc1 + - The data was gathered using [rusage](https://justine.lol/rusage), and these are the results of the last of three consecutive runs: + +``` +# Pandas 1.5.3 +RL: took 1,585,999µs wall time +RL: ballooned to 272,380kb in size +RL: needed 2,093,947µs cpu (25% kernel) +RL: caused 55,856 page faults (100% memcpy) +RL: 699 context switches (1% consensual) +RL: performed 0 reads and 16 write i/o operations + +# Pandas 2.0.0rc1 +RL: took 1,625,718µs wall time +RL: ballooned to 262,116kb in size +RL: needed 2,148,425µs cpu (24% kernel) +RL: caused 63,934 page faults (100% memcpy) +RL: 461 context switches (2% consensual) +RL: performed 0 reads and 16 write i/o operations +``` + +- So it seems that Pandas 2.0.0rc1 took ten megabytes less RAM... 
interesting to see that the PyArrow-backed dtypes make a measurable difference even on my small test set + - I should try to compare runs of larger input files + +## 2023-03-24 + +- I added a Flyway SQL migration for the PNG bitstream format registry changes on DSpace 7.6 + diff --git a/docs/2023-03/index.html b/docs/2023-03/index.html index 822186344..8760c6936 100644 --- a/docs/2023-03/index.html +++ b/docs/2023-03/index.html @@ -16,7 +16,7 @@ I finally got through with porting the input form from DSpace 6 to DSpace 7 - + @@ -38,9 +38,9 @@ I finally got through with porting the input form from DSpace 6 to DSpace 7 "@type": "BlogPosting", "headline": "March, 2023", "url": "https://alanorth.github.io/cgspace-notes/2023-03/", - "wordCount": "3229", + "wordCount": "3464", "datePublished": "2023-03-01T07:58:36+03:00", - "dateModified": "2023-03-21T16:35:41+03:00", + "dateModified": "2023-03-22T08:28:33+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -619,6 +619,50 @@ pd.options.mode.nullable_dtypes = True +

2023-03-22

+ +

2023-03-23

+ +
# Pandas 1.5.3
+RL: took 1,585,999µs wall time
+RL: ballooned to 272,380kb in size
+RL: needed 2,093,947µs cpu (25% kernel)
+RL: caused 55,856 page faults (100% memcpy)
+RL: 699 context switches (1% consensual)
+RL: performed 0 reads and 16 write i/o operations
+
+# Pandas 2.0.0rc1
+RL: took 1,625,718µs wall time
+RL: ballooned to 262,116kb in size
+RL: needed 2,148,425µs cpu (24% kernel)
+RL: caused 63,934 page faults (100% memcpy)
+RL: 461 context switches (2% consensual)
+RL: performed 0 reads and 16 write i/o operations
+
+

2023-03-24

+ diff --git a/docs/categories/index.html b/docs/categories/index.html index 54c95b8a3..93e653a55 100644 --- a/docs/categories/index.html +++ b/docs/categories/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/index.html b/docs/categories/notes/index.html index 862d32b9f..2f9550a47 100644 --- a/docs/categories/notes/index.html +++ b/docs/categories/notes/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/2/index.html b/docs/categories/notes/page/2/index.html index cf717abae..96706fbb4 100644 --- a/docs/categories/notes/page/2/index.html +++ b/docs/categories/notes/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/3/index.html b/docs/categories/notes/page/3/index.html index f85cd7682..a950f82bf 100644 --- a/docs/categories/notes/page/3/index.html +++ b/docs/categories/notes/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/4/index.html b/docs/categories/notes/page/4/index.html index 045703c87..8570a4d03 100644 --- a/docs/categories/notes/page/4/index.html +++ b/docs/categories/notes/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/5/index.html b/docs/categories/notes/page/5/index.html index 1c971fb4e..22b69838d 100644 --- a/docs/categories/notes/page/5/index.html +++ b/docs/categories/notes/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/6/index.html b/docs/categories/notes/page/6/index.html index 33d69908c..d58da095c 100644 --- a/docs/categories/notes/page/6/index.html +++ b/docs/categories/notes/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/categories/notes/page/7/index.html b/docs/categories/notes/page/7/index.html index 1dad5988c..8c21c704d 100644 --- a/docs/categories/notes/page/7/index.html +++ b/docs/categories/notes/page/7/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/index.html b/docs/index.html index 319837fe9..646964c48 100644 --- a/docs/index.html +++ b/docs/index.html @@ -10,7 
+10,7 @@ - + diff --git a/docs/page/10/index.html b/docs/page/10/index.html index 3e3f15fcf..0beccdcae 100644 --- a/docs/page/10/index.html +++ b/docs/page/10/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/2/index.html b/docs/page/2/index.html index 92b5d31a3..a3b745611 100644 --- a/docs/page/2/index.html +++ b/docs/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/3/index.html b/docs/page/3/index.html index 8dadccb8e..fcf4af40f 100644 --- a/docs/page/3/index.html +++ b/docs/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/4/index.html b/docs/page/4/index.html index 0616efeef..bba2fab9a 100644 --- a/docs/page/4/index.html +++ b/docs/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/5/index.html b/docs/page/5/index.html index 24d7235cf..0c361df6e 100644 --- a/docs/page/5/index.html +++ b/docs/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/6/index.html b/docs/page/6/index.html index 918dc56d0..362433a15 100644 --- a/docs/page/6/index.html +++ b/docs/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/7/index.html b/docs/page/7/index.html index 4cb44048e..3c346ad8f 100644 --- a/docs/page/7/index.html +++ b/docs/page/7/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/8/index.html b/docs/page/8/index.html index 22d3b96de..fa2838a96 100644 --- a/docs/page/8/index.html +++ b/docs/page/8/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/page/9/index.html b/docs/page/9/index.html index 1a3e49ea7..d79c6d92f 100644 --- a/docs/page/9/index.html +++ b/docs/page/9/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/index.html b/docs/posts/index.html index 378eb1fff..d231de0d4 100644 --- a/docs/posts/index.html +++ b/docs/posts/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/10/index.html b/docs/posts/page/10/index.html index f5189ed76..a29bd9644 100644 --- a/docs/posts/page/10/index.html +++ b/docs/posts/page/10/index.html @@ -10,7 +10,7 @@ - + diff --git 
a/docs/posts/page/2/index.html b/docs/posts/page/2/index.html index ed6c738ac..ff006163c 100644 --- a/docs/posts/page/2/index.html +++ b/docs/posts/page/2/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/3/index.html b/docs/posts/page/3/index.html index bb9b18f35..69a58f6fa 100644 --- a/docs/posts/page/3/index.html +++ b/docs/posts/page/3/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/4/index.html b/docs/posts/page/4/index.html index 92e4ae809..0bf5f2071 100644 --- a/docs/posts/page/4/index.html +++ b/docs/posts/page/4/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/5/index.html b/docs/posts/page/5/index.html index 287896bfa..e6d0f9d43 100644 --- a/docs/posts/page/5/index.html +++ b/docs/posts/page/5/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/6/index.html b/docs/posts/page/6/index.html index 09888fae7..bda2f205d 100644 --- a/docs/posts/page/6/index.html +++ b/docs/posts/page/6/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/7/index.html b/docs/posts/page/7/index.html index c38d95b8f..6b43b77eb 100644 --- a/docs/posts/page/7/index.html +++ b/docs/posts/page/7/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/8/index.html b/docs/posts/page/8/index.html index 84f6f36c1..b65029752 100644 --- a/docs/posts/page/8/index.html +++ b/docs/posts/page/8/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/posts/page/9/index.html b/docs/posts/page/9/index.html index ea88183bd..1f0d91b62 100644 --- a/docs/posts/page/9/index.html +++ b/docs/posts/page/9/index.html @@ -10,7 +10,7 @@ - + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index 0f6193e85..d171f8983 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -3,19 +3,19 @@ xmlns:xhtml="http://www.w3.org/1999/xhtml"> https://alanorth.github.io/cgspace-notes/categories/ - 2023-03-21T16:35:41+03:00 + 2023-03-22T08:28:33+03:00 https://alanorth.github.io/cgspace-notes/ - 2023-03-21T16:35:41+03:00 + 2023-03-22T08:28:33+03:00 
https://alanorth.github.io/cgspace-notes/2023-03/ - 2023-03-21T16:35:41+03:00 + 2023-03-22T08:28:33+03:00 https://alanorth.github.io/cgspace-notes/categories/notes/ - 2023-03-21T16:35:41+03:00 + 2023-03-22T08:28:33+03:00 https://alanorth.github.io/cgspace-notes/posts/ - 2023-03-21T16:35:41+03:00 + 2023-03-22T08:28:33+03:00 https://alanorth.github.io/cgspace-notes/2023-02/ 2023-03-01T08:30:25+03:00