From bc44226aacd57e47ff286cc40f45234dce32df5f Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Sat, 13 Oct 2018 21:17:20 +0300 Subject: [PATCH] Add notes for 2018-10-13 --- content/posts/2018-10.md | 24 +++++++++++++++++ docs/2015-11/index.html | 2 +- docs/2015-12/index.html | 2 +- docs/2016-01/index.html | 2 +- docs/2016-02/index.html | 2 +- docs/2016-03/index.html | 2 +- docs/2016-04/index.html | 2 +- docs/2016-05/index.html | 2 +- docs/2016-06/index.html | 2 +- docs/2016-07/index.html | 2 +- docs/2016-08/index.html | 2 +- docs/2016-09/index.html | 2 +- docs/2016-10/index.html | 2 +- docs/2016-11/index.html | 2 +- docs/2016-12/index.html | 2 +- docs/2017-01/index.html | 2 +- docs/2017-02/index.html | 2 +- docs/2017-03/index.html | 2 +- docs/2017-04/index.html | 2 +- docs/2017-05/index.html | 2 +- docs/2017-06/index.html | 2 +- docs/2017-07/index.html | 2 +- docs/2017-08/index.html | 2 +- docs/2017-09/index.html | 2 +- docs/2017-10/index.html | 2 +- docs/2017-11/index.html | 2 +- docs/2017-12/index.html | 2 +- docs/2018-01/index.html | 2 +- docs/2018-02/index.html | 2 +- docs/2018-03/index.html | 2 +- docs/2018-04/index.html | 2 +- docs/2018-05/index.html | 2 +- docs/2018-06/index.html | 2 +- docs/2018-07/index.html | 2 +- docs/2018-08/index.html | 2 +- docs/2018-09/index.html | 2 +- docs/2018-10/index.html | 36 ++++++++++++++++++++++--- docs/404.html | 2 +- docs/categories/index.html | 2 +- docs/categories/notes/index.html | 2 +- docs/categories/page/2/index.html | 2 +- docs/categories/page/3/index.html | 2 +- docs/categories/page/4/index.html | 2 +- docs/cgiar-library-migration/index.html | 2 +- docs/index.html | 2 +- docs/page/2/index.html | 2 +- docs/page/3/index.html | 2 +- docs/page/4/index.html | 2 +- docs/posts/index.html | 2 +- docs/posts/page/2/index.html | 2 +- docs/posts/page/3/index.html | 2 +- docs/posts/page/4/index.html | 2 +- docs/sitemap.xml | 10 +++---- docs/tags/index.html | 2 +- docs/tags/notes/index.html | 2 +- docs/tags/notes/page/2/index.html | 2 +- docs/tags/notes/page/3/index.html | 2 +- docs/tags/notes/page/4/index.html | 2 +- docs/tags/page/2/index.html | 2 +- docs/tags/page/3/index.html | 2 +- docs/tags/page/4/index.html | 2 +- 61 files changed, 119 insertions(+), 67 deletions(-) diff --git a/content/posts/2018-10.md b/content/posts/2018-10.md index 43f8d30b3..81234d322 100644 --- a/content/posts/2018-10.md +++ b/content/posts/2018-10.md @@ -222,4 +222,28 @@ COPY 10000 - CTA uploaded some infographics that are very tall and their thumbnails disrupt the item lists on the front page and in their communities and collections - I decided to constrain the max height of these to 200px using CSS ([#392](https://github.com/ilri/DSpace/pull/392)) +## 2018-10-13 + +- Run all system updates on DSpace Test (linode19) and reboot it +- Look through Peter's list of 746 author corrections in OpenRefine +- I first facet by blank, trim whitespace, and then check for weird characters that might be indicative of encoding issues with this GREL: + +``` +or( + isNotNull(value.match(/.*\uFFFD.*/)), + isNotNull(value.match(/.*\u00A0.*/)), + isNotNull(value.match(/.*\u200A.*/)), + isNotNull(value.match(/.*\u2019.*/)), + isNotNull(value.match(/.*\u00b4.*/)) +) +``` + +- Then I exported and applied them on my local test server: + +``` +$ ./fix-metadata-values.py -i 2018-10-11-top-authors.csv -db dspace -u dspace -p 'fuuu' -f dc.contributor.author -t CORRECT -m 3 +``` + +- I will apply these on CGSpace when I do the other updates tomorrow, as well as double check the high scoring ones to see if they are correct in Sisay's author controlled vocabulary + diff --git a/docs/2015-11/index.html b/docs/2015-11/index.html index 5396b6368..b797d88ef 100644 --- a/docs/2015-11/index.html +++ b/docs/2015-11/index.html @@ -38,7 +38,7 @@ $ psql -c 'SELECT * from pg_stat_activity;' | grep idle | grep -c cgspac "/> - + diff --git a/docs/2015-12/index.html b/docs/2015-12/index.html index c4da1043a..fa4945b59 100644 --- a/docs/2015-12/index.html +++ b/docs/2015-12/index.html @@ -40,7 +40,7 @@ Replace lzop with xz in log compression cron jobs on DSpace Test—it uses less "/> - + diff --git a/docs/2016-01/index.html b/docs/2016-01/index.html index f843b2d0a..99b16af86 100644 --- a/docs/2016-01/index.html +++ b/docs/2016-01/index.html @@ -30,7 +30,7 @@ Update GitHub wiki for documentation of maintenance tasks. "/> - + diff --git a/docs/2016-02/index.html b/docs/2016-02/index.html index 232f3f117..944598374 100644 --- a/docs/2016-02/index.html +++ b/docs/2016-02/index.html @@ -44,7 +44,7 @@ Also, lots of things like “COTE D`LVOIRE” and “COTE D IVOIRE&r "/> - + diff --git a/docs/2016-03/index.html b/docs/2016-03/index.html index f333e1ac5..24a190b78 100644 --- a/docs/2016-03/index.html +++ b/docs/2016-03/index.html @@ -30,7 +30,7 @@ Reinstall my local (Mac OS X) DSpace stack with Tomcat 7, PostgreSQL 9.3, and Ja "/> - + diff --git a/docs/2016-04/index.html b/docs/2016-04/index.html index 3925b3d69..4c102a8cd 100644 --- a/docs/2016-04/index.html +++ b/docs/2016-04/index.html @@ -34,7 +34,7 @@ Also, I noticed the checker log has some errors we should pay attention to: "/> - + diff --git a/docs/2016-05/index.html b/docs/2016-05/index.html index ad21be527..9aaab994c 100644 --- a/docs/2016-05/index.html +++ b/docs/2016-05/index.html @@ -38,7 +38,7 @@ There are 3,000 IPs accessing the REST API in a 24-hour period! "/> - + diff --git a/docs/2016-06/index.html b/docs/2016-06/index.html index 524e57028..c40f5e330 100644 --- a/docs/2016-06/index.html +++ b/docs/2016-06/index.html @@ -36,7 +36,7 @@ Working on second phase of metadata migration, looks like this will work for mov "/> - + diff --git a/docs/2016-07/index.html b/docs/2016-07/index.html index d7e33dde6..98e5fd4e3 100644 --- a/docs/2016-07/index.html +++ b/docs/2016-07/index.html @@ -52,7 +52,7 @@ In this case the select query was showing 95 results before the update "/> - + diff --git a/docs/2016-08/index.html b/docs/2016-08/index.html index d781d6d33..69b9de1b5 100644 --- a/docs/2016-08/index.html +++ b/docs/2016-08/index.html @@ -46,7 +46,7 @@ $ git rebase -i dspace-5.5 "/> - + diff --git a/docs/2016-09/index.html b/docs/2016-09/index.html index 8a1b591df..891b59b76 100644 --- a/docs/2016-09/index.html +++ b/docs/2016-09/index.html @@ -38,7 +38,7 @@ $ ldapsearch -x -H ldaps://svcgroot2.cgiarad.org:3269/ -b "dc=cgiarad,dc=or "/> - + diff --git a/docs/2016-10/index.html b/docs/2016-10/index.html index 698e50151..7ab32690e 100644 --- a/docs/2016-10/index.html +++ b/docs/2016-10/index.html @@ -46,7 +46,7 @@ I exported a random item’s metadata as CSV, deleted all columns except id "/> - + diff --git a/docs/2016-11/index.html b/docs/2016-11/index.html index a63399a50..514dfdd3e 100644 --- a/docs/2016-11/index.html +++ b/docs/2016-11/index.html @@ -30,7 +30,7 @@ Add dc.type to the output options for Atmire’s Listings and Reports module "/> - + diff --git a/docs/2016-12/index.html b/docs/2016-12/index.html index bc0afa758..eeb7a0375 100644 --- a/docs/2016-12/index.html +++ b/docs/2016-12/index.html @@ -54,7 +54,7 @@ Another worrying error from dspace.log is: "/> - + diff --git a/docs/2017-01/index.html b/docs/2017-01/index.html index a6250e618..cb496ccc6 100644 --- a/docs/2017-01/index.html +++ b/docs/2017-01/index.html @@ -30,7 +30,7 @@ I asked on the dspace-tech mailing list because it seems to be broken, and actua "/> - + diff --git a/docs/2017-02/index.html b/docs/2017-02/index.html index b661721a3..4b9251f93 100644 --- a/docs/2017-02/index.html +++ b/docs/2017-02/index.html @@ -58,7 +58,7 @@ Looks like we’ll be using cg.identifier.ccafsprojectpii as the field name "/> - + diff --git a/docs/2017-03/index.html b/docs/2017-03/index.html index 66feeabdc..59361e577 100644 --- a/docs/2017-03/index.html +++ b/docs/2017-03/index.html @@ -62,7 +62,7 @@ $ identify ~/Desktop/alc_contrastes_desafios.jpg "/> - + diff --git a/docs/2017-04/index.html b/docs/2017-04/index.html index c1b48166d..961c7edd9 100644 --- a/docs/2017-04/index.html +++ b/docs/2017-04/index.html @@ -48,7 +48,7 @@ $ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Th "/> - + diff --git a/docs/2017-05/index.html b/docs/2017-05/index.html index 285dc2d02..6bfcad16c 100644 --- a/docs/2017-05/index.html +++ b/docs/2017-05/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/2017-06/index.html b/docs/2017-06/index.html index 18b7af73f..50a7cc3be 100644 --- a/docs/2017-06/index.html +++ b/docs/2017-06/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/2017-07/index.html b/docs/2017-07/index.html index 41e75ad6c..631fe0779 100644 --- a/docs/2017-07/index.html +++ b/docs/2017-07/index.html @@ -42,7 +42,7 @@ We can use PostgreSQL’s extended output format (-x) plus sed to format the "/> - + diff --git a/docs/2017-08/index.html b/docs/2017-08/index.html index d65c3b543..ff05b563e 100644 --- a/docs/2017-08/index.html +++ b/docs/2017-08/index.html @@ -62,7 +62,7 @@ Then I cleaned up the author authorities and HTML characters in OpenRefine and s "/> - + diff --git a/docs/2017-09/index.html b/docs/2017-09/index.html index 31fe78bd4..3787ee889 100644 --- a/docs/2017-09/index.html +++ b/docs/2017-09/index.html @@ -38,7 +38,7 @@ Ask Sisay to clean up the WLE approvers a bit, as Marianne’s user account "/> - + diff --git a/docs/2017-10/index.html b/docs/2017-10/index.html index a6e0550af..aef14033b 100644 --- a/docs/2017-10/index.html +++ b/docs/2017-10/index.html @@ -42,7 +42,7 @@ Add Katherine Lutz to the groups for content submission and edit steps of the CG "/> - + diff --git a/docs/2017-11/index.html b/docs/2017-11/index.html index 851fc873c..df782e7f0 100644 --- a/docs/2017-11/index.html +++ b/docs/2017-11/index.html @@ -62,7 +62,7 @@ COPY 54701 "/> - + diff --git a/docs/2017-12/index.html b/docs/2017-12/index.html index 71128b0fe..2791e6c6b 100644 --- a/docs/2017-12/index.html +++ b/docs/2017-12/index.html @@ -32,7 +32,7 @@ The list of connections to XMLUI and REST API for today: "/> - + diff --git a/docs/2018-01/index.html b/docs/2018-01/index.html index e1917b70d..c5e56dd84 100644 --- a/docs/2018-01/index.html +++ b/docs/2018-01/index.html @@ -170,7 +170,7 @@ Danny wrote to ask for help renewing the wildcard ilri.org certificate and I adv "/> - + diff --git a/docs/2018-02/index.html b/docs/2018-02/index.html index 529f7e086..fbb9b80af 100644 --- a/docs/2018-02/index.html +++ b/docs/2018-02/index.html @@ -32,7 +32,7 @@ I copied the logic in the jmx_tomcat_dbpools provided by Ubuntu’s munin-pl "/> - + diff --git a/docs/2018-03/index.html b/docs/2018-03/index.html index a5c552fb1..87d10f5fc 100644 --- a/docs/2018-03/index.html +++ b/docs/2018-03/index.html @@ -26,7 +26,7 @@ Export a CSV of the IITA community metadata for Martin Mueller "/> - + diff --git a/docs/2018-04/index.html b/docs/2018-04/index.html index a757ef10f..567793c5f 100644 --- a/docs/2018-04/index.html +++ b/docs/2018-04/index.html @@ -28,7 +28,7 @@ Catalina logs at least show some memory errors yesterday: "/> - + diff --git a/docs/2018-05/index.html b/docs/2018-05/index.html index 52cdc8e96..b875287c4 100644 --- a/docs/2018-05/index.html +++ b/docs/2018-05/index.html @@ -40,7 +40,7 @@ Also, I switched it to use OpenJDK instead of Oracle Java, as well as re-worked "/> - + diff --git a/docs/2018-06/index.html b/docs/2018-06/index.html index 1ffb655af..855497697 100644 --- a/docs/2018-06/index.html +++ b/docs/2018-06/index.html @@ -68,7 +68,7 @@ sys 2m7.289s "/> - + diff --git a/docs/2018-07/index.html b/docs/2018-07/index.html index 1af55335b..d9c07a5fb 100644 --- a/docs/2018-07/index.html +++ b/docs/2018-07/index.html @@ -46,7 +46,7 @@ There is insufficient memory for the Java Runtime Environment to continue. "/> - + diff --git a/docs/2018-08/index.html b/docs/2018-08/index.html index c91ca9d5c..359c9d546 100644 --- a/docs/2018-08/index.html +++ b/docs/2018-08/index.html @@ -54,7 +54,7 @@ I ran all system updates on DSpace Test and rebooted it "/> - + diff --git a/docs/2018-09/index.html b/docs/2018-09/index.html index 2ee36b4ea..86dc24ed0 100644 --- a/docs/2018-09/index.html +++ b/docs/2018-09/index.html @@ -32,7 +32,7 @@ I’m testing the new DSpace 5.8 branch in my Ubuntu 18.04 environment and I "/> - + diff --git a/docs/2018-10/index.html b/docs/2018-10/index.html index bbd1e451a..9ad0ee6f9 100644 --- a/docs/2018-10/index.html +++ b/docs/2018-10/index.html @@ -9,12 +9,12 @@ - + - + @@ -24,9 +24,9 @@ "@type": "BlogPosting", "headline": "October, 2018", "url": "https://alanorth.github.io/cgspace-notes/2018-10/", - "wordCount": "1407", + "wordCount": "1519", "datePublished": "2018-10-01T22:31:54+03:00", - "dateModified": "2018-10-11T11:17:07+03:00", + "dateModified": "2018-10-11T14:25:13+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -344,6 +344,34 @@ COPY 10000
  • I decided to constrain the max height of these to 200px using CSS (#392)
  • +

    2018-10-13

    + + + +
    or(
    +  isNotNull(value.match(/.*\uFFFD.*/)),
    +  isNotNull(value.match(/.*\u00A0.*/)),
    +  isNotNull(value.match(/.*\u200A.*/)),
    +  isNotNull(value.match(/.*\u2019.*/)),
    +  isNotNull(value.match(/.*\u00b4.*/))
    +)
    +
    + + + +
    $ ./fix-metadata-values.py -i 2018-10-11-top-authors.csv -db dspace -u dspace -p 'fuuu' -f dc.contributor.author -t CORRECT -m 3
    +
    + + + diff --git a/docs/404.html b/docs/404.html index 2a68b558b..af460d773 100644 --- a/docs/404.html +++ b/docs/404.html @@ -13,7 +13,7 @@ - + diff --git a/docs/categories/index.html b/docs/categories/index.html index f52df31c2..37046a8f5 100644 --- a/docs/categories/index.html +++ b/docs/categories/index.html @@ -13,7 +13,7 @@ - + diff --git a/docs/categories/notes/index.html b/docs/categories/notes/index.html index 3c2922fc5..0ec0e20cf 100644 --- a/docs/categories/notes/index.html +++ b/docs/categories/notes/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/categories/page/2/index.html b/docs/categories/page/2/index.html index 627b3ca2a..b57ccac58 100644 --- a/docs/categories/page/2/index.html +++ b/docs/categories/page/2/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/categories/page/3/index.html b/docs/categories/page/3/index.html index b1245afb5..9bf5676ff 100644 --- a/docs/categories/page/3/index.html +++ b/docs/categories/page/3/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/categories/page/4/index.html b/docs/categories/page/4/index.html index baa645c3e..72dd3d768 100644 --- a/docs/categories/page/4/index.html +++ b/docs/categories/page/4/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/cgiar-library-migration/index.html b/docs/cgiar-library-migration/index.html index 77fc5d263..c7fc414f5 100644 --- a/docs/cgiar-library-migration/index.html +++ b/docs/cgiar-library-migration/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/index.html b/docs/index.html index c9ac48a71..7cee9dcc1 100644 --- a/docs/index.html +++ b/docs/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/page/2/index.html b/docs/page/2/index.html index c1d1b5be3..a04049eea 100644 --- a/docs/page/2/index.html +++ b/docs/page/2/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/page/3/index.html b/docs/page/3/index.html index e8941a779..41407e9bc 100644 --- a/docs/page/3/index.html +++ b/docs/page/3/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/page/4/index.html b/docs/page/4/index.html index c7bbc6de9..02b2c1d16 100644 --- a/docs/page/4/index.html +++ b/docs/page/4/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/posts/index.html b/docs/posts/index.html index fa3e01fd9..5e5f974b1 100644 --- a/docs/posts/index.html +++ b/docs/posts/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/posts/page/2/index.html b/docs/posts/page/2/index.html index 854f45719..51f6c7686 100644 --- a/docs/posts/page/2/index.html +++ b/docs/posts/page/2/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/posts/page/3/index.html b/docs/posts/page/3/index.html index 3e5cf7ad0..a3763fe29 100644 --- a/docs/posts/page/3/index.html +++ b/docs/posts/page/3/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/posts/page/4/index.html b/docs/posts/page/4/index.html index 7a48d9dcd..cbcb372b9 100644 --- a/docs/posts/page/4/index.html +++ b/docs/posts/page/4/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index fd1e49671..68864a430 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,7 +4,7 @@ https://alanorth.github.io/cgspace-notes/2018-10/ - 2018-10-11T11:17:07+03:00 + 2018-10-11T14:25:13+03:00 @@ -189,7 +189,7 @@ https://alanorth.github.io/cgspace-notes/ - 2018-10-11T11:17:07+03:00 + 2018-10-11T14:25:13+03:00 0 @@ -200,7 +200,7 @@ https://alanorth.github.io/cgspace-notes/tags/notes/ - 2018-10-11T11:17:07+03:00 + 2018-10-11T14:25:13+03:00 0 @@ -212,13 +212,13 @@ https://alanorth.github.io/cgspace-notes/posts/ - 2018-10-11T11:17:07+03:00 + 2018-10-11T14:25:13+03:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2018-10-11T11:17:07+03:00 + 2018-10-11T14:25:13+03:00 0 diff --git a/docs/tags/index.html b/docs/tags/index.html index f2b5f4506..d9ce8d548 100644 --- a/docs/tags/index.html +++ b/docs/tags/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/tags/notes/index.html b/docs/tags/notes/index.html index 106341779..f2d03a1d6 100644 --- a/docs/tags/notes/index.html +++ b/docs/tags/notes/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/tags/notes/page/2/index.html b/docs/tags/notes/page/2/index.html index 51e932d24..f208efbc1 100644 --- a/docs/tags/notes/page/2/index.html +++ b/docs/tags/notes/page/2/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/tags/notes/page/3/index.html b/docs/tags/notes/page/3/index.html index 47e9c6240..bb5c4e48f 100644 --- a/docs/tags/notes/page/3/index.html +++ b/docs/tags/notes/page/3/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/tags/notes/page/4/index.html b/docs/tags/notes/page/4/index.html index 55c0cfee9..6efac860e 100644 --- a/docs/tags/notes/page/4/index.html +++ b/docs/tags/notes/page/4/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/tags/page/2/index.html b/docs/tags/page/2/index.html index f138d0876..d124ee77b 100644 --- a/docs/tags/page/2/index.html +++ b/docs/tags/page/2/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/tags/page/3/index.html b/docs/tags/page/3/index.html index 0c80bc41f..3ad0b0391 100644 --- a/docs/tags/page/3/index.html +++ b/docs/tags/page/3/index.html @@ -14,7 +14,7 @@ - + diff --git a/docs/tags/page/4/index.html b/docs/tags/page/4/index.html index 0a6989e2e..cd756d94b 100644 --- a/docs/tags/page/4/index.html +++ b/docs/tags/page/4/index.html @@ -14,7 +14,7 @@ - +