From 50725d412fc7bd7262d0209060013139a0080974 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Wed, 21 Mar 2018 11:44:06 +0200 Subject: [PATCH] Add notes for 2018-03-21 --- content/posts/2018-03.md | 22 ++++++++++++++++++++++ docs/2018-03/index.html | 32 +++++++++++++++++++++++++++++--- docs/sitemap.xml | 10 +++++----- 3 files changed, 56 insertions(+), 8 deletions(-) diff --git a/content/posts/2018-03.md b/content/posts/2018-03.md index 81cc7bc1b..65a988717 100644 --- a/content/posts/2018-03.md +++ b/content/posts/2018-03.md @@ -348,3 +348,25 @@ java.lang.IllegalArgumentException: No choices plugin was configured for field ``` - I have to figure that one out... + +## 2018-03-21 + +- Looks like the indexing gets confused that there is still data in the `authority` column +- Unfortunately this causes those items to simply not be indexed, which users noticed because item counts were cut in half and old items showed up in RSS! +- Since we've migrated the ORCID identifiers associated with the authority data to the `cg.creator.id` field we can nullify the authorities remaining in the database: + +```sql +dspace=# UPDATE metadatavalue SET authority=NULL WHERE resource_type_id=2 AND metadata_field_id=3 AND authority IS NOT NULL; +UPDATE 195463 +``` + +- After this the indexing works as usual and item counts and facets are back to normal +- Send Peter a list of all authors to correct: + +```sql +dspace=# \copy (select distinct text_value, count(*) as count from metadatavalue where metadata_field_id = (select metadata_field_id from metadatafieldregistry where element += 'contributor' and qualifier = 'author') AND resource_type_id = 2 group by text_value order by count desc) to /tmp/authors.csv with csv header; +COPY 56156 +``` + +- Afterwards we'll want to do some batch tagging of ORCID identifiers to these names diff --git a/docs/2018-03/index.html b/docs/2018-03/index.html index 0247b0d4b..3c6dca7b7 100644 --- a/docs/2018-03/index.html +++ b/docs/2018-03/index.html @@ -20,7 +20,7 @@ Export a CSV of the IITA community metadata for Martin Mueller - + @@ -51,9 +51,9 @@ Export a CSV of the IITA community metadata for Martin Mueller "@type": "BlogPosting", "headline": "March, 2018", "url": "https://alanorth.github.io/cgspace-notes/2018-03/", - "wordCount": "1948", + "wordCount": "2113", "datePublished": "2018-03-02T16:07:54+02:00", - "dateModified": "2018-03-20T20:31:54+02:00", + "dateModified": "2018-03-20T21:04:10+02:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -512,6 +512,32 @@ java.lang.IllegalArgumentException: No choices plugin was configured for field
  • I have to figure that one out…
  • +

    2018-03-21

    + + + +
    dspace=# UPDATE metadatavalue SET authority=NULL WHERE resource_type_id=2 AND metadata_field_id=3 AND authority IS NOT NULL;
    +UPDATE 195463
    +
    + + + +
    dspace=# \copy (select distinct text_value, count(*) as count from metadatavalue where metadata_field_id = (select metadata_field_id from metadatafieldregistry where element
    += 'contributor' and qualifier = 'author') AND resource_type_id = 2 group by text_value order by count desc) to /tmp/authors.csv with csv header;
    +COPY 56156
    +
    + + + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index bb4005a6d..a69b05ba3 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,7 +4,7 @@ https://alanorth.github.io/cgspace-notes/2018-03/ - 2018-03-20T20:31:54+02:00 + 2018-03-20T21:04:10+02:00 @@ -154,7 +154,7 @@ https://alanorth.github.io/cgspace-notes/ - 2018-03-20T20:31:54+02:00 + 2018-03-20T21:04:10+02:00 0 @@ -165,7 +165,7 @@ https://alanorth.github.io/cgspace-notes/tags/notes/ - 2018-03-20T20:31:54+02:00 + 2018-03-20T21:04:10+02:00 0 @@ -177,13 +177,13 @@ https://alanorth.github.io/cgspace-notes/posts/ - 2018-03-20T20:31:54+02:00 + 2018-03-20T21:04:10+02:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2018-03-20T20:31:54+02:00 + 2018-03-20T21:04:10+02:00 0