Update theme and regenerate public

This commit is contained in:
Alan Orth 2016-11-14 09:27:03 +02:00
parent 3669ce96d2
commit f0480fa373
Signed by: alanorth
GPG Key ID: 0FB860CC9C45B1B9
32 changed files with 4103 additions and 1219 deletions

View File

@ -2,38 +2,87 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="November, 2015" />
<meta property="og:description" content="2015-11-22
CGSpace went down
Looks like DSpace exhausted its PostgreSQL connection pool
Last week I had increased the limit from 30 to 60, which seemed to help, but now there are many more idle connections:
$ psql -c &#39;SELECT * from pg_stat_activity;&#39; | grep idle | grep -c cgspace
78
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2015-11/" />
<meta property="og:updated_time" content="2015-11-23T17:00:57&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="November, 2015">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2015-11-23T17:00:57&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="November, 2015">
<meta itemprop="description" content="2015-11-22
CGSpace went down
Looks like DSpace exhausted its PostgreSQL connection pool
Last week I had increased the limit from 30 to 60, which seemed to help, but now there are many more idle connections:
$ psql -c &#39;SELECT * from pg_stat_activity;&#39; | grep idle | grep -c cgspace
78
">
<meta itemprop="dateModified" content="2015-11-23T17:00:57&#43;03:00" />
<meta itemprop="wordCount" content="798">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2015-11/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="November, 2015"/>
<meta name="twitter:description" content="2015-11-22
CGSpace went down
Looks like DSpace exhausted its PostgreSQL connection pool
Last week I had increased the limit from 30 to 60, which seemed to help, but now there are many more idle connections:
$ psql -c &#39;SELECT * from pg_stat_activity;&#39; | grep idle | grep -c cgspace
78
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="November, 2015">
<meta property="twitter:description" content="">
@ -52,8 +101,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +131,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2015-11/">November, 2015</a></h2>
@ -239,11 +293,13 @@ db.statementpool = true
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -281,7 +337,6 @@ db.statementpool = true
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,90 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="December, 2015" />
<meta property="og:description" content="2015-12-02
Replace lzop with xz in log compression cron jobs on DSpace Test—it uses less space:
# cd /home/dspacetest.cgiar.org/log
# ls -lh dspace.log.2015-11-18*
-rw-rw-r-- 1 tomcat7 tomcat7 2.0M Nov 18 23:59 dspace.log.2015-11-18
-rw-rw-r-- 1 tomcat7 tomcat7 387K Nov 18 23:59 dspace.log.2015-11-18.lzo
-rw-rw-r-- 1 tomcat7 tomcat7 169K Nov 18 23:59 dspace.log.2015-11-18.xz
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2015-12/" />
<meta property="og:updated_time" content="2015-12-02T13:18:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="December, 2015">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2015-12-02T13:18:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="December, 2015">
<meta itemprop="description" content="2015-12-02
Replace lzop with xz in log compression cron jobs on DSpace Test—it uses less space:
# cd /home/dspacetest.cgiar.org/log
# ls -lh dspace.log.2015-11-18*
-rw-rw-r-- 1 tomcat7 tomcat7 2.0M Nov 18 23:59 dspace.log.2015-11-18
-rw-rw-r-- 1 tomcat7 tomcat7 387K Nov 18 23:59 dspace.log.2015-11-18.lzo
-rw-rw-r-- 1 tomcat7 tomcat7 169K Nov 18 23:59 dspace.log.2015-11-18.xz
">
<meta itemprop="dateModified" content="2015-12-02T13:18:00&#43;03:00" />
<meta itemprop="wordCount" content="753">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2015-12/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="December, 2015"/>
<meta name="twitter:description" content="2015-12-02
Replace lzop with xz in log compression cron jobs on DSpace Test—it uses less space:
# cd /home/dspacetest.cgiar.org/log
# ls -lh dspace.log.2015-11-18*
-rw-rw-r-- 1 tomcat7 tomcat7 2.0M Nov 18 23:59 dspace.log.2015-11-18
-rw-rw-r-- 1 tomcat7 tomcat7 387K Nov 18 23:59 dspace.log.2015-11-18.lzo
-rw-rw-r-- 1 tomcat7 tomcat7 169K Nov 18 23:59 dspace.log.2015-11-18.xz
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="December, 2015">
<meta property="twitter:description" content="">
@ -52,8 +104,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +134,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2015-12/">December, 2015</a></h2>
@ -254,11 +311,13 @@ $ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -296,7 +355,6 @@ $ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,75 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="January, 2016" />
<meta property="og:description" content="2016-01-13
Move ILRI collection 10568/12503 from 10568/27869 to 10568/27629 using the move_collections.sh script I wrote last year.
I realized it is only necessary to clear the Cocoon cache after moving collections—rather than reindexing—as no metadata has changed, and therefore no search or browse indexes need to be updated.
Update GitHub wiki for documentation of maintenance tasks.
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-01/" />
<meta property="og:updated_time" content="2016-01-13T13:18:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="January, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-01-13T13:18:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="January, 2016">
<meta itemprop="description" content="2016-01-13
Move ILRI collection 10568/12503 from 10568/27869 to 10568/27629 using the move_collections.sh script I wrote last year.
I realized it is only necessary to clear the Cocoon cache after moving collections—rather than reindexing—as no metadata has changed, and therefore no search or browse indexes need to be updated.
Update GitHub wiki for documentation of maintenance tasks.
">
<meta itemprop="dateModified" content="2016-01-13T13:18:00&#43;03:00" />
<meta itemprop="wordCount" content="466">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-01/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="January, 2016"/>
<meta name="twitter:description" content="2016-01-13
Move ILRI collection 10568/12503 from 10568/27869 to 10568/27629 using the move_collections.sh script I wrote last year.
I realized it is only necessary to clear the Cocoon cache after moving collections—rather than reindexing—as no metadata has changed, and therefore no search or browse indexes need to be updated.
Update GitHub wiki for documentation of maintenance tasks.
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="January, 2016">
<meta property="twitter:description" content="">
@ -52,8 +89,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +119,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-01/">January, 2016</a></h2>
@ -179,11 +221,13 @@ $ find SimpleArchiveForBio/ -iname &ldquo;*.pdf&rdquo; -exec basename {} \; | so
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -221,7 +265,6 @@ $ find SimpleArchiveForBio/ -iname &ldquo;*.pdf&rdquo; -exec basename {} \; | so
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,96 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="February, 2016" />
<meta property="og:description" content="2016-02-05
Looking at some DAGRIS data for Abenet Yabowork
Lots of issues with spaces, newlines, etc causing the import to fail
I noticed we have a very interesting list of countries on CGSpace:
Not only are there 49,000 countries, we have some blanks (25)&hellip;
Also, lots of things like &ldquo;COTE D`LVOIRE&rdquo; and &ldquo;COTE D IVOIRE&rdquo;
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-02/" />
<meta property="og:updated_time" content="2016-02-05T13:18:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="February, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-02-05T13:18:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="February, 2016">
<meta itemprop="description" content="2016-02-05
Looking at some DAGRIS data for Abenet Yabowork
Lots of issues with spaces, newlines, etc causing the import to fail
I noticed we have a very interesting list of countries on CGSpace:
Not only are there 49,000 countries, we have some blanks (25)&hellip;
Also, lots of things like &ldquo;COTE D`LVOIRE&rdquo; and &ldquo;COTE D IVOIRE&rdquo;
">
<meta itemprop="dateModified" content="2016-02-05T13:18:00&#43;03:00" />
<meta itemprop="wordCount" content="1657">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-02/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="February, 2016"/>
<meta name="twitter:description" content="2016-02-05
Looking at some DAGRIS data for Abenet Yabowork
Lots of issues with spaces, newlines, etc causing the import to fail
I noticed we have a very interesting list of countries on CGSpace:
Not only are there 49,000 countries, we have some blanks (25)&hellip;
Also, lots of things like &ldquo;COTE D`LVOIRE&rdquo; and &ldquo;COTE D IVOIRE&rdquo;
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="February, 2016">
<meta property="twitter:description" content="">
@ -52,8 +110,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +140,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-02/">February, 2016</a></h2>
@ -418,11 +481,13 @@ Bitstream: tést señora alimentación.pdf
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -460,7 +525,6 @@ Bitstream: tést señora alimentación.pdf
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,75 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="March, 2016" />
<meta property="og:description" content="2016-03-02
Looking at issues with author authorities on CGSpace
For some reason we still have the index-lucene-update cron job active on CGSpace, but I&rsquo;m pretty sure we don&rsquo;t need it as of the latest few versions of Atmire&rsquo;s Listings and Reports module
Reinstall my local (Mac OS X) DSpace stack with Tomcat 7, PostgreSQL 9.3, and Java JDK 1.7 to match environment on CGSpace server
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-03/" />
<meta property="og:updated_time" content="2016-03-02T16:50:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="March, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-03-02T16:50:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="March, 2016">
<meta itemprop="description" content="2016-03-02
Looking at issues with author authorities on CGSpace
For some reason we still have the index-lucene-update cron job active on CGSpace, but I&rsquo;m pretty sure we don&rsquo;t need it as of the latest few versions of Atmire&rsquo;s Listings and Reports module
Reinstall my local (Mac OS X) DSpace stack with Tomcat 7, PostgreSQL 9.3, and Java JDK 1.7 to match environment on CGSpace server
">
<meta itemprop="dateModified" content="2016-03-02T16:50:00&#43;03:00" />
<meta itemprop="wordCount" content="1581">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-03/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="March, 2016"/>
<meta name="twitter:description" content="2016-03-02
Looking at issues with author authorities on CGSpace
For some reason we still have the index-lucene-update cron job active on CGSpace, but I&rsquo;m pretty sure we don&rsquo;t need it as of the latest few versions of Atmire&rsquo;s Listings and Reports module
Reinstall my local (Mac OS X) DSpace stack with Tomcat 7, PostgreSQL 9.3, and Java JDK 1.7 to match environment on CGSpace server
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="March, 2016">
<meta property="twitter:description" content="">
@ -52,8 +89,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +119,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-03/">March, 2016</a></h2>
@ -332,11 +374,13 @@
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -374,7 +418,6 @@
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,81 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="April, 2016" />
<meta property="og:description" content="2016-04-04
Looking at log file use on CGSpace and notice that we need to work on our cron setup a bit
We are backing up all logs in the log folder, including useless stuff like solr, cocoon, handle-plugin, etc
After running DSpace for over five years I&rsquo;ve never needed to look in any other log file than dspace.log, leave alone one from last year!
This will save us a few gigs of backup space we&rsquo;re paying for on S3
Also, I noticed the checker log has some errors we should pay attention to:
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-04/" />
<meta property="og:updated_time" content="2016-04-04T11:06:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="April, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-04-04T11:06:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="April, 2016">
<meta itemprop="description" content="2016-04-04
Looking at log file use on CGSpace and notice that we need to work on our cron setup a bit
We are backing up all logs in the log folder, including useless stuff like solr, cocoon, handle-plugin, etc
After running DSpace for over five years I&rsquo;ve never needed to look in any other log file than dspace.log, leave alone one from last year!
This will save us a few gigs of backup space we&rsquo;re paying for on S3
Also, I noticed the checker log has some errors we should pay attention to:
">
<meta itemprop="dateModified" content="2016-04-04T11:06:00&#43;03:00" />
<meta itemprop="wordCount" content="2006">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-04/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="April, 2016"/>
<meta name="twitter:description" content="2016-04-04
Looking at log file use on CGSpace and notice that we need to work on our cron setup a bit
We are backing up all logs in the log folder, including useless stuff like solr, cocoon, handle-plugin, etc
After running DSpace for over five years I&rsquo;ve never needed to look in any other log file than dspace.log, leave alone one from last year!
This will save us a few gigs of backup space we&rsquo;re paying for on S3
Also, I noticed the checker log has some errors we should pay attention to:
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="April, 2016">
<meta property="twitter:description" content="">
@ -52,8 +95,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +125,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-04/">April, 2016</a></h2>
@ -545,11 +593,13 @@ dspace.log.2016-04-27:7271
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -587,7 +637,6 @@ dspace.log.2016-04-27:7271
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,87 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="May, 2016" />
<meta property="og:description" content="2016-05-01
Since yesterday there have been 10,000 REST errors and the site has been unstable again
I have blocked access to the API now
There are 3,000 IPs accessing the REST API in a 24-hour period!
# awk &#39;{print $1}&#39; /var/log/nginx/rest.log | uniq | wc -l
3168
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-05/" />
<meta property="og:updated_time" content="2016-05-01T23:06:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="May, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-05-01T23:06:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="May, 2016">
<meta itemprop="description" content="2016-05-01
Since yesterday there have been 10,000 REST errors and the site has been unstable again
I have blocked access to the API now
There are 3,000 IPs accessing the REST API in a 24-hour period!
# awk &#39;{print $1}&#39; /var/log/nginx/rest.log | uniq | wc -l
3168
">
<meta itemprop="dateModified" content="2016-05-01T23:06:00&#43;03:00" />
<meta itemprop="wordCount" content="1349">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-05/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="May, 2016"/>
<meta name="twitter:description" content="2016-05-01
Since yesterday there have been 10,000 REST errors and the site has been unstable again
I have blocked access to the API now
There are 3,000 IPs accessing the REST API in a 24-hour period!
# awk &#39;{print $1}&#39; /var/log/nginx/rest.log | uniq | wc -l
3168
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="May, 2016">
<meta property="twitter:description" content="">
@ -52,8 +101,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +131,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-05/">May, 2016</a></h2>
@ -391,11 +445,13 @@ sys 0m20.540s
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -433,7 +489,6 @@ sys 0m20.540s
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,84 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="June, 2016" />
<meta property="og:description" content="2016-06-01
Experimenting with IFPRI OAI (we want to harvest their publications)
After reading the ContentDM documentation I found IFPRI&rsquo;s OAI endpoint: http://ebrary.ifpri.org/oai/oai.php
After reading the OAI documentation and testing with an OAI validator I found out how to get their publications
This is their publications set: http://ebrary.ifpri.org/oai/oai.php?verb=ListRecords&amp;from=2016-01-01&amp;set=p15738coll2&amp;metadataPrefix=oai_dc
You can see the others by using the OAI ListSets verb: http://ebrary.ifpri.org/oai/oai.php?verb=ListSets
Working on second phase of metadata migration, looks like this will work for moving CPWF-specific data in dc.identifier.fund to cg.identifier.cpwfproject and then the rest to dc.description.sponsorship
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-06/" />
<meta property="og:updated_time" content="2016-06-01T10:53:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="June, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-06-01T10:53:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="June, 2016">
<meta itemprop="description" content="2016-06-01
Experimenting with IFPRI OAI (we want to harvest their publications)
After reading the ContentDM documentation I found IFPRI&rsquo;s OAI endpoint: http://ebrary.ifpri.org/oai/oai.php
After reading the OAI documentation and testing with an OAI validator I found out how to get their publications
This is their publications set: http://ebrary.ifpri.org/oai/oai.php?verb=ListRecords&amp;from=2016-01-01&amp;set=p15738coll2&amp;metadataPrefix=oai_dc
You can see the others by using the OAI ListSets verb: http://ebrary.ifpri.org/oai/oai.php?verb=ListSets
Working on second phase of metadata migration, looks like this will work for moving CPWF-specific data in dc.identifier.fund to cg.identifier.cpwfproject and then the rest to dc.description.sponsorship
">
<meta itemprop="dateModified" content="2016-06-01T10:53:00&#43;03:00" />
<meta itemprop="wordCount" content="1549">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-06/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="June, 2016"/>
<meta name="twitter:description" content="2016-06-01
Experimenting with IFPRI OAI (we want to harvest their publications)
After reading the ContentDM documentation I found IFPRI&rsquo;s OAI endpoint: http://ebrary.ifpri.org/oai/oai.php
After reading the OAI documentation and testing with an OAI validator I found out how to get their publications
This is their publications set: http://ebrary.ifpri.org/oai/oai.php?verb=ListRecords&amp;from=2016-01-01&amp;set=p15738coll2&amp;metadataPrefix=oai_dc
You can see the others by using the OAI ListSets verb: http://ebrary.ifpri.org/oai/oai.php?verb=ListSets
Working on second phase of metadata migration, looks like this will work for moving CPWF-specific data in dc.identifier.fund to cg.identifier.cpwfproject and then the rest to dc.description.sponsorship
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="June, 2016">
<meta property="twitter:description" content="">
@ -52,8 +98,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +128,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-06/">June, 2016</a></h2>
@ -438,11 +489,13 @@ $ ./delete-metadata-values.py -f dc.contributor.corporate -i Corporate-Authors-D
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -480,7 +533,6 @@ $ ./delete-metadata-values.py -f dc.contributor.corporate -i Corporate-Authors-D
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,108 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="July, 2016" />
<meta property="og:description" content="2016-07-01
Add dc.description.sponsorship to Discovery sidebar facets and make investors clickable in item view (#232)
I think this query should find and replace all authors that have &ldquo;,&rdquo; at the end of their names:
dspacetest=# update metadatavalue set text_value = regexp_replace(text_value, &#39;(^.&#43;?),$&#39;, &#39;\1&#39;) where metadata_field_id=3 and resource_type_id=2 and text_value ~ &#39;^.&#43;?,$&#39;;
UPDATE 95
dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and resource_type_id=2 and text_value ~ &#39;^.&#43;?,$&#39;;
text_value
------------
(0 rows)
In this case the select query was showing 95 results before the update
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-07/" />
<meta property="og:updated_time" content="2016-07-01T10:53:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="July, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-07-01T10:53:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="July, 2016">
<meta itemprop="description" content="2016-07-01
Add dc.description.sponsorship to Discovery sidebar facets and make investors clickable in item view (#232)
I think this query should find and replace all authors that have &ldquo;,&rdquo; at the end of their names:
dspacetest=# update metadatavalue set text_value = regexp_replace(text_value, &#39;(^.&#43;?),$&#39;, &#39;\1&#39;) where metadata_field_id=3 and resource_type_id=2 and text_value ~ &#39;^.&#43;?,$&#39;;
UPDATE 95
dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and resource_type_id=2 and text_value ~ &#39;^.&#43;?,$&#39;;
text_value
------------
(0 rows)
In this case the select query was showing 95 results before the update
">
<meta itemprop="dateModified" content="2016-07-01T10:53:00&#43;03:00" />
<meta itemprop="wordCount" content="866">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-07/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="July, 2016"/>
<meta name="twitter:description" content="2016-07-01
Add dc.description.sponsorship to Discovery sidebar facets and make investors clickable in item view (#232)
I think this query should find and replace all authors that have &ldquo;,&rdquo; at the end of their names:
dspacetest=# update metadatavalue set text_value = regexp_replace(text_value, &#39;(^.&#43;?),$&#39;, &#39;\1&#39;) where metadata_field_id=3 and resource_type_id=2 and text_value ~ &#39;^.&#43;?,$&#39;;
UPDATE 95
dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and resource_type_id=2 and text_value ~ &#39;^.&#43;?,$&#39;;
text_value
------------
(0 rows)
In this case the select query was showing 95 results before the update
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="July, 2016">
<meta property="twitter:description" content="">
@ -52,8 +122,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +152,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-07/">July, 2016</a></h2>
@ -340,11 +415,13 @@ discovery.index.authority.ignore-variants=true
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -382,7 +459,6 @@ discovery.index.authority.ignore-variants=true
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,99 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="August, 2016" />
<meta property="og:description" content="2016-08-01
Add updated distribution license from Sisay (#259)
Play with upgrading Mirage 2 dependencies in bower.json because most are several versions out of date
Bootstrap is at 3.3.0 but upstream is at 3.3.7, and upgrading to anything beyond 3.3.1 breaks glyphicons and probably more
bower stuff is a dead end, waste of time, too many issues
Anything after Bootstrap 3.3.1 makes glyphicons disappear (HTTP 404 trying to access from incorrect path of fonts)
Start working on DSpace 5.15.5 port:
$ git checkout -b 55new 5_x-prod
$ git reset --hard ilri/5_x-prod
$ git rebase -i dspace-5.5
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-08/" />
<meta property="og:updated_time" content="2016-08-01T15:53:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="August, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-08-01T15:53:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="August, 2016">
<meta itemprop="description" content="2016-08-01
Add updated distribution license from Sisay (#259)
Play with upgrading Mirage 2 dependencies in bower.json because most are several versions out of date
Bootstrap is at 3.3.0 but upstream is at 3.3.7, and upgrading to anything beyond 3.3.1 breaks glyphicons and probably more
bower stuff is a dead end, waste of time, too many issues
Anything after Bootstrap 3.3.1 makes glyphicons disappear (HTTP 404 trying to access from incorrect path of fonts)
Start working on DSpace 5.15.5 port:
$ git checkout -b 55new 5_x-prod
$ git reset --hard ilri/5_x-prod
$ git rebase -i dspace-5.5
">
<meta itemprop="dateModified" content="2016-08-01T15:53:00&#43;03:00" />
<meta itemprop="wordCount" content="1514">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-08/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="August, 2016"/>
<meta name="twitter:description" content="2016-08-01
Add updated distribution license from Sisay (#259)
Play with upgrading Mirage 2 dependencies in bower.json because most are several versions out of date
Bootstrap is at 3.3.0 but upstream is at 3.3.7, and upgrading to anything beyond 3.3.1 breaks glyphicons and probably more
bower stuff is a dead end, waste of time, too many issues
Anything after Bootstrap 3.3.1 makes glyphicons disappear (HTTP 404 trying to access from incorrect path of fonts)
Start working on DSpace 5.15.5 port:
$ git checkout -b 55new 5_x-prod
$ git reset --hard ilri/5_x-prod
$ git rebase -i dspace-5.5
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="August, 2016">
<meta property="twitter:description" content="">
@ -52,8 +113,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +143,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-08/">August, 2016</a></h2>
@ -419,11 +485,13 @@ $ JAVA_OPTS=&quot;-Dfile.encoding=UTF-8 -Xmx512m&quot; /home/cgspace.cgiar.org/b
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -461,7 +529,6 @@ $ JAVA_OPTS=&quot;-Dfile.encoding=UTF-8 -Xmx512m&quot; /home/cgspace.cgiar.org/b
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,87 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="September, 2016" />
<meta property="og:description" content="2016-09-01
Discuss helping CCAFS with some batch tagging of ORCID IDs for their authors
Discuss how the migration of CGIAR&rsquo;s Active Directory to a flat structure will break our LDAP groups in DSpace
We had been using DC=ILRI to determine whether a user was ILRI or not
It looks like we might be able to use OUs now, instead of DCs:
$ ldapsearch -x -H ldaps://svcgroot2.cgiarad.org:3269/ -b &quot;dc=cgiarad,dc=org&quot; -D &quot;admigration1@cgiarad.org&quot; -W &quot;(sAMAccountName=admigration1)&quot;
" />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-09/" />
<meta property="og:updated_time" content="2016-09-01T15:53:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="September, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-09-01T15:53:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="September, 2016">
<meta itemprop="description" content="2016-09-01
Discuss helping CCAFS with some batch tagging of ORCID IDs for their authors
Discuss how the migration of CGIAR&rsquo;s Active Directory to a flat structure will break our LDAP groups in DSpace
We had been using DC=ILRI to determine whether a user was ILRI or not
It looks like we might be able to use OUs now, instead of DCs:
$ ldapsearch -x -H ldaps://svcgroot2.cgiarad.org:3269/ -b &quot;dc=cgiarad,dc=org&quot; -D &quot;admigration1@cgiarad.org&quot; -W &quot;(sAMAccountName=admigration1)&quot;
">
<meta itemprop="dateModified" content="2016-09-01T15:53:00&#43;03:00" />
<meta itemprop="wordCount" content="3298">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-09/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="September, 2016"/>
<meta name="twitter:description" content="2016-09-01
Discuss helping CCAFS with some batch tagging of ORCID IDs for their authors
Discuss how the migration of CGIAR&rsquo;s Active Directory to a flat structure will break our LDAP groups in DSpace
We had been using DC=ILRI to determine whether a user was ILRI or not
It looks like we might be able to use OUs now, instead of DCs:
$ ldapsearch -x -H ldaps://svcgroot2.cgiarad.org:3269/ -b &quot;dc=cgiarad,dc=org&quot; -D &quot;admigration1@cgiarad.org&quot; -W &quot;(sAMAccountName=admigration1)&quot;
"/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="September, 2016">
<meta property="twitter:description" content="">
@ -52,8 +101,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +131,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-09/">September, 2016</a></h2>
@ -727,11 +781,13 @@ $ ./delete-metadata-values.py -i ilrisubjects-delete-13.csv -f cg.subject.ilri -
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -769,7 +825,6 @@ $ ./delete-metadata-values.py -i ilrisubjects-delete-13.csv -f cg.subject.ilri -
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,51 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="October, 2016" />
<meta property="og:description" content="2016-10-03 Testing adding ORCIDs to a CSV file for a single item to see if the author orders get messed up Need to test the following scenarios to see how author order is affected: ORCIDs only ORCIDs plus normal authors I exported a random item&rsquo;s metadata as CSV, deleted all columns except id and collection, and made a new column called ORCID:dc.contributor.author with the following random ORCIDs from the ORCID registry: 0000-0002-6115-0956||0000-0002-3812-8793||0000-0001-7462-405X Hmm, with the dc." />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-10/" />
<meta property="og:updated_time" content="2016-10-03T15:53:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="October, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-10-03T15:53:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="October, 2016">
<meta itemprop="description" content="2016-10-03 Testing adding ORCIDs to a CSV file for a single item to see if the author orders get messed up Need to test the following scenarios to see how author order is affected: ORCIDs only ORCIDs plus normal authors I exported a random item&rsquo;s metadata as CSV, deleted all columns except id and collection, and made a new column called ORCID:dc.contributor.author with the following random ORCIDs from the ORCID registry: 0000-0002-6115-0956||0000-0002-3812-8793||0000-0001-7462-405X Hmm, with the dc.">
<meta itemprop="dateModified" content="2016-10-03T15:53:00&#43;03:00" />
<meta itemprop="wordCount" content="1828">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-10/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="October, 2016"/>
<meta name="twitter:description" content="2016-10-03 Testing adding ORCIDs to a CSV file for a single item to see if the author orders get messed up Need to test the following scenarios to see how author order is affected: ORCIDs only ORCIDs plus normal authors I exported a random item&rsquo;s metadata as CSV, deleted all columns except id and collection, and made a new column called ORCID:dc.contributor.author with the following random ORCIDs from the ORCID registry: 0000-0002-6115-0956||0000-0002-3812-8793||0000-0001-7462-405X Hmm, with the dc."/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="October, 2016">
<meta property="twitter:description" content="">
@ -52,8 +65,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +95,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-10/">October, 2016</a></h2>
@ -406,11 +424,13 @@ dspace=# update metadatavalue set text_value = regexp_replace(text_value, 'http:
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -448,7 +468,6 @@ dspace=# update metadatavalue set text_value = regexp_replace(text_value, 'http:
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,38 +2,51 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="November, 2016" />
<meta property="og:description" content="2016-11-01 Add dc.type to the output options for Atmire&rsquo;s Listings and Reports module (#286) 2016-11-02 Migrate DSpace Test to DSpace 5.5 (notes) Run all updates on DSpace Test and reboot the server Looks like the OAI bug from DSpace 5.1 that caused validation at Base Search to fail is now fixed and DSpace Test passes validation! (#63) Indexing Discovery on DSpace Test took 332 minutes, which is like five times as long as it usually takes At the end it appeared to finish correctly but there were lots of errors right after it finished: 2016-11-02 15:09:48,578 INFO com." />
<meta property="og:type" content="article" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-11/" />
<meta property="og:updated_time" content="2016-11-01T09:21:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="November, 2016">
<meta property="og:description" content="">
<meta property="og:type" content="article">
<meta property="article:published_time" content="2016-11-01T09:21:00&#43;03:00">
<meta property="article:author" content="Alan Orth">
<meta itemprop="name" content="November, 2016">
<meta itemprop="description" content="2016-11-01 Add dc.type to the output options for Atmire&rsquo;s Listings and Reports module (#286) 2016-11-02 Migrate DSpace Test to DSpace 5.5 (notes) Run all updates on DSpace Test and reboot the server Looks like the OAI bug from DSpace 5.1 that caused validation at Base Search to fail is now fixed and DSpace Test passes validation! (#63) Indexing Discovery on DSpace Test took 332 minutes, which is like five times as long as it usually takes At the end it appeared to finish correctly but there were lots of errors right after it finished: 2016-11-02 15:09:48,578 INFO com.">
<meta itemprop="dateModified" content="2016-11-01T09:21:00&#43;03:00" />
<meta itemprop="wordCount" content="1152">
<meta itemprop="keywords" content="notes," />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2016-11/">
<meta name="twitter:card" content="summary"/>
<meta name="twitter:title" content="November, 2016"/>
<meta name="twitter:description" content="2016-11-01 Add dc.type to the output options for Atmire&rsquo;s Listings and Reports module (#286) 2016-11-02 Migrate DSpace Test to DSpace 5.5 (notes) Run all updates on DSpace Test and reboot the server Looks like the OAI bug from DSpace 5.1 that caused validation at Base Search to fail is now fixed and DSpace Test passes validation! (#63) Indexing Discovery on DSpace Test took 332 minutes, which is like five times as long as it usually takes At the end it appeared to finish correctly but there were lots of errors right after it finished: 2016-11-02 15:09:48,578 INFO com."/>
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="November, 2016">
<meta property="twitter:description" content="">
@ -52,8 +65,11 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
</head>
<body>
@ -79,6 +95,8 @@
<div class="col-sm-8 blog-main">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-11/">November, 2016</a></h2>
@ -286,7 +304,7 @@ dspace=# select count(text_value) from metadatavalue where resource_type_id=2 an
</code></pre>
<ul>
<li>Generate a list of all these so I can fix them in batch:</li>
<li>Generate a list of all these so I can maybe fix them in batch:</li>
</ul>
<pre><code>dspace=# \copy (select distinct text_lang, count(*) from metadatavalue where resource_type_id=2 group by text_lang order by count desc) to /tmp/text-langs.csv with csv;
@ -301,16 +319,50 @@ COPY 14
UPDATE 85
</code></pre>
<ul>
<li>The <code>fix-metadata.py</code> script I have is meant for specific metadata values, so if I want to update some <code>text_lang</code> values I should just do it directly in the database</li>
<li>For example, on a limited set:</li>
</ul>
<pre><code>dspace=# update metadatavalue set text_lang=NULL where resource_type_id=2 and metadata_field_id=203 and text_value='LIVESTOCK' and text_lang='';
UPDATE 420
</code></pre>
<ul>
<li>And assuming I want to do it for all fields:</li>
</ul>
<pre><code>dspacetest=# update metadatavalue set text_lang=NULL where resource_type_id=2 and text_lang='';
UPDATE 183726
</code></pre>
<ul>
<li>After that restarted Tomcat and PostgreSQL (because I&rsquo;m superstitious about caches) and now I see the following in REST API query:</li>
</ul>
<pre><code>$ curl -s -H &quot;accept: application/json&quot; -H &quot;Content-Type: application/json&quot; -X POST &quot;http://localhost:8080/rest/items/find-by-metadata-field&quot; -d '{&quot;key&quot;: &quot;cg.subject.ilri&quot;,&quot;value&quot;: &quot;SEEDS&quot;}' | jq length
71
$ curl -s -H &quot;accept: application/json&quot; -H &quot;Content-Type: application/json&quot; -X POST &quot;http://localhost:8080/rest/items/find-by-metadata-field&quot; -d '{&quot;key&quot;: &quot;cg.subject.ilri&quot;,&quot;value&quot;: &quot;SEEDS&quot;, &quot;language&quot;:&quot;&quot;}' | jq length
0
$ curl -s -H &quot;accept: application/json&quot; -H &quot;Content-Type: application/json&quot; -X POST &quot;http://localhost:8080/rest/items/find-by-metadata-field&quot; -d '{&quot;key&quot;: &quot;cg.subject.ilri&quot;,&quot;value&quot;: &quot;SEEDS&quot;, &quot;language&quot;:&quot;en_US&quot;}' | jq length
</code></pre>
<ul>
<li>Not sure what&rsquo;s going on, but Discovery shows 83 values, and database shows 85, so I&rsquo;m going to reindex Discovery just in case</li>
</ul>
</article>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -348,7 +400,6 @@ UPDATE 85
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

6
public/css/cookieconsent.min.css vendored Normal file
View File

@ -0,0 +1,6 @@
.cc-window{opacity:1;transition:opacity 1s ease}.cc-window.cc-invisible{opacity:0}.cc-animate.cc-revoke{transition:transform 1s ease}.cc-animate.cc-revoke.cc-top{transform:translateY(-2em)}.cc-animate.cc-revoke.cc-bottom{transform:translateY(2em)}.cc-animate.cc-revoke.cc-active.cc-bottom,.cc-animate.cc-revoke.cc-active.cc-top,.cc-revoke:hover{transform:translateY(0)}.cc-grower{max-height:0;overflow:hidden;transition:max-height 1s}
.cc-link,.cc-revoke:hover{text-decoration:underline}.cc-revoke,.cc-window{position:fixed;overflow:hidden;box-sizing:border-box;font-family:Helvetica,Calibri,Arial,sans-serif;font-size:16px;line-height:1.5em;display:-ms-flexbox;display:flex;-ms-flex-wrap:nowrap;flex-wrap:nowrap;z-index:9999}.cc-window.cc-static{position:static}.cc-window.cc-floating{padding:2em;max-width:24em;-ms-flex-direction:column;flex-direction:column}.cc-window.cc-banner{padding:1em 1.8em;width:100%;-ms-flex-direction:row;flex-direction:row}.cc-revoke{padding:.5em}.cc-header{font-size:18px;font-weight:700}.cc-btn,.cc-close,.cc-link,.cc-revoke{cursor:pointer}.cc-link{opacity:.8;display:inline-block;padding:.2em}.cc-link:hover{opacity:1}.cc-link:active,.cc-link:visited{color:initial}.cc-btn{display:block;padding:.4em .8em;font-size:.9em;font-weight:700;border-width:2px;border-style:solid;text-align:center;white-space:nowrap}.cc-banner .cc-btn:last-child{min-width:140px}.cc-highlight .cc-btn:first-child{background-color:transparent;border-color:transparent}.cc-highlight .cc-btn:first-child:hover{background-color:transparent;text-decoration:underline}.cc-close{display:block;position:absolute;top:.5em;right:.5em;font-size:1.6em;opacity:.9;line-height:.75}.cc-close:hover{opacity:1}
.cc-revoke.cc-top{top:0;left:3em;border-bottom-left-radius:.5em;border-bottom-right-radius:.5em}.cc-revoke.cc-bottom{bottom:0;left:3em;border-top-left-radius:.5em;border-top-right-radius:.5em}.cc-revoke.cc-left{left:3em;right:unset}.cc-revoke.cc-right{right:3em;left:unset}.cc-top{top:1em}.cc-left{left:1em}.cc-right{right:1em}.cc-bottom{bottom:1em}.cc-floating>.cc-link{margin-bottom:1em}.cc-floating .cc-message{display:block;margin-bottom:1em}.cc-window.cc-floating .cc-compliance{-ms-flex:1;flex:1}.cc-window.cc-banner{-ms-flex-align:center;-ms-grid-row-align:center;align-items:center}.cc-banner.cc-top{left:0;right:0;top:0}.cc-banner.cc-bottom{left:0;right:0;bottom:0}.cc-banner .cc-message{-ms-flex:1;flex:1}.cc-compliance{display:-ms-flexbox;display:flex;-ms-flex-align:center;align-items:center;-ms-flex-line-pack:justify;align-content:space-between}.cc-compliance>.cc-btn{-ms-flex:1;flex:1}.cc-btn+.cc-btn{margin-left:.5em}
@media print{.cc-revoke,.cc-window{display:none}}@media screen and (max-width:900px){.cc-btn{white-space:normal}}@media screen and (max-width:414px) and (orientation:portrait),screen and (max-width:736px) and (orientation:landscape){.cc-window.cc-top{top:0}.cc-window.cc-bottom{bottom:0}.cc-window.cc-banner,.cc-window.cc-left,.cc-window.cc-right{left:0;right:0}.cc-window.cc-banner{-ms-flex-direction:column;flex-direction:column}.cc-window.cc-banner .cc-compliance{-ms-flex:1;flex:1}.cc-window.cc-floating{max-width:none}.cc-window .cc-message{margin-bottom:1em}.cc-window.cc-banner{-ms-flex-align:unset;-ms-grid-row-align:unset;align-items:unset}}
.cc-floating.cc-theme-classic{padding:1.2em;border-radius:5px}.cc-floating.cc-type-info.cc-theme-classic .cc-compliance{text-align:center;display:inline;-ms-flex:none;flex:none}.cc-theme-classic .cc-btn{border-radius:5px}.cc-theme-classic .cc-btn:last-child{min-width:140px}.cc-floating.cc-type-info.cc-theme-classic .cc-btn{display:inline-block}
.cc-theme-edgeless.cc-window{padding:0}.cc-floating.cc-theme-edgeless .cc-message{margin:2em 2em 1.5em}.cc-banner.cc-theme-edgeless .cc-btn{margin:0;padding:.8em 1.8em;height:100%}.cc-banner.cc-theme-edgeless .cc-message{margin-left:1em}.cc-floating.cc-theme-edgeless .cc-btn+.cc-btn{margin-left:0}

File diff suppressed because one or more lines are too long

Binary file not shown.

Binary file not shown.

File diff suppressed because it is too large Load Diff

Before

Width:  |  Height:  |  Size: 382 KiB

After

Width:  |  Height:  |  Size: 434 KiB

Binary file not shown.

View File

@ -2,35 +2,33 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="CGSpace Notes" />
<meta property="og:description" content="" />
<meta property="og:type" content="website" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/" />
<meta property="og:updated_time" content="2016-11-01T09:21:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="CGSpace Notes">
<meta property="og:description" content="">
<meta property="og:type" content="blog">
<meta itemprop="name" content="CGSpace Notes">
<meta itemprop="description" content="">
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/">
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="CGSpace Notes">
<meta property="twitter:description" content="">
@ -49,8 +47,15 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
<link href="https://alanorth.github.io/cgspace-notes/index.xml" rel="alternate" type="application/rss+xml" title="CGSpace Notes" />
<link href="https://alanorth.github.io/cgspace-notes/index.xml" rel="feed" type="application/rss+xml" title="CGSpace Notes" />
</head>
<body>
@ -79,7 +84,9 @@
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-11/">November, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-11-01T09:21:00&#43;03:00">Tue Nov 01, 2016</time> by Alan Orth in
@ -93,7 +100,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-10/">October, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-10-03T15:53:00&#43;03:00">Mon Oct 03, 2016</time> by Alan Orth in
@ -107,7 +116,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-09/">September, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-09-01T15:53:00&#43;03:00">Thu Sep 01, 2016</time> by Alan Orth in
@ -133,7 +144,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-08/">August, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-08-01T15:53:00&#43;03:00">Mon Aug 01, 2016</time> by Alan Orth in
@ -163,7 +176,9 @@ $ git rebase -i dspace-5.5
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-07/">July, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-07-01T10:53:00&#43;03:00">Fri Jul 01, 2016</time> by Alan Orth in
@ -196,7 +211,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-06/">June, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-06-01T10:53:00&#43;03:00">Wed Jun 01, 2016</time> by Alan Orth in
@ -221,7 +238,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-05/">May, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-05-01T23:06:00&#43;03:00">Sun May 01, 2016</time> by Alan Orth in
@ -247,7 +266,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-04/">April, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-04-04T11:06:00&#43;03:00">Mon Apr 04, 2016</time> by Alan Orth in
@ -271,7 +292,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-03/">March, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-03-02T16:50:00&#43;03:00">Wed Mar 02, 2016</time> by Alan Orth in
@ -293,7 +316,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-02/">February, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-02-05T13:18:00&#43;03:00">Fri Feb 05, 2016</time> by Alan Orth in
@ -323,6 +348,7 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
<nav class="blog-pagination">
@ -331,12 +357,12 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
<a class="btn btn-outline-primary" href="/page/2/" role="button">Next page</a>
</nav>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -374,7 +400,6 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -213,7 +213,7 @@ dspace=# select count(text_value) from metadatavalue where resource_type_id=2 an
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;Generate a list of all these so I can fix them in batch:&lt;/li&gt;
&lt;li&gt;Generate a list of all these so I can maybe fix them in batch:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspace=# \copy (select distinct text_lang, count(*) from metadatavalue where resource_type_id=2 group by text_lang order by count desc) to /tmp/text-langs.csv with csv;
@ -227,6 +227,38 @@ COPY 14
&lt;pre&gt;&lt;code&gt;dspace=# update metadatavalue set text_lang=&#39;en_US&#39; where resource_type_id=2 and metadata_field_id=203 and text_value=&#39;SEEDS&#39;;
UPDATE 85
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;The &lt;code&gt;fix-metadata.py&lt;/code&gt; script I have is meant for specific metadata values, so if I want to update some &lt;code&gt;text_lang&lt;/code&gt; values I should just do it directly in the database&lt;/li&gt;
&lt;li&gt;For example, on a limited set:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspace=# update metadatavalue set text_lang=NULL where resource_type_id=2 and metadata_field_id=203 and text_value=&#39;LIVESTOCK&#39; and text_lang=&#39;&#39;;
UPDATE 420
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;And assuming I want to do it for all fields:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspacetest=# update metadatavalue set text_lang=NULL where resource_type_id=2 and text_lang=&#39;&#39;;
UPDATE 183726
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;After that restarted Tomcat and PostgreSQL (because I&amp;rsquo;m superstitious about caches) and now I see the following in REST API query:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;}&#39; | jq length
71
$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;, &amp;quot;language&amp;quot;:&amp;quot;&amp;quot;}&#39; | jq length
0
$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;, &amp;quot;language&amp;quot;:&amp;quot;en_US&amp;quot;}&#39; | jq length
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;Not sure what&amp;rsquo;s going on, but Discovery shows 83 values, and database shows 85, so I&amp;rsquo;m going to reindex Discovery just in case&lt;/li&gt;
&lt;/ul&gt;
</description>
</item>

1
public/js/cookieconsent.min.js vendored Normal file

File diff suppressed because one or more lines are too long

View File

@ -2,35 +2,33 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="CGSpace Notes" />
<meta property="og:description" content="" />
<meta property="og:type" content="website" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/" />
<meta property="og:updated_time" content="2016-01-13T13:18:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="CGSpace Notes">
<meta property="og:description" content="">
<meta property="og:type" content="blog">
<meta itemprop="name" content="CGSpace Notes">
<meta itemprop="description" content="">
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/">
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="CGSpace Notes">
<meta property="twitter:description" content="">
@ -49,8 +47,15 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
<link href="https://alanorth.github.io/cgspace-notes/index.xml" rel="alternate" type="application/rss+xml" title="CGSpace Notes" />
<link href="https://alanorth.github.io/cgspace-notes/index.xml" rel="feed" type="application/rss+xml" title="CGSpace Notes" />
</head>
<body>
@ -79,7 +84,9 @@
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-01/">January, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-01-13T13:18:00&#43;03:00">Wed Jan 13, 2016</time> by Alan Orth in
@ -101,7 +108,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2015-12/">December, 2015</a></h2>
<p class="blog-post-meta"><time datetime="2015-12-02T13:18:00&#43;03:00">Wed Dec 02, 2015</time> by Alan Orth in
@ -128,7 +137,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2015-11/">November, 2015</a></h2>
<p class="blog-post-meta"><time datetime="2015-11-23T17:00:57&#43;03:00">Mon Nov 23, 2015</time> by Alan Orth in
@ -155,6 +166,7 @@
<nav class="blog-pagination">
@ -163,12 +175,12 @@
</nav>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -206,7 +218,6 @@
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,35 +2,33 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="Posts" />
<meta property="og:description" content="" />
<meta property="og:type" content="website" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/post/" />
<meta property="og:updated_time" content="2016-11-01T09:21:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="Posts">
<meta property="og:description" content="">
<meta property="og:type" content="blog">
<meta itemprop="name" content="Posts">
<meta itemprop="description" content="">
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/post/">
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="Posts">
<meta property="twitter:description" content="">
@ -49,8 +47,15 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
<link href="https://alanorth.github.io/cgspace-notes/post/index.xml" rel="alternate" type="application/rss+xml" title="CGSpace Notes" />
<link href="https://alanorth.github.io/cgspace-notes/post/index.xml" rel="feed" type="application/rss+xml" title="CGSpace Notes" />
</head>
<body>
@ -79,7 +84,9 @@
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-11/">November, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-11-01T09:21:00&#43;03:00">Tue Nov 01, 2016</time> by Alan Orth in
@ -93,7 +100,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-10/">October, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-10-03T15:53:00&#43;03:00">Mon Oct 03, 2016</time> by Alan Orth in
@ -107,7 +116,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-09/">September, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-09-01T15:53:00&#43;03:00">Thu Sep 01, 2016</time> by Alan Orth in
@ -133,7 +144,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-08/">August, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-08-01T15:53:00&#43;03:00">Mon Aug 01, 2016</time> by Alan Orth in
@ -163,7 +176,9 @@ $ git rebase -i dspace-5.5
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-07/">July, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-07-01T10:53:00&#43;03:00">Fri Jul 01, 2016</time> by Alan Orth in
@ -196,7 +211,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-06/">June, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-06-01T10:53:00&#43;03:00">Wed Jun 01, 2016</time> by Alan Orth in
@ -221,7 +238,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-05/">May, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-05-01T23:06:00&#43;03:00">Sun May 01, 2016</time> by Alan Orth in
@ -247,7 +266,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-04/">April, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-04-04T11:06:00&#43;03:00">Mon Apr 04, 2016</time> by Alan Orth in
@ -271,7 +292,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-03/">March, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-03-02T16:50:00&#43;03:00">Wed Mar 02, 2016</time> by Alan Orth in
@ -293,7 +316,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-02/">February, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-02-05T13:18:00&#43;03:00">Fri Feb 05, 2016</time> by Alan Orth in
@ -323,6 +348,7 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
<nav class="blog-pagination">
@ -331,12 +357,12 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
<a class="btn btn-outline-primary" href="/post/page/2/" role="button">Next page</a>
</nav>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -374,7 +400,6 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -213,7 +213,7 @@ dspace=# select count(text_value) from metadatavalue where resource_type_id=2 an
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;Generate a list of all these so I can fix them in batch:&lt;/li&gt;
&lt;li&gt;Generate a list of all these so I can maybe fix them in batch:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspace=# \copy (select distinct text_lang, count(*) from metadatavalue where resource_type_id=2 group by text_lang order by count desc) to /tmp/text-langs.csv with csv;
@ -227,6 +227,38 @@ COPY 14
&lt;pre&gt;&lt;code&gt;dspace=# update metadatavalue set text_lang=&#39;en_US&#39; where resource_type_id=2 and metadata_field_id=203 and text_value=&#39;SEEDS&#39;;
UPDATE 85
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;The &lt;code&gt;fix-metadata.py&lt;/code&gt; script I have is meant for specific metadata values, so if I want to update some &lt;code&gt;text_lang&lt;/code&gt; values I should just do it directly in the database&lt;/li&gt;
&lt;li&gt;For example, on a limited set:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspace=# update metadatavalue set text_lang=NULL where resource_type_id=2 and metadata_field_id=203 and text_value=&#39;LIVESTOCK&#39; and text_lang=&#39;&#39;;
UPDATE 420
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;And assuming I want to do it for all fields:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspacetest=# update metadatavalue set text_lang=NULL where resource_type_id=2 and text_lang=&#39;&#39;;
UPDATE 183726
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;After that restarted Tomcat and PostgreSQL (because I&amp;rsquo;m superstitious about caches) and now I see the following in REST API query:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;}&#39; | jq length
71
$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;, &amp;quot;language&amp;quot;:&amp;quot;&amp;quot;}&#39; | jq length
0
$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;, &amp;quot;language&amp;quot;:&amp;quot;en_US&amp;quot;}&#39; | jq length
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;Not sure what&amp;rsquo;s going on, but Discovery shows 83 values, and database shows 85, so I&amp;rsquo;m going to reindex Discovery just in case&lt;/li&gt;
&lt;/ul&gt;
</description>
</item>

View File

@ -2,35 +2,33 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="Posts" />
<meta property="og:description" content="" />
<meta property="og:type" content="website" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/post/" />
<meta property="og:updated_time" content="2016-01-13T13:18:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="Posts">
<meta property="og:description" content="">
<meta property="og:type" content="blog">
<meta itemprop="name" content="Posts">
<meta itemprop="description" content="">
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/post/">
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="Posts">
<meta property="twitter:description" content="">
@ -49,8 +47,15 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
<link href="https://alanorth.github.io/cgspace-notes/post/index.xml" rel="alternate" type="application/rss+xml" title="CGSpace Notes" />
<link href="https://alanorth.github.io/cgspace-notes/post/index.xml" rel="feed" type="application/rss+xml" title="CGSpace Notes" />
</head>
<body>
@ -79,7 +84,9 @@
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-01/">January, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-01-13T13:18:00&#43;03:00">Wed Jan 13, 2016</time> by Alan Orth in
@ -101,7 +108,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2015-12/">December, 2015</a></h2>
<p class="blog-post-meta"><time datetime="2015-12-02T13:18:00&#43;03:00">Wed Dec 02, 2015</time> by Alan Orth in
@ -128,7 +137,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2015-11/">November, 2015</a></h2>
<p class="blog-post-meta"><time datetime="2015-11-23T17:00:57&#43;03:00">Mon Nov 23, 2015</time> by Alan Orth in
@ -155,6 +166,7 @@
<nav class="blog-pagination">
@ -163,12 +175,12 @@
</nav>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -206,7 +218,6 @@
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -2,35 +2,33 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="Notes" />
<meta property="og:description" content="" />
<meta property="og:type" content="website" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/tags/notes/" />
<meta property="og:updated_time" content="2016-11-01T09:21:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="Notes">
<meta property="og:description" content="">
<meta property="og:type" content="blog">
<meta itemprop="name" content="Notes">
<meta itemprop="description" content="">
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/tags/notes/">
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="Notes">
<meta property="twitter:description" content="">
@ -49,8 +47,15 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
<link href="https://alanorth.github.io/cgspace-notes/tags/notes/index.xml" rel="alternate" type="application/rss+xml" title="CGSpace Notes" />
<link href="https://alanorth.github.io/cgspace-notes/tags/notes/index.xml" rel="feed" type="application/rss+xml" title="CGSpace Notes" />
</head>
<body>
@ -79,7 +84,9 @@
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-11/">November, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-11-01T09:21:00&#43;03:00">Tue Nov 01, 2016</time> by Alan Orth in
@ -93,7 +100,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-10/">October, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-10-03T15:53:00&#43;03:00">Mon Oct 03, 2016</time> by Alan Orth in
@ -107,7 +116,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-09/">September, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-09-01T15:53:00&#43;03:00">Thu Sep 01, 2016</time> by Alan Orth in
@ -133,7 +144,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-08/">August, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-08-01T15:53:00&#43;03:00">Mon Aug 01, 2016</time> by Alan Orth in
@ -163,7 +176,9 @@ $ git rebase -i dspace-5.5
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-07/">July, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-07-01T10:53:00&#43;03:00">Fri Jul 01, 2016</time> by Alan Orth in
@ -196,7 +211,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-06/">June, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-06-01T10:53:00&#43;03:00">Wed Jun 01, 2016</time> by Alan Orth in
@ -221,7 +238,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-05/">May, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-05-01T23:06:00&#43;03:00">Sun May 01, 2016</time> by Alan Orth in
@ -247,7 +266,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-04/">April, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-04-04T11:06:00&#43;03:00">Mon Apr 04, 2016</time> by Alan Orth in
@ -271,7 +292,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-03/">March, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-03-02T16:50:00&#43;03:00">Wed Mar 02, 2016</time> by Alan Orth in
@ -293,7 +316,9 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-02/">February, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-02-05T13:18:00&#43;03:00">Fri Feb 05, 2016</time> by Alan Orth in
@ -323,6 +348,7 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
<nav class="blog-pagination">
@ -331,12 +357,12 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
<a class="btn btn-outline-primary" href="/tags/notes/page/2/" role="button">Next page</a>
</nav>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -374,7 +400,6 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

View File

@ -212,7 +212,7 @@ dspace=# select count(text_value) from metadatavalue where resource_type_id=2 an
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;Generate a list of all these so I can fix them in batch:&lt;/li&gt;
&lt;li&gt;Generate a list of all these so I can maybe fix them in batch:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspace=# \copy (select distinct text_lang, count(*) from metadatavalue where resource_type_id=2 group by text_lang order by count desc) to /tmp/text-langs.csv with csv;
@ -226,6 +226,38 @@ COPY 14
&lt;pre&gt;&lt;code&gt;dspace=# update metadatavalue set text_lang=&#39;en_US&#39; where resource_type_id=2 and metadata_field_id=203 and text_value=&#39;SEEDS&#39;;
UPDATE 85
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;The &lt;code&gt;fix-metadata.py&lt;/code&gt; script I have is meant for specific metadata values, so if I want to update some &lt;code&gt;text_lang&lt;/code&gt; values I should just do it directly in the database&lt;/li&gt;
&lt;li&gt;For example, on a limited set:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspace=# update metadatavalue set text_lang=NULL where resource_type_id=2 and metadata_field_id=203 and text_value=&#39;LIVESTOCK&#39; and text_lang=&#39;&#39;;
UPDATE 420
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;And assuming I want to do it for all fields:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;dspacetest=# update metadatavalue set text_lang=NULL where resource_type_id=2 and text_lang=&#39;&#39;;
UPDATE 183726
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;After that restarted Tomcat and PostgreSQL (because I&amp;rsquo;m superstitious about caches) and now I see the following in REST API query:&lt;/li&gt;
&lt;/ul&gt;
&lt;pre&gt;&lt;code&gt;$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;}&#39; | jq length
71
$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;, &amp;quot;language&amp;quot;:&amp;quot;&amp;quot;}&#39; | jq length
0
$ curl -s -H &amp;quot;accept: application/json&amp;quot; -H &amp;quot;Content-Type: application/json&amp;quot; -X POST &amp;quot;http://localhost:8080/rest/items/find-by-metadata-field&amp;quot; -d &#39;{&amp;quot;key&amp;quot;: &amp;quot;cg.subject.ilri&amp;quot;,&amp;quot;value&amp;quot;: &amp;quot;SEEDS&amp;quot;, &amp;quot;language&amp;quot;:&amp;quot;en_US&amp;quot;}&#39; | jq length
&lt;/code&gt;&lt;/pre&gt;
&lt;ul&gt;
&lt;li&gt;Not sure what&amp;rsquo;s going on, but Discovery shows 83 values, and database shows 85, so I&amp;rsquo;m going to reindex Discovery just in case&lt;/li&gt;
&lt;/ul&gt;
</description>
</item>

View File

@ -2,35 +2,33 @@
<html lang="en">
<head>
<meta charset="utf-8">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta name="description" content="">
<meta name="author" content="Alan Orth">
<meta property="og:title" content="Notes" />
<meta property="og:description" content="" />
<meta property="og:type" content="website" />
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/tags/notes/" />
<meta property="og:updated_time" content="2016-01-13T13:18:00&#43;03:00"/>
<!-- OpenGraph Metadata: http://ogp.me/ -->
<meta property="og:title" content="Notes">
<meta property="og:description" content="">
<meta property="og:type" content="blog">
<meta itemprop="name" content="Notes">
<meta itemprop="description" content="">
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/tags/notes/">
<!-- Metadata for Twitter: https://dev.twitter.com/cards/markup -->
<meta property="twitter:card" content="summary">
<meta property="twitter:title" content="Notes">
<meta property="twitter:description" content="">
@ -49,8 +47,15 @@
<!-- combined, minified CSS -->
<link href="https://alanorth.github.io/cgspace-notes/css/style.css" rel="stylesheet">
<!-- RSS 2.0 feed -->
<link href="https://alanorth.github.io/cgspace-notes/index.xml" type="application/rss+xml" rel="alternate">
<link href="https://alanorth.github.io/cgspace-notes/tags/notes/index.xml" rel="alternate" type="application/rss+xml" title="CGSpace Notes" />
<link href="https://alanorth.github.io/cgspace-notes/tags/notes/index.xml" rel="feed" type="application/rss+xml" title="CGSpace Notes" />
</head>
<body>
@ -79,7 +84,9 @@
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-01/">January, 2016</a></h2>
<p class="blog-post-meta"><time datetime="2016-01-13T13:18:00&#43;03:00">Wed Jan 13, 2016</time> by Alan Orth in
@ -101,7 +108,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2015-12/">December, 2015</a></h2>
<p class="blog-post-meta"><time datetime="2015-12-02T13:18:00&#43;03:00">Wed Dec 02, 2015</time> by Alan Orth in
@ -128,7 +137,9 @@
</article>
<article class="blog-post">
<article class="blog-post">
<header>
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2015-11/">November, 2015</a></h2>
<p class="blog-post-meta"><time datetime="2015-11-23T17:00:57&#43;03:00">Mon Nov 23, 2015</time> by Alan Orth in
@ -155,6 +166,7 @@
<nav class="blog-pagination">
@ -163,12 +175,12 @@
</nav>
</div> <!-- /.blog-main -->
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
<aside class="col-sm-3 offset-sm-1 blog-sidebar">
@ -206,7 +218,6 @@
</aside>
</div> <!-- /.row -->
</div> <!-- /.container -->

@ -1 +1 @@
Subproject commit 5f5f8191dfb5078f1c53474272974e64bb195db8
Subproject commit e3f93bd38bd2c9d7aadf550b5d323ad45c566b0b