diff --git a/content/post/2017-04.md b/content/post/2017-04.md index f41f5f0ef..988893917 100644 --- a/content/post/2017-04.md +++ b/content/post/2017-04.md @@ -12,4 +12,36 @@ tags = ["Notes"] ![dc.rights in the submission form](/cgspace-notes/2017/04/dc-rights.png) +- Remove redundant/duplicate text in the DSpace submission license +- Testing the CMYK patch on a collection with 650 items: + +``` +$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt +``` + + +## 2017-04-03 + +- Continue testing the CMYK patch on more communities: + +``` +$ [dspace]/bin/dspace filter-media -f -i 10568/1 -p "ImageMagick PDF Thumbnail" -v >> /tmp/filter-media-cmyk.txt 2>&1 +``` + +- So far there are almost 500: + +``` +$ grep -c profile /tmp/filter-media-cmyk.txt +484 +``` + +- Looking at the CG Core document again, I'll send some feedback to Peter and Abenet: + - We use cg.contributor.crp to indicate the CRP(s) affiliated with the item + - DSpace has dc.date.available, but this field isn't particularly meaningful other than as an automatic timestamp at the time of item accession (and is identical to dc.date.accessioned) + - dc.relation exists in CGSpace, but isn't used—rather dc.relation.ispartofseries, which is used ~5,000 times to Series name and number within that series +- Also, I'm noticing some weird outliers in `cg.coverage.region`, need to remember to go correct these later: + +``` +dspace=# select text_value from metadatavalue where resource_type_id=2 and metadata_field_id=227; +``` diff --git a/public/2015-11/index.html b/public/2015-11/index.html index c7adf0049..9f100cbce 100644 --- a/public/2015-11/index.html +++ b/public/2015-11/index.html @@ -25,7 +25,7 @@ $ psql -c 'SELECT * from pg_stat_activity;' | grep idle | grep -c cgspac - + @@ -71,7 +71,7 @@ $ psql -c 'SELECT * from pg_stat_activity;' | grep idle | grep -c cgspac "url": "https://alanorth.github.io/cgspace-notes/2015-11/", "wordCount": "798", 
"datePublished": "2015-11-23T17:00:57+03:00", - "dateModified": "2015-11-23T17:00:57+03:00", + "dateModified": "2016-09-28T17:02:30+03:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2015-12/index.html b/public/2015-12/index.html index 933b0eab5..a40bfce2a 100644 --- a/public/2015-12/index.html +++ b/public/2015-12/index.html @@ -26,7 +26,7 @@ Replace lzop with xz in log compression cron jobs on DSpace Test—it uses less - + @@ -73,7 +73,7 @@ Replace lzop with xz in log compression cron jobs on DSpace Test—it uses less "url": "https://alanorth.github.io/cgspace-notes/2015-12/", "wordCount": "753", "datePublished": "2015-12-02T13:18:00+03:00", - "dateModified": "2015-12-02T13:18:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-01/index.html b/public/2016-01/index.html index 28a36a744..c68e3537f 100644 --- a/public/2016-01/index.html +++ b/public/2016-01/index.html @@ -21,7 +21,7 @@ Update GitHub wiki for documentation of maintenance tasks. - + @@ -63,7 +63,7 @@ Update GitHub wiki for documentation of maintenance tasks. 
"url": "https://alanorth.github.io/cgspace-notes/2016-01/", "wordCount": "466", "datePublished": "2016-01-13T13:18:00+03:00", - "dateModified": "2016-01-13T13:18:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-02/index.html b/public/2016-02/index.html index 99dd1e1ea..38888e1de 100644 --- a/public/2016-02/index.html +++ b/public/2016-02/index.html @@ -28,7 +28,7 @@ Also, lots of things like “COTE D`LVOIRE” and “COTE D IVOIRE&r - + @@ -77,7 +77,7 @@ Also, lots of things like “COTE D`LVOIRE” and “COTE D IVOIRE&r "url": "https://alanorth.github.io/cgspace-notes/2016-02/", "wordCount": "1657", "datePublished": "2016-02-05T13:18:00+03:00", - "dateModified": "2016-02-05T13:18:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-03/index.html b/public/2016-03/index.html index 66643832c..033196aa1 100644 --- a/public/2016-03/index.html +++ b/public/2016-03/index.html @@ -21,7 +21,7 @@ Reinstall my local (Mac OS X) DSpace stack with Tomcat 7, PostgreSQL 9.3, and Ja - + @@ -63,7 +63,7 @@ Reinstall my local (Mac OS X) DSpace stack with Tomcat 7, PostgreSQL 9.3, and Ja "url": "https://alanorth.github.io/cgspace-notes/2016-03/", "wordCount": "1581", "datePublished": "2016-03-02T16:50:00+03:00", - "dateModified": "2016-03-02T16:50:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-04/index.html b/public/2016-04/index.html index c7980c46a..fc8532a34 100644 --- a/public/2016-04/index.html +++ b/public/2016-04/index.html @@ -23,7 +23,7 @@ Also, I noticed the checker log has some errors we should pay attention to: - + @@ -67,7 +67,7 @@ Also, I noticed the checker log has some errors we should pay attention to: "url": "https://alanorth.github.io/cgspace-notes/2016-04/", "wordCount": "2006", "datePublished": "2016-04-04T11:06:00+03:00", - 
"dateModified": "2016-04-04T11:06:00+03:00", + "dateModified": "2016-09-28T17:02:30+03:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-05/index.html b/public/2016-05/index.html index d8e1a3e1b..952bd7243 100644 --- a/public/2016-05/index.html +++ b/public/2016-05/index.html @@ -25,7 +25,7 @@ There are 3,000 IPs accessing the REST API in a 24-hour period! - + @@ -71,7 +71,7 @@ There are 3,000 IPs accessing the REST API in a 24-hour period! "url": "https://alanorth.github.io/cgspace-notes/2016-05/", "wordCount": "1349", "datePublished": "2016-05-01T23:06:00+03:00", - "dateModified": "2016-05-01T23:06:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-06/index.html b/public/2016-06/index.html index 2071346be..5489ac1d5 100644 --- a/public/2016-06/index.html +++ b/public/2016-06/index.html @@ -24,7 +24,7 @@ Working on second phase of metadata migration, looks like this will work for mov - + @@ -69,7 +69,7 @@ Working on second phase of metadata migration, looks like this will work for mov "url": "https://alanorth.github.io/cgspace-notes/2016-06/", "wordCount": "1549", "datePublished": "2016-06-01T10:53:00+03:00", - "dateModified": "2016-06-01T10:53:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-07/index.html b/public/2016-07/index.html index 59ac884fd..52a43fc3e 100644 --- a/public/2016-07/index.html +++ b/public/2016-07/index.html @@ -32,7 +32,7 @@ In this case the select query was showing 95 results before the update - + @@ -85,7 +85,7 @@ In this case the select query was showing 95 results before the update "url": "https://alanorth.github.io/cgspace-notes/2016-07/", "wordCount": "866", "datePublished": "2016-07-01T10:53:00+03:00", - "dateModified": "2016-07-01T10:53:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan 
Orth" diff --git a/public/2016-08/index.html b/public/2016-08/index.html index 69a52c7c9..ffc13933d 100644 --- a/public/2016-08/index.html +++ b/public/2016-08/index.html @@ -29,7 +29,7 @@ $ git rebase -i dspace-5.5 - + @@ -79,7 +79,7 @@ $ git rebase -i dspace-5.5 "url": "https://alanorth.github.io/cgspace-notes/2016-08/", "wordCount": "1514", "datePublished": "2016-08-01T15:53:00+03:00", - "dateModified": "2016-08-01T15:53:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-09/index.html b/public/2016-09/index.html index 88d1e5e73..237df471d 100644 --- a/public/2016-09/index.html +++ b/public/2016-09/index.html @@ -25,7 +25,7 @@ $ ldapsearch -x -H ldaps://svcgroot2.cgiarad.org:3269/ -b "dc=cgiarad,dc=or - + @@ -71,7 +71,7 @@ $ ldapsearch -x -H ldaps://svcgroot2.cgiarad.org:3269/ -b "dc=cgiarad,dc=or "url": "https://alanorth.github.io/cgspace-notes/2016-09/", "wordCount": "3298", "datePublished": "2016-09-01T15:53:00+03:00", - "dateModified": "2016-09-01T15:53:00+03:00", + "dateModified": "2017-01-09T16:18:07+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-10/index.html b/public/2016-10/index.html index 15e4263f2..26131c510 100644 --- a/public/2016-10/index.html +++ b/public/2016-10/index.html @@ -29,7 +29,7 @@ I exported a random item’s metadata as CSV, deleted all columns except id - + @@ -79,7 +79,7 @@ I exported a random item’s metadata as CSV, deleted all columns except id "url": "https://alanorth.github.io/cgspace-notes/2016-10/", "wordCount": "1828", "datePublished": "2016-10-03T15:53:00+03:00", - "dateModified": "2016-10-03T15:53:00+03:00", + "dateModified": "2017-01-10T16:21:47+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-11/index.html b/public/2016-11/index.html index a59faf43b..267a25ac6 100644 --- a/public/2016-11/index.html +++ b/public/2016-11/index.html @@ -21,7 +21,7 @@ Add dc.type to the output 
options for Atmire’s Listings and Reports module - + @@ -63,7 +63,7 @@ Add dc.type to the output options for Atmire’s Listings and Reports module "url": "https://alanorth.github.io/cgspace-notes/2016-11/", "wordCount": "2825", "datePublished": "2016-11-01T09:21:00+03:00", - "dateModified": "2016-11-01T09:21:00+03:00", + "dateModified": "2017-01-10T16:21:47+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2016-12/index.html b/public/2016-12/index.html index 1a01ff5af..9313db0cd 100644 --- a/public/2016-12/index.html +++ b/public/2016-12/index.html @@ -33,7 +33,7 @@ Another worrying error from dspace.log is: - + @@ -87,7 +87,7 @@ Another worrying error from dspace.log is: "url": "https://alanorth.github.io/cgspace-notes/2016-12/", "wordCount": "4078", "datePublished": "2016-12-02T10:43:00+03:00", - "dateModified": "2016-12-02T10:43:00+03:00", + "dateModified": "2017-01-10T16:21:47+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2017-01/index.html b/public/2017-01/index.html index b3f04adf6..de5c2a326 100644 --- a/public/2017-01/index.html +++ b/public/2017-01/index.html @@ -21,7 +21,7 @@ I asked on the dspace-tech mailing list because it seems to be broken, and actua - + @@ -63,7 +63,7 @@ I asked on the dspace-tech mailing list because it seems to be broken, and actua "url": "https://alanorth.github.io/cgspace-notes/2017-01/", "wordCount": "1594", "datePublished": "2017-01-02T10:43:00+03:00", - "dateModified": "2017-01-02T10:43:00+03:00", + "dateModified": "2017-01-29T13:18:32+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2017-02/index.html b/public/2017-02/index.html index 51c0021a8..e58cc6b91 100644 --- a/public/2017-02/index.html +++ b/public/2017-02/index.html @@ -35,7 +35,7 @@ Looks like we’ll be using cg.identifier.ccafsprojectpii as the field name - + @@ -91,7 +91,7 @@ Looks like we’ll be using cg.identifier.ccafsprojectpii as the field name "url": 
"https://alanorth.github.io/cgspace-notes/2017-02/", "wordCount": "2028", "datePublished": "2017-02-07T07:04:52-08:00", - "dateModified": "2017-02-07T07:04:52-08:00", + "dateModified": "2017-02-28T22:58:29+02:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2017-03/index.html b/public/2017-03/index.html index 114c23b71..631fa0aaa 100644 --- a/public/2017-03/index.html +++ b/public/2017-03/index.html @@ -37,7 +37,7 @@ $ identify ~/Desktop/alc_contrastes_desafios.jpg - + @@ -95,7 +95,7 @@ $ identify ~/Desktop/alc_contrastes_desafios.jpg "url": "https://alanorth.github.io/cgspace-notes/2017-03/", "wordCount": "1538", "datePublished": "2017-03-01T17:08:52+02:00", - "dateModified": "2017-03-01T17:08:52+02:00", + "dateModified": "2017-03-31T05:36:10+03:00", "author": { "@type": "Person", "name": "Alan Orth" diff --git a/public/2017-04/index.html b/public/2017-04/index.html index 77dc75838..cabf51509 100644 --- a/public/2017-04/index.html +++ b/public/2017-04/index.html @@ -15,6 +15,14 @@ Quick proof-of-concept hack to add dc.rights to the input form, including some i + +Remove redundant/duplicate text in the DSpace submission license +Testing the CMYK patch on a collection with 650 items: + + +$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt + + " /> @@ -22,7 +30,7 @@ Quick proof-of-concept hack to add dc.rights to the input form, including some i - + @@ -51,6 +59,14 @@ Quick proof-of-concept hack to add dc.rights to the input form, including some i + +Remove redundant/duplicate text in the DSpace submission license +Testing the CMYK patch on a collection with 650 items: + + +$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt + + "/> @@ -63,9 +79,9 @@ Quick proof-of-concept hack to add dc.rights to the input form, including some i "@type": "BlogPosting", "headline": "April, 2017", "url": 
"https://alanorth.github.io/cgspace-notes/2017-04/", - "wordCount": "33", + "wordCount": "197", "datePublished": "2017-04-02T17:08:52+02:00", - "dateModified": "2017-04-02T17:08:52+02:00", + "dateModified": "2017-04-02T17:57:26+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -138,8 +154,47 @@ Quick proof-of-concept hack to add dc.rights to the input form, including some i
$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt
+
+
+$ [dspace]/bin/dspace filter-media -f -i 10568/1 -p "ImageMagick PDF Thumbnail" -v >> /tmp/filter-media-cmyk.txt 2>&1
+
+
+$ grep -c profile /tmp/filter-media-cmyk.txt
+484
+
+
+cg.coverage.region
, need to remember to go correct these later:dspace=# select text_value from metadatavalue where resource_type_id=2 and metadata_field_id=227;
+
+
diff --git a/public/index.html b/public/index.html
index f10ed23de..9cd1a250e 100644
--- a/public/index.html
+++ b/public/index.html
@@ -112,6 +112,14 @@
$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt
+
+
Read more →
diff --git a/public/index.xml b/public/index.xml
index e94798833..4543c4ffb 100644
--- a/public/index.xml
+++ b/public/index.xml
@@ -24,7 +24,46 @@
<p><img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2017/04/dc-rights.png" alt="dc.rights in the submission form" /></p>
-<p></p>
+<ul>
+<li>Remove redundant/duplicate text in the DSpace submission license</li>
+<li>Testing the CMYK patch on a collection with 650 items:</li>
+</ul>
+
+<pre><code>$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt
+</code></pre>
+
+<p></p>
+
+<h2 id="2017-04-03">2017-04-03</h2>
+
+<ul>
+<li>Continue testing the CMYK patch on more communities:</li>
+</ul>
+
+<pre><code>$ [dspace]/bin/dspace filter-media -f -i 10568/1 -p "ImageMagick PDF Thumbnail" -v >> /tmp/filter-media-cmyk.txt 2>&1
+</code></pre>
+
+<ul>
+<li>So far there are almost 500:</li>
+</ul>
+
+<pre><code>$ grep -c profile /tmp/filter-media-cmyk.txt
+484
+</code></pre>
+
+<ul>
+<li>Looking at the CG Core document again, I’ll send some feedback to Peter and Abenet:
+
+<ul>
+<li>We use cg.contributor.crp to indicate the CRP(s) affiliated with the item</li>
+<li>DSpace has dc.date.available, but this field isn’t particularly meaningful other than as an automatic timestamp at the time of item accession (and is identical to dc.date.accessioned)</li>
+<li>dc.relation exists in CGSpace, but isn’t used—rather dc.relation.ispartofseries, which is used ~5,000 times to record the series name and number within that series</li>
+</ul></li>
+<li>Also, I’m noticing some weird outliers in <code>cg.coverage.region</code>, need to remember to go correct these later:</li>
+</ul>
+
+<pre><code>dspace=# select text_value from metadatavalue where resource_type_id=2 and metadata_field_id=227;
+</code></pre>
$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt
+
+
Read more →
diff --git a/public/post/index.xml b/public/post/index.xml
index b74a131ea..c4c5808ac 100644
--- a/public/post/index.xml
+++ b/public/post/index.xml
@@ -24,7 +24,46 @@
<p><img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2017/04/dc-rights.png" alt="dc.rights in the submission form" /></p>
-<p></p>
+<ul>
+<li>Remove redundant/duplicate text in the DSpace submission license</li>
+<li>Testing the CMYK patch on a collection with 650 items:</li>
+</ul>
+
+<pre><code>$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt
+</code></pre>
+
+<p></p>
+
+<h2 id="2017-04-03">2017-04-03</h2>
+
+<ul>
+<li>Continue testing the CMYK patch on more communities:</li>
+</ul>
+
+<pre><code>$ [dspace]/bin/dspace filter-media -f -i 10568/1 -p "ImageMagick PDF Thumbnail" -v >> /tmp/filter-media-cmyk.txt 2>&1
+</code></pre>
+
+<ul>
+<li>So far there are almost 500:</li>
+</ul>
+
+<pre><code>$ grep -c profile /tmp/filter-media-cmyk.txt
+484
+</code></pre>
+
+<ul>
+<li>Looking at the CG Core document again, I’ll send some feedback to Peter and Abenet:
+
+<ul>
+<li>We use cg.contributor.crp to indicate the CRP(s) affiliated with the item</li>
+<li>DSpace has dc.date.available, but this field isn’t particularly meaningful other than as an automatic timestamp at the time of item accession (and is identical to dc.date.accessioned)</li>
+<li>dc.relation exists in CGSpace, but isn’t used—rather dc.relation.ispartofseries, which is used ~5,000 times to record the series name and number within that series</li>
+</ul></li>
+<li>Also, I’m noticing some weird outliers in <code>cg.coverage.region</code>, need to remember to go correct these later:</li>
+</ul>
+
+<pre><code>dspace=# select text_value from metadatavalue where resource_type_id=2 and metadata_field_id=227;
+</code></pre>
$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt
+
+
Read more →
diff --git a/public/tags/notes/index.xml b/public/tags/notes/index.xml
index ad889a186..cf19bc4f0 100644
--- a/public/tags/notes/index.xml
+++ b/public/tags/notes/index.xml
@@ -23,7 +23,46 @@
<p><img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2017/04/dc-rights.png" alt="dc.rights in the submission form" /></p>
-<p></p>
+<ul>
+<li>Remove redundant/duplicate text in the DSpace submission license</li>
+<li>Testing the CMYK patch on a collection with 650 items:</li>
+</ul>
+
+<pre><code>$ [dspace]/bin/dspace filter-media -f -i 10568/16498 -p "ImageMagick PDF Thumbnail" -v >& /tmp/filter-media-cmyk.txt
+</code></pre>
+
+<p></p>
+
+<h2 id="2017-04-03">2017-04-03</h2>
+
+<ul>
+<li>Continue testing the CMYK patch on more communities:</li>
+</ul>
+
+<pre><code>$ [dspace]/bin/dspace filter-media -f -i 10568/1 -p "ImageMagick PDF Thumbnail" -v >> /tmp/filter-media-cmyk.txt 2>&1
+</code></pre>
+
+<ul>
+<li>So far there are almost 500:</li>
+</ul>
+
+<pre><code>$ grep -c profile /tmp/filter-media-cmyk.txt
+484
+</code></pre>
+
+<ul>
+<li>Looking at the CG Core document again, I’ll send some feedback to Peter and Abenet:
+
+<ul>
+<li>We use cg.contributor.crp to indicate the CRP(s) affiliated with the item</li>
+<li>DSpace has dc.date.available, but this field isn’t particularly meaningful other than as an automatic timestamp at the time of item accession (and is identical to dc.date.accessioned)</li>
+<li>dc.relation exists in CGSpace, but isn’t used—rather dc.relation.ispartofseries, which is used ~5,000 times to record the series name and number within that series</li>
+</ul></li>
+<li>Also, I’m noticing some weird outliers in <code>cg.coverage.region</code>, need to remember to go correct these later:</li>
+</ul>
+
+<pre><code>dspace=# select text_value from metadatavalue where resource_type_id=2 and metadata_field_id=227;
+</code></pre>