mirror of
https://github.com/alanorth/cgspace-notes.git
synced 2024-11-29 09:58:22 +01:00
Add notes for 2019-05-27
This commit is contained in:
parent
48c14002d1
commit
9e2cca9df8
@ -418,4 +418,29 @@ $ ./delete-metadata-values.py -i /tmp/2019-05-17-delete-14-Investors.csv -db dsp
|
|||||||
$ dspace import -a -e me@cgiar.org -m 2019-05-25-AfricaRice.map -s /tmp/SimpleArchiveFormat
|
$ dspace import -a -e me@cgiar.org -m 2019-05-25-AfricaRice.map -s /tmp/SimpleArchiveFormat
|
||||||
```
|
```
|
||||||
|
|
||||||
|
## 2019-05-27
|
||||||
|
|
||||||
|
- Peter sent me over two thousand corrections for the authors on CGSpace that I had dumped last month
|
||||||
|
- I proofed them for whitespace and invalid special characters in OpenRefine and then applied them on CGSpace and DSpace Test:
|
||||||
|
|
||||||
|
```
|
||||||
|
$ ./fix-metadata-values.py -i /tmp/2019-05-27-fix-2472-Authors.csv -db dspace -u dspace -p 'fuuu' -f dc.contributor.author -m 3 -t corrections -d
|
||||||
|
```
|
||||||
|
|
||||||
|
- Then start a full Discovery re-indexing on each server:
|
||||||
|
|
||||||
|
```
|
||||||
|
$ export JAVA_OPTS="-Dfile.encoding=UTF-8 -Xmx1024m"
|
||||||
|
$ time schedtool -B -e ionice -c2 -n7 nice -n19 dspace index-discovery -b
|
||||||
|
```
|
||||||
|
|
||||||
|
- Export new list of all authors from CGSpace database to send to Peter:
|
||||||
|
|
||||||
|
```
|
||||||
|
dspace=# \copy (select distinct text_value, count(*) as count from metadatavalue where metadata_field_id = (select metadata_field_id from metadatafieldregistry where element = 'contributor' and qualifier = 'author') AND resource_type_id = 2 group by text_value order by count desc) to /tmp/2019-05-27-all-authors.csv with csv header;
|
||||||
|
COPY 64871
|
||||||
|
```
|
||||||
|
|
||||||
|
- Run all system updates on DSpace Test (linode19) and reboot it
|
||||||
|
|
||||||
<!-- vim: set sw=2 ts=2: -->
|
<!-- vim: set sw=2 ts=2: -->
|
||||||
|
@ -38,7 +38,7 @@ $ ./delete-metadata-values.py -i /tmp/2019-02-21-delete-1-region.csv -db dspace
|
|||||||
<meta property="og:type" content="article" />
|
<meta property="og:type" content="article" />
|
||||||
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2019-04/" />
|
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2019-04/" />
|
||||||
<meta property="article:published_time" content="2019-04-01T09:00:43+03:00"/>
|
<meta property="article:published_time" content="2019-04-01T09:00:43+03:00"/>
|
||||||
<meta property="article:modified_time" content="2019-04-30T11:39:09+03:00"/>
|
<meta property="article:modified_time" content="2019-05-27T12:04:14+03:00"/>
|
||||||
|
|
||||||
<meta name="twitter:card" content="summary"/>
|
<meta name="twitter:card" content="summary"/>
|
||||||
<meta name="twitter:title" content="April, 2019"/>
|
<meta name="twitter:title" content="April, 2019"/>
|
||||||
@ -81,9 +81,9 @@ $ ./delete-metadata-values.py -i /tmp/2019-02-21-delete-1-region.csv -db dspace
|
|||||||
"@type": "BlogPosting",
|
"@type": "BlogPosting",
|
||||||
"headline": "April, 2019",
|
"headline": "April, 2019",
|
||||||
"url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-04\/",
|
"url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-04\/",
|
||||||
"wordCount": "6800",
|
"wordCount": "6799",
|
||||||
"datePublished": "2019-04-01T09:00:43\x2b03:00",
|
"datePublished": "2019-04-01T09:00:43\x2b03:00",
|
||||||
"dateModified": "2019-04-30T11:39:09\x2b03:00",
|
"dateModified": "2019-05-27T12:04:14\x2b03:00",
|
||||||
"author": {
|
"author": {
|
||||||
"@type": "Person",
|
"@type": "Person",
|
||||||
"name": "Alan Orth"
|
"name": "Alan Orth"
|
||||||
@ -1339,7 +1339,7 @@ item_id | submitter_id | in_archive | withdrawn | last_modified | o
|
|||||||
<ul>
|
<ul>
|
||||||
<li><p>Export a list of authors for Peter to look through:</p>
|
<li><p>Export a list of authors for Peter to look through:</p>
|
||||||
|
|
||||||
<pre><code>dspacetest=# # \copy (select distinct text_value, count(*) as count from metadatavalue where metadata_field_id = (select metadata_field_id from metadatafieldregistry where element = 'contributor' and qualifier = 'author') AND resource_type_id = 2 group by text_value order by count desc) to /tmp/2019-04-26-all-authors.csv with csv header;
|
<pre><code>dspace=# \copy (select distinct text_value, count(*) as count from metadatavalue where metadata_field_id = (select metadata_field_id from metadatafieldregistry where element = 'contributor' and qualifier = 'author') AND resource_type_id = 2 group by text_value order by count desc) to /tmp/2019-04-26-all-authors.csv with csv header;
|
||||||
COPY 65752
|
COPY 65752
|
||||||
</code></pre></li>
|
</code></pre></li>
|
||||||
</ul>
|
</ul>
|
||||||
|
@ -28,7 +28,7 @@ But after this I tried to delete the item from the XMLUI and it is still present
|
|||||||
<meta property="og:type" content="article" />
|
<meta property="og:type" content="article" />
|
||||||
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2019-05/" />
|
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2019-05/" />
|
||||||
<meta property="article:published_time" content="2019-05-01T07:37:43+03:00"/>
|
<meta property="article:published_time" content="2019-05-01T07:37:43+03:00"/>
|
||||||
<meta property="article:modified_time" content="2019-05-24T12:27:22+03:00"/>
|
<meta property="article:modified_time" content="2019-05-25T14:17:27+03:00"/>
|
||||||
|
|
||||||
<meta name="twitter:card" content="summary"/>
|
<meta name="twitter:card" content="summary"/>
|
||||||
<meta name="twitter:title" content="May, 2019"/>
|
<meta name="twitter:title" content="May, 2019"/>
|
||||||
@ -61,9 +61,9 @@ But after this I tried to delete the item from the XMLUI and it is still present
|
|||||||
"@type": "BlogPosting",
|
"@type": "BlogPosting",
|
||||||
"headline": "May, 2019",
|
"headline": "May, 2019",
|
||||||
"url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-05\/",
|
"url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-05\/",
|
||||||
"wordCount": "2874",
|
"wordCount": "3023",
|
||||||
"datePublished": "2019-05-01T07:37:43\x2b03:00",
|
"datePublished": "2019-05-01T07:37:43\x2b03:00",
|
||||||
"dateModified": "2019-05-24T12:27:22\x2b03:00",
|
"dateModified": "2019-05-25T14:17:27\x2b03:00",
|
||||||
"author": {
|
"author": {
|
||||||
"@type": "Person",
|
"@type": "Person",
|
||||||
"name": "Alan Orth"
|
"name": "Alan Orth"
|
||||||
@ -649,6 +649,33 @@ $ ./delete-metadata-values.py -i /tmp/2019-05-17-delete-14-Investors.csv -db dsp
|
|||||||
</code></pre></li>
|
</code></pre></li>
|
||||||
</ul>
|
</ul>
|
||||||
|
|
||||||
|
<h2 id="2019-05-27">2019-05-27</h2>
|
||||||
|
|
||||||
|
<ul>
|
||||||
|
<li><p>Peter sent me over two thousand corrections for the authors on CGSpace that I had dumped last month</p>
|
||||||
|
|
||||||
|
<ul>
|
||||||
|
<li><p>I proofed them for whitespace and invalid special characters in OpenRefine and then applied them on CGSpace and DSpace Test:</p>
|
||||||
|
|
||||||
|
<pre><code>$ ./fix-metadata-values.py -i /tmp/2019-05-27-fix-2472-Authors.csv -db dspace -u dspace -p 'fuuu' -f dc.contributor.author -m 3 -t corrections -d
|
||||||
|
</code></pre></li>
|
||||||
|
</ul></li>
|
||||||
|
|
||||||
|
<li><p>Then start a full Discovery re-indexing on each server:</p>
|
||||||
|
|
||||||
|
<pre><code>$ export JAVA_OPTS="-Dfile.encoding=UTF-8 -Xmx1024m"
|
||||||
|
$ time schedtool -B -e ionice -c2 -n7 nice -n19 dspace index-discovery -b
|
||||||
|
</code></pre></li>
|
||||||
|
|
||||||
|
<li><p>Export new list of all authors from CGSpace database to send to Peter:</p>
|
||||||
|
|
||||||
|
<pre><code>dspace=# \copy (select distinct text_value, count(*) as count from metadatavalue where metadata_field_id = (select metadata_field_id from metadatafieldregistry where element = 'contributor' and qualifier = 'author') AND resource_type_id = 2 group by text_value order by count desc) to /tmp/2019-05-27-all-authors.csv with csv header;
|
||||||
|
COPY 64871
|
||||||
|
</code></pre></li>
|
||||||
|
|
||||||
|
<li><p>Run all system updates on DSpace Test (linode19) and reboot it</p></li>
|
||||||
|
</ul>
|
||||||
|
|
||||||
<!-- vim: set sw=2 ts=2: -->
|
<!-- vim: set sw=2 ts=2: -->
|
||||||
|
|
||||||
|
|
||||||
|
@ -4,36 +4,36 @@
|
|||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/</loc>
|
||||||
<lastmod>2019-05-24T12:27:22+03:00</lastmod>
|
<lastmod>2019-05-27T12:04:14+03:00</lastmod>
|
||||||
<priority>0</priority>
|
<priority>0</priority>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/2019-05/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/2019-05/</loc>
|
||||||
<lastmod>2019-05-24T12:27:22+03:00</lastmod>
|
<lastmod>2019-05-25T14:17:27+03:00</lastmod>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/tags/notes/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/tags/notes/</loc>
|
||||||
<lastmod>2019-05-24T12:27:22+03:00</lastmod>
|
<lastmod>2019-05-27T12:04:14+03:00</lastmod>
|
||||||
<priority>0</priority>
|
<priority>0</priority>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/posts/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/posts/</loc>
|
||||||
<lastmod>2019-05-24T12:27:22+03:00</lastmod>
|
<lastmod>2019-05-27T12:04:14+03:00</lastmod>
|
||||||
<priority>0</priority>
|
<priority>0</priority>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/tags/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/tags/</loc>
|
||||||
<lastmod>2019-05-24T12:27:22+03:00</lastmod>
|
<lastmod>2019-05-27T12:04:14+03:00</lastmod>
|
||||||
<priority>0</priority>
|
<priority>0</priority>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/2019-04/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/2019-04/</loc>
|
||||||
<lastmod>2019-04-30T11:39:09+03:00</lastmod>
|
<lastmod>2019-05-27T12:04:14+03:00</lastmod>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
|
Loading…
Reference in New Issue
Block a user