mirror of
https://github.com/alanorth/cgspace-notes.git
synced 2024-11-10 17:15:46 +01:00
Update notes for 2019-09-21
This commit is contained in:
parent
ddf3b1346b
commit
01348c687d
@ -303,6 +303,6 @@ $ dspace import -a me@cgiar.org -m 2019-09-20-bioversity2.map -s /home/aorth/Bio
|
|||||||
- langid seems to be the best considering the above experiences
|
- langid seems to be the best considering the above experiences
|
||||||
- I added very experimental language detection to the [csv-metadata-quality](https://github.com/ilri/csv-metadata-quality) module
|
- I added very experimental language detection to the [csv-metadata-quality](https://github.com/ilri/csv-metadata-quality) module
|
||||||
- It works by checking the predicted language of the `dc.title` field against the item's `dc.language.iso` field
|
- It works by checking the predicted language of the `dc.title` field against the item's `dc.language.iso` field
|
||||||
- I tested it on the Bioversity migration data set and actually managed to correct about eight incorrect language fields in their records!
|
- I tested it on the Bioversity migration data set and it actually helped me correct eleven language fields in their records!
|
||||||
|
|
||||||
<!-- vim: set sw=2 ts=2: -->
|
<!-- vim: set sw=2 ts=2: -->
|
||||||
|
@ -40,7 +40,7 @@ Here are the top ten IPs in the nginx XMLUI and REST/OAI logs this morning:
|
|||||||
<meta property="og:type" content="article" />
|
<meta property="og:type" content="article" />
|
||||||
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2019-09/" />
|
<meta property="og:url" content="https://alanorth.github.io/cgspace-notes/2019-09/" />
|
||||||
<meta property="article:published_time" content="2019-09-01T10:17:51+03:00" />
|
<meta property="article:published_time" content="2019-09-01T10:17:51+03:00" />
|
||||||
<meta property="article:modified_time" content="2019-09-21T02:25:19+03:00" />
|
<meta property="article:modified_time" content="2019-09-22T01:36:39+03:00" />
|
||||||
|
|
||||||
<meta name="twitter:card" content="summary"/>
|
<meta name="twitter:card" content="summary"/>
|
||||||
<meta name="twitter:title" content="September, 2019"/>
|
<meta name="twitter:title" content="September, 2019"/>
|
||||||
@ -85,9 +85,9 @@ Here are the top ten IPs in the nginx XMLUI and REST/OAI logs this morning:
|
|||||||
"@type": "BlogPosting",
|
"@type": "BlogPosting",
|
||||||
"headline": "September, 2019",
|
"headline": "September, 2019",
|
||||||
"url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-09\/",
|
"url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-09\/",
|
||||||
"wordCount": "2325",
|
"wordCount": "2324",
|
||||||
"datePublished": "2019-09-01T10:17:51\x2b03:00",
|
"datePublished": "2019-09-01T10:17:51\x2b03:00",
|
||||||
"dateModified": "2019-09-21T02:25:19\x2b03:00",
|
"dateModified": "2019-09-22T01:36:39\x2b03:00",
|
||||||
"author": {
|
"author": {
|
||||||
"@type": "Person",
|
"@type": "Person",
|
||||||
"name": "Alan Orth"
|
"name": "Alan Orth"
|
||||||
@ -531,7 +531,7 @@ $ dspace import -a me@cgiar.org -m 2019-09-20-bioversity2.map -s /home/aorth/Bio
|
|||||||
|
|
||||||
<ul>
|
<ul>
|
||||||
<li>It works by checking the predicted language of the <code>dc.title</code> field against the item’s <code>dc.language.iso</code> field</li>
|
<li>It works by checking the predicted language of the <code>dc.title</code> field against the item’s <code>dc.language.iso</code> field</li>
|
||||||
<li>I tested it on the Bioversity migration data set and actually managed to correct about eight incorrect language fields in their records!</li>
|
<li>I tested it on the Bioversity migration data set and it actually helped me correct eleven language fields in their records!</li>
|
||||||
</ul></li>
|
</ul></li>
|
||||||
</ul>
|
</ul>
|
||||||
|
|
||||||
|
@ -4,27 +4,27 @@
|
|||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/</loc>
|
||||||
<lastmod>2019-09-21T02:25:19+03:00</lastmod>
|
<lastmod>2019-09-22T01:36:39+03:00</lastmod>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/tags/notes/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/tags/notes/</loc>
|
||||||
<lastmod>2019-09-21T02:25:19+03:00</lastmod>
|
<lastmod>2019-09-22T01:36:39+03:00</lastmod>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/posts/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/posts/</loc>
|
||||||
<lastmod>2019-09-21T02:25:19+03:00</lastmod>
|
<lastmod>2019-09-22T01:36:39+03:00</lastmod>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/2019-09/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/2019-09/</loc>
|
||||||
<lastmod>2019-09-21T02:25:19+03:00</lastmod>
|
<lastmod>2019-09-22T01:36:39+03:00</lastmod>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
<loc>https://alanorth.github.io/cgspace-notes/tags/</loc>
|
<loc>https://alanorth.github.io/cgspace-notes/tags/</loc>
|
||||||
<lastmod>2019-09-21T02:25:19+03:00</lastmod>
|
<lastmod>2019-09-22T01:36:39+03:00</lastmod>
|
||||||
</url>
|
</url>
|
||||||
|
|
||||||
<url>
|
<url>
|
||||||
|
Loading…
Reference in New Issue
Block a user