diff --git a/content/posts/2019-07.md b/content/posts/2019-07.md index 19bed3af7..f7c98a6d1 100644 --- a/content/posts/2019-07.md +++ b/content/posts/2019-07.md @@ -392,6 +392,7 @@ value.replace(/\s+\|\|/,"||").replace(/\|\|\s+/,"||") - I turned the Pandas script into a proper Python package called [csv-metadata-quality](https://git.sr.ht/~alanorth/csv-metadata-quality) - It supports CSV and Excel files - It fixes whitespace errors and erroneous multi-value separators ("|") and validates ISSN, ISBNs, and dates + - Also I added a bunch of other checks/fixes for unnecessary and "suspicious" Unicode characters - Inform Bioversity that there is an error in their CSV, seemingly caused by quotes in the citation field diff --git a/docs/2019-07/index.html b/docs/2019-07/index.html index 2d5847171..7d1277e12 100644 --- a/docs/2019-07/index.html +++ b/docs/2019-07/index.html @@ -21,7 +21,7 @@ Abenet had another similar issue a few days ago when trying to find the stats fo - + @@ -47,9 +47,9 @@ Abenet had another similar issue a few days ago when trying to find the stats fo "@type": "BlogPosting", "headline": "July, 2019", "url": "https:\/\/alanorth.github.io\/cgspace-notes\/2019-07\/", - "wordCount": "2243", + "wordCount": "2257", "datePublished": "2019-07-01T12:13:51\x2b03:00", - "dateModified": "2019-07-26T18:49:38\x2b03:00", + "dateModified": "2019-07-29T12:51:19\x2b03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -588,6 +588,7 @@ issn.validate('1020-3362')
  • Inform Bioversity that there is an error in their CSV, seemingly caused by quotes in the citation field
  • diff --git a/docs/sitemap.xml b/docs/sitemap.xml index 2abec0c7b..eb9ff6e94 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,30 +4,30 @@ https://alanorth.github.io/cgspace-notes/ - 2019-07-26T18:49:38+03:00 + 2019-07-29T12:51:19+03:00 0 https://alanorth.github.io/cgspace-notes/2019-07/ - 2019-07-26T18:49:38+03:00 + 2019-07-29T12:51:19+03:00 https://alanorth.github.io/cgspace-notes/tags/notes/ - 2019-07-26T18:49:38+03:00 + 2019-07-29T12:51:19+03:00 0 https://alanorth.github.io/cgspace-notes/posts/ - 2019-07-26T18:49:38+03:00 + 2019-07-29T12:51:19+03:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2019-07-26T18:49:38+03:00 + 2019-07-29T12:51:19+03:00 0