diff --git a/content/posts/2018-07.md b/content/posts/2018-07.md index 31e975949..377d83f46 100644 --- a/content/posts/2018-07.md +++ b/content/posts/2018-07.md @@ -314,5 +314,15 @@ $ grep -c -E 'session_id=[A-Z0-9]{32}:ip_addr=95.108.181.88' dspace.log.2018-07- - So this bot is just like Baiduspider, and I need to add it to the nginx rate limiting - I'll also add it to Tomcat's Crawler Session Manager Valve to force the re-use of a common Tomcat session for all crawlers just in case +- Generate a list of all affiliations in CGSpace to send to Mohamed Salem to compare with the list on MEL (sorting the list by most occurrences): + +``` +dspace=# \copy (select distinct text_value, count(*) as count from metadatavalue where resource_type_id=2 and metadata_field_id=211 group by text_value order by count desc) to /tmp/affiliations.csv with csv header +COPY 4518 +dspace=# \q +$ csvcut -c 1 < /tmp/affiliations.csv > /tmp/affiliations-1.csv +``` + +- We also need to discuss standardizing our countries and comparing our ORCID iDs diff --git a/docs/2018-07/index.html b/docs/2018-07/index.html index 087330b7b..c59f017f5 100644 --- a/docs/2018-07/index.html +++ b/docs/2018-07/index.html @@ -30,7 +30,7 @@ There is insufficient memory for the Java Runtime Environment to continue. - + @@ -71,9 +71,9 @@ There is insufficient memory for the Java Runtime Environment to continue. "@type": "BlogPosting", "headline": "July, 2018", "url": "https://alanorth.github.io/cgspace-notes/2018-07/", - "wordCount": "2079", + "wordCount": "2156", "datePublished": "2018-07-01T12:56:54+03:00", - "dateModified": "2018-07-12T08:35:39+03:00", + "dateModified": "2018-07-12T09:00:08+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -493,6 +493,17 @@ org.apache.solr.client.solrj.SolrServerException: IOException occured when talki + +
dspace=# \copy (select distinct text_value, count(*) as count from metadatavalue where resource_type_id=2 and metadata_field_id=211 group by text_value order by count desc) to /tmp/affiliations.csv with csv header
+COPY 4518
+dspace=# \q
+$ csvcut -c 1 < /tmp/affiliations.csv > /tmp/affiliations-1.csv
+
+ + diff --git a/docs/robots.txt b/docs/robots.txt index 0f0d86454..2176f05a2 100644 --- a/docs/robots.txt +++ b/docs/robots.txt @@ -37,7 +37,7 @@ Disallow: /cgspace-notes/2015-12/ Disallow: /cgspace-notes/2015-11/ Disallow: /cgspace-notes/ Disallow: /cgspace-notes/categories/ -Disallow: /cgspace-notes/categories/notes/ Disallow: /cgspace-notes/tags/notes/ +Disallow: /cgspace-notes/categories/notes/ Disallow: /cgspace-notes/posts/ Disallow: /cgspace-notes/tags/ diff --git a/docs/sitemap.xml b/docs/sitemap.xml index abee96094..df1ae01f6 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,7 +4,7 @@ https://alanorth.github.io/cgspace-notes/2018-07/ - 2018-07-12T08:35:39+03:00 + 2018-07-12T09:00:08+03:00 @@ -174,7 +174,7 @@ https://alanorth.github.io/cgspace-notes/ - 2018-07-12T08:35:39+03:00 + 2018-07-12T09:00:08+03:00 0 @@ -183,27 +183,27 @@ 0 + + https://alanorth.github.io/cgspace-notes/tags/notes/ + 2018-07-12T09:00:08+03:00 + 0 + + https://alanorth.github.io/cgspace-notes/categories/notes/ 2018-03-09T22:10:33+02:00 0 - - https://alanorth.github.io/cgspace-notes/tags/notes/ - 2018-07-12T08:35:39+03:00 - 0 - - https://alanorth.github.io/cgspace-notes/posts/ - 2018-07-12T08:35:39+03:00 + 2018-07-12T09:00:08+03:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2018-07-12T08:35:39+03:00 + 2018-07-12T09:00:08+03:00 0