From 2304f65bf8403f0f8359eb792d7921f54ac8d8fa Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Sat, 12 Aug 2017 08:40:59 +0300 Subject: [PATCH] Update notes for 2017-08-11 --- content/post/2017-08.md | 1 + public/2017-08/index.html | 7 ++++--- public/sitemap.xml | 10 +++++----- 3 files changed, 10 insertions(+), 8 deletions(-) diff --git a/content/post/2017-08.md b/content/post/2017-08.md index 606606684..befd4c551 100644 --- a/content/post/2017-08.md +++ b/content/post/2017-08.md @@ -89,3 +89,4 @@ dspace#= \copy (select distinct text_value, count(*) from metadatavalue where me - I learned this on a recent discussion on the DSpace wiki - I need to either look into setting up a database pool through JNDI or increase the PostgreSQL max connections - Also, I need to find out where the load is coming from (rest?) and possibly block bots from accessing dynamic pages like Browse and Discover instead of just sending an X-Robots-Tag HTTP header +- I noticed that Google has bitstreams from the `rest` interface in the search index. I need to ask on the dspace-tech mailing list to see what other people are doing about this, and maybe start issuing an `X-Robots-Tag: none` there! diff --git a/public/2017-08/index.html b/public/2017-08/index.html index 704a4714e..821d7b49a 100644 --- a/public/2017-08/index.html +++ b/public/2017-08/index.html @@ -37,7 +37,7 @@ Then I cleaned up the author authorities and HTML characters in OpenRefine and s - + @@ -85,9 +85,9 @@ Then I cleaned up the author authorities and HTML characters in OpenRefine and s "@type": "BlogPosting", "headline": "August, 2017", "url": "https://alanorth.github.io/cgspace-notes/2017-08/", - "wordCount": "1148", + "wordCount": "1188", "datePublished": "2017-08-01T11:51:52+03:00", - "dateModified": "2017-08-12T00:02:42+03:00", + "dateModified": "2017-08-12T00:04:09+03:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -261,6 +261,7 @@ Then I cleaned up the author authorities and HTML characters in OpenRefine and s
  • I learned this from a recent discussion on the DSpace wiki
  • I need to either look into setting up a database pool through JNDI or increase the PostgreSQL max connections
  • Also, I need to find out where the load is coming from (rest?) and possibly block bots from accessing dynamic pages like Browse and Discover instead of just sending an X-Robots-Tag HTTP header
  • +
  • I noticed that Google has bitstreams from the `rest` interface in the search index. I need to ask on the dspace-tech mailing list to see what other people are doing about this, and maybe start issuing an `X-Robots-Tag: none` there!
  • diff --git a/public/sitemap.xml b/public/sitemap.xml index 10b0d3467..b99b82424 100644 --- a/public/sitemap.xml +++ b/public/sitemap.xml @@ -4,7 +4,7 @@ https://alanorth.github.io/cgspace-notes/2017-08/ - 2017-08-12T00:02:42+03:00 + 2017-08-12T00:04:09+03:00 @@ -114,7 +114,7 @@ https://alanorth.github.io/cgspace-notes/ - 2017-08-12T00:02:42+03:00 + 2017-08-12T00:04:09+03:00 0 @@ -125,19 +125,19 @@ https://alanorth.github.io/cgspace-notes/tags/notes/ - 2017-08-12T00:02:42+03:00 + 2017-08-12T00:04:09+03:00 0 https://alanorth.github.io/cgspace-notes/post/ - 2017-08-12T00:02:42+03:00 + 2017-08-12T00:04:09+03:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2017-08-12T00:02:42+03:00 + 2017-08-12T00:04:09+03:00 0