From b51bbdb91c9d50a69b8df24b626b340eb58b4f0d Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Sun, 31 Dec 2017 06:47:41 -0800 Subject: [PATCH] Add notes for 2017-12-30 --- content/post/2017-12.md | 31 +++++++++++++++++++++++++++++ public/2017-12/index.html | 41 ++++++++++++++++++++++++++++++++++++--- public/sitemap.xml | 10 +++++----- 3 files changed, 74 insertions(+), 8 deletions(-) diff --git a/content/post/2017-12.md b/content/post/2017-12.md index 759d2f2db..a2c1c433d 100644 --- a/content/post/2017-12.md +++ b/content/post/2017-12.md @@ -699,3 +699,34 @@ DELETE 20 ``` - I need to figure out why we have records with language `in` because that's not a language! + +## 2017-12-30 + +- Linode alerted that CGSpace was using 259% CPU from 4 to 6 AM +- Uptime Robot noticed that the server went down for 1 minute a few hours later, around 9AM +- Here's the XMLUI logs: + +``` +# cat /var/log/nginx/access.log /var/log/nginx/access.log.1 /var/log/nginx/library-access.log /var/log/nginx/library-access.log.1 | grep -E "30/Dec/2017" | awk '{print $1}' | sort -n | uniq -c | sort -h | tail + 637 207.46.13.106 + 641 157.55.39.186 + 715 68.180.229.254 + 924 104.196.152.243 + 1012 66.249.64.95 + 1060 216.244.66.245 + 1120 54.175.208.220 + 1287 66.249.64.93 + 1586 66.249.64.78 + 3653 66.249.64.91 +``` + +- Looks pretty normal actually, but I don't know who 54.175.208.220 is +- They identify as "com.plumanalytics", which Google says is associated with Elsevier +- They only seem to have used one Tomcat session so that's good, I guess I don't need to add them to the Tomcat Crawler Session Manager valve: + +``` +$ grep 54.175.208.220 dspace.log.2017-12-30 | grep -o -E 'session_id=[A-Z0-9]{32}' | sort -n | uniq | wc -l +1 +``` + +- 216.244.66.245 seems to be moz.com's DotBot diff --git a/public/2017-12/index.html b/public/2017-12/index.html index e4b557d96..9f2b52158 100644 --- a/public/2017-12/index.html +++ b/public/2017-12/index.html @@ -23,7 +23,7 @@ The list of connections to XMLUI 
and REST API for today: - + @@ -56,9 +56,9 @@ The list of connections to XMLUI and REST API for today: "@type": "BlogPosting", "headline": "December, 2017", "url": "https://alanorth.github.io/cgspace-notes/2017-12/", - "wordCount": "3897", + "wordCount": "4050", "datePublished": "2017-12-01T13:53:54+03:00", - "dateModified": "2017-12-25T22:26:01+02:00", + "dateModified": "2017-12-29T18:45:09+02:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -904,6 +904,41 @@ DELETE 20
  • I need to figure out why we have records with language `in` because that’s not a language!
  • +

    2017-12-30

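    +  • Linode alerted that CGSpace was using 259% CPU from 4 to 6 AM
    +  • Uptime Robot noticed that the server went down for 1 minute a few hours later, around 9AM
    +  • Here’s the XMLUI logs:
    +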
    # cat /var/log/nginx/access.log /var/log/nginx/access.log.1 /var/log/nginx/library-access.log /var/log/nginx/library-access.log.1 | grep -E "30/Dec/2017" | awk '{print $1}' | sort -n | uniq -c | sort -h | tail
    +    637 207.46.13.106
    +    641 157.55.39.186
    +    715 68.180.229.254
    +    924 104.196.152.243
    +   1012 66.249.64.95
    +   1060 216.244.66.245
    +   1120 54.175.208.220
    +   1287 66.249.64.93
    +   1586 66.249.64.78
    +   3653 66.249.64.91
    +
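    +  • Looks pretty normal actually, but I don’t know who 54.175.208.220 is
    +  • They identify as “com.plumanalytics”, which Google says is associated with Elsevier
    +  • They only seem to have used one Tomcat session so that’s good, I guess I don’t need to add them to the Tomcat Crawler Session Manager valve:
    +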
    $ grep 54.175.208.220 dspace.log.2017-12-30 | grep -o -E 'session_id=[A-Z0-9]{32}' | sort -n | uniq | wc -l          
    +1 
    +
    +
    +  • 216.244.66.245 seems to be moz.com’s DotBot
    +
diff --git a/public/sitemap.xml b/public/sitemap.xml index 47e0d9015..99bf14330 100644 --- a/public/sitemap.xml +++ b/public/sitemap.xml @@ -4,7 +4,7 @@ https://alanorth.github.io/cgspace-notes/2017-12/ - 2017-12-25T22:26:01+02:00 + 2017-12-29T18:45:09+02:00 @@ -139,7 +139,7 @@ https://alanorth.github.io/cgspace-notes/ - 2017-12-25T22:26:01+02:00 + 2017-12-29T18:45:09+02:00 0 @@ -150,7 +150,7 @@ https://alanorth.github.io/cgspace-notes/tags/notes/ - 2017-12-25T22:26:01+02:00 + 2017-12-29T18:45:09+02:00 0 @@ -162,13 +162,13 @@ https://alanorth.github.io/cgspace-notes/post/ - 2017-12-25T22:26:01+02:00 + 2017-12-29T18:45:09+02:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2017-12-25T22:26:01+02:00 + 2017-12-29T18:45:09+02:00 0