diff --git a/content/posts/2020-08.md b/content/posts/2020-08.md
index 4ab970c88..37fd18e04 100644
--- a/content/posts/2020-08.md
+++ b/content/posts/2020-08.md
@@ -385,4 +385,17 @@ dspace=# SELECT count(text_value) FROM metadatavalue WHERE metadata_field_id = 2
- I noticed a bunch of user agents with "Crawl" in the Solr stats, which is strange because the DSpace spider agents file has had "crawl" for a long time (and it is case insensitive)
- In any case I will purge them and add them to the Tomcat Crawler Session Manager Valve so that at least their sessions get re-used
+## 2020-08-13
+
+- Linode keeps sending mails that the load and outgoing bandwidth are above the threshold
+ - I took a look briefly and found two IPs with the "Delphi 2009" user agent
+ - Then there is 88.99.115.53 which made 82,000 requests in 2020 so far with no user agent
+ - 64.62.202.73 has made 7,000 requests with this user agent `Mozilla/5.0 (compatible; +centuryb.o.t9[at]gmail.com)`
+ - I had added it to the Tomcat Crawler Session Manager Valve last week but never purged the hits from Solr
+ - 195.54.160.163 is making thousands of requests with user agents like this:
+
+`(CASE WHEN 2850=9474 THEN 2850 ELSE NULL END)`
+
+- I purged 150,000 hits from 2019 and 2020 from these user agents and hosts
+
diff --git a/docs/2020-08/index.html b/docs/2020-08/index.html
index 586c2a7af..d837597df 100644
--- a/docs/2020-08/index.html
+++ b/docs/2020-08/index.html
@@ -19,7 +19,7 @@ It is class based so I can easily add support for other vocabularies, and the te
-
+
@@ -43,9 +43,9 @@ It is class based so I can easily add support for other vocabularies, and the te
"@type": "BlogPosting",
"headline": "August, 2020",
"url": "https://alanorth.github.io/cgspace-notes/2020-08/",
- "wordCount": "2443",
+ "wordCount": "2554",
"datePublished": "2020-08-02T15:35:54+03:00",
- "dateModified": "2020-08-10T15:59:22+03:00",
+ "dateModified": "2020-08-11T11:35:05+03:00",
"author": {
"@type": "Person",
"name": "Alan Orth"
@@ -550,6 +550,22 @@ $ curl -s "http://localhost:8081/solr/statistics-2010/update?softCommit=tru
+
2020-08-13
+
+- Linode keeps sending mails that the load and outgoing bandwidth are above the threshold
+
+- I took a look briefly and found two IPs with the “Delphi 2009” user agent
+- Then there is 88.99.115.53 which made 82,000 requests in 2020 so far with no user agent
+- 64.62.202.73 has made 7,000 requests with this user agent
Mozilla/5.0 (compatible; +centuryb.o.t9[at]gmail.com)
+- I had added it to the Tomcat Crawler Session Manager Valve last week but never purged the hits from Solr
+- 195.54.160.163 is making thousands of requests with user agents like this:
+
+
+
+(CASE WHEN 2850=9474 THEN 2850 ELSE NULL END)
+
+- I purged 150,000 hits from 2019 and 2020 from these user agents and hosts
+
diff --git a/docs/categories/index.html b/docs/categories/index.html
index decf36a9f..00b82285d 100644
--- a/docs/categories/index.html
+++ b/docs/categories/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/categories/notes/index.html b/docs/categories/notes/index.html
index 1f1405fc4..ee7849083 100644
--- a/docs/categories/notes/index.html
+++ b/docs/categories/notes/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/categories/notes/page/2/index.html b/docs/categories/notes/page/2/index.html
index 2d24dd186..e456a8f40 100644
--- a/docs/categories/notes/page/2/index.html
+++ b/docs/categories/notes/page/2/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/categories/notes/page/3/index.html b/docs/categories/notes/page/3/index.html
index 0406ae1cd..86f2338be 100644
--- a/docs/categories/notes/page/3/index.html
+++ b/docs/categories/notes/page/3/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/categories/notes/page/4/index.html b/docs/categories/notes/page/4/index.html
index 4663436b0..7c40fc2ee 100644
--- a/docs/categories/notes/page/4/index.html
+++ b/docs/categories/notes/page/4/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/index.html b/docs/index.html
index ffbab9252..a56b81956 100644
--- a/docs/index.html
+++ b/docs/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/page/2/index.html b/docs/page/2/index.html
index 747f7a589..b95c9f969 100644
--- a/docs/page/2/index.html
+++ b/docs/page/2/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/page/3/index.html b/docs/page/3/index.html
index 020248691..a9d854ae8 100644
--- a/docs/page/3/index.html
+++ b/docs/page/3/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/page/4/index.html b/docs/page/4/index.html
index f3c9a2dbf..32628af38 100644
--- a/docs/page/4/index.html
+++ b/docs/page/4/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/page/5/index.html b/docs/page/5/index.html
index 2f8f257de..dca9a6059 100644
--- a/docs/page/5/index.html
+++ b/docs/page/5/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/page/6/index.html b/docs/page/6/index.html
index 8c2aa8256..6db475464 100644
--- a/docs/page/6/index.html
+++ b/docs/page/6/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/posts/index.html b/docs/posts/index.html
index d22281c61..b4a799a38 100644
--- a/docs/posts/index.html
+++ b/docs/posts/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/posts/page/2/index.html b/docs/posts/page/2/index.html
index 7612d58a1..23990c11d 100644
--- a/docs/posts/page/2/index.html
+++ b/docs/posts/page/2/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/posts/page/3/index.html b/docs/posts/page/3/index.html
index 724115d01..f450e0005 100644
--- a/docs/posts/page/3/index.html
+++ b/docs/posts/page/3/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/posts/page/4/index.html b/docs/posts/page/4/index.html
index c46c98a6d..c5e9ec501 100644
--- a/docs/posts/page/4/index.html
+++ b/docs/posts/page/4/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/posts/page/5/index.html b/docs/posts/page/5/index.html
index 8558a5d8c..74321b930 100644
--- a/docs/posts/page/5/index.html
+++ b/docs/posts/page/5/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/posts/page/6/index.html b/docs/posts/page/6/index.html
index 36ca45b93..1f238c2b2 100644
--- a/docs/posts/page/6/index.html
+++ b/docs/posts/page/6/index.html
@@ -9,7 +9,7 @@
-
+
diff --git a/docs/sitemap.xml b/docs/sitemap.xml
index ecfee172a..9f5a2d25b 100644
--- a/docs/sitemap.xml
+++ b/docs/sitemap.xml
@@ -4,27 +4,27 @@
https://alanorth.github.io/cgspace-notes/2020-08/
- 2020-08-10T15:59:22+03:00
+ 2020-08-11T11:35:05+03:00
https://alanorth.github.io/cgspace-notes/categories/
- 2020-08-10T15:59:22+03:00
+ 2020-08-11T11:35:05+03:00
https://alanorth.github.io/cgspace-notes/
- 2020-08-10T15:59:22+03:00
+ 2020-08-11T11:35:05+03:00
https://alanorth.github.io/cgspace-notes/categories/notes/
- 2020-08-10T15:59:22+03:00
+ 2020-08-11T11:35:05+03:00
https://alanorth.github.io/cgspace-notes/posts/
- 2020-08-10T15:59:22+03:00
+ 2020-08-11T11:35:05+03:00