diff --git a/content/posts/2023-03.md b/content/posts/2023-03.md
index 8cdcc0fc9..5a6a9cef4 100644
--- a/content/posts/2023-03.md
+++ b/content/posts/2023-03.md
@@ -492,4 +492,29 @@ RL: performed 0 reads and 16 write i/o operations
- I added a Flyway SQL migration for the PNG bitstream format registry changes on DSpace 7.6
+## 2023-03-26
+
+- There seems to be a slightly high load on CGSpace
+ - I don't see any locks in PostgreSQL, but there's some new bot I have never heard of:
+
+```console
+92.119.18.13 - - [26/Mar/2023:18:41:47 +0200] "GET /handle/10568/16500/discover?filtertype_0=impactarea&filter_relational_operator_0=equals&filter_0=Climate+adaptation+and+mitigation&filtertype=sdg&filter_relational_operator=equals&filter=SDG+11+-+Sustainable+cities+and+communities HTTP/2.0" 200 7856 "-" "colly - https://github.com/gocolly/colly"
+```
+
+- In the last week I see a handful of IPs making requests with this agent:
+
+```console
+# zcat --force /var/log/nginx/access.log /var/log/nginx/access.log.1 /var/log/nginx/access.log.{2,3,4,5,6,7}.gz | grep gocolly | awk '{print $1}' | sort | uniq -c | sort -h
+ 2 194.233.95.37
+ 4304 92.119.18.142
+ 9496 5.180.208.152
+ 27477 92.119.18.13
+```
+
+- Most of these come from Packethub S.A. / ASN 62240 (CLOUVIDER Clouvider - Global ASN, GB)
+- Oh, I've apparently seen this user agent before, as it is in our ILRI spider user agent overrides
+- I exported CGSpace to check for missing Initiative collection mappings
+- Start a harvest on AReS
+
diff --git a/docs/2023-03/index.html b/docs/2023-03/index.html
index 8760c6936..4af119410 100644
--- a/docs/2023-03/index.html
+++ b/docs/2023-03/index.html
@@ -16,7 +16,7 @@ I finally got through with porting the input form from DSpace 6 to DSpace 7
-
+
@@ -38,9 +38,9 @@ I finally got through with porting the input form from DSpace 6 to DSpace 7
"@type": "BlogPosting",
"headline": "March, 2023",
"url": "https://alanorth.github.io/cgspace-notes/2023-03/",
- "wordCount": "3464",
+ "wordCount": "3600",
"datePublished": "2023-03-01T07:58:36+03:00",
- "dateModified": "2023-03-22T08:28:33+03:00",
+ "dateModified": "2023-03-24T13:19:13+03:00",
"author": {
"@type": "Person",
"name": "Alan Orth"
@@ -663,6 +663,30 @@ RL: performed 0 reads and 16 write i/o operations
- I added a Flyway SQL migration for the PNG bitstream format registry changes on DSpace 7.6
+2023-03-26
+
+- There seems to be a slightly high load on CGSpace
+
+- I don’t see any locks in PostgreSQL, but there’s some new bot I have never heard of:
+
+
+
+92.119.18.13 - - [26/Mar/2023:18:41:47 +0200] "GET /handle/10568/16500/discover?filtertype_0=impactarea&filter_relational_operator_0=equals&filter_0=Climate+adaptation+and+mitigation&filtertype=sdg&filter_relational_operator=equals&filter=SDG+11+-+Sustainable+cities+and+communities HTTP/2.0" 200 7856 "-" "colly - https://github.com/gocolly/colly"
+
+- In the last week I see a handful of IPs making requests with this agent:
+
+# zcat --force /var/log/nginx/access.log /var/log/nginx/access.log.1 /var/log/nginx/access.log.{2,3,4,5,6,7}.gz | grep gocolly | awk '{print $1}' | sort | uniq -c | sort -h
+ 2 194.233.95.37
+ 4304 92.119.18.142
+ 9496 5.180.208.152
+ 27477 92.119.18.13
+
+- Most of these come from Packethub S.A. / ASN 62240 (CLOUVIDER Clouvider - Global ASN, GB)
+- Oh, I’ve apparently seen this user agent before, as it is in our ILRI spider user agent overrides
+- I exported CGSpace to check for missing Initiative collection mappings
+- Start a harvest on AReS
+
diff --git a/docs/categories/index.html b/docs/categories/index.html
index 93e653a55..e8519d906 100644
--- a/docs/categories/index.html
+++ b/docs/categories/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/categories/notes/index.html b/docs/categories/notes/index.html
index 2f9550a47..fe08644da 100644
--- a/docs/categories/notes/index.html
+++ b/docs/categories/notes/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/categories/notes/page/2/index.html b/docs/categories/notes/page/2/index.html
index 96706fbb4..88882c86d 100644
--- a/docs/categories/notes/page/2/index.html
+++ b/docs/categories/notes/page/2/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/categories/notes/page/3/index.html b/docs/categories/notes/page/3/index.html
index a950f82bf..05ebcc00b 100644
--- a/docs/categories/notes/page/3/index.html
+++ b/docs/categories/notes/page/3/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/categories/notes/page/4/index.html b/docs/categories/notes/page/4/index.html
index 8570a4d03..9e46d5625 100644
--- a/docs/categories/notes/page/4/index.html
+++ b/docs/categories/notes/page/4/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/categories/notes/page/5/index.html b/docs/categories/notes/page/5/index.html
index 22b69838d..32ebc43bf 100644
--- a/docs/categories/notes/page/5/index.html
+++ b/docs/categories/notes/page/5/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/categories/notes/page/6/index.html b/docs/categories/notes/page/6/index.html
index d58da095c..dea2c31fa 100644
--- a/docs/categories/notes/page/6/index.html
+++ b/docs/categories/notes/page/6/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/categories/notes/page/7/index.html b/docs/categories/notes/page/7/index.html
index 8c21c704d..ae79fb496 100644
--- a/docs/categories/notes/page/7/index.html
+++ b/docs/categories/notes/page/7/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/index.html b/docs/index.html
index 646964c48..1e1f8c7ab 100644
--- a/docs/index.html
+++ b/docs/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/10/index.html b/docs/page/10/index.html
index 0beccdcae..128886604 100644
--- a/docs/page/10/index.html
+++ b/docs/page/10/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/2/index.html b/docs/page/2/index.html
index a3b745611..1cf13fd6f 100644
--- a/docs/page/2/index.html
+++ b/docs/page/2/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/3/index.html b/docs/page/3/index.html
index fcf4af40f..bdf0fcac1 100644
--- a/docs/page/3/index.html
+++ b/docs/page/3/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/4/index.html b/docs/page/4/index.html
index bba2fab9a..f3f871bdf 100644
--- a/docs/page/4/index.html
+++ b/docs/page/4/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/5/index.html b/docs/page/5/index.html
index 0c361df6e..fece6c27b 100644
--- a/docs/page/5/index.html
+++ b/docs/page/5/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/6/index.html b/docs/page/6/index.html
index 362433a15..5fa5309eb 100644
--- a/docs/page/6/index.html
+++ b/docs/page/6/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/7/index.html b/docs/page/7/index.html
index 3c346ad8f..62a7c51fd 100644
--- a/docs/page/7/index.html
+++ b/docs/page/7/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/8/index.html b/docs/page/8/index.html
index fa2838a96..c20a0a7f6 100644
--- a/docs/page/8/index.html
+++ b/docs/page/8/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/page/9/index.html b/docs/page/9/index.html
index d79c6d92f..d021b762e 100644
--- a/docs/page/9/index.html
+++ b/docs/page/9/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/index.html b/docs/posts/index.html
index d231de0d4..fc680e952 100644
--- a/docs/posts/index.html
+++ b/docs/posts/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/10/index.html b/docs/posts/page/10/index.html
index a29bd9644..ccee9ae96 100644
--- a/docs/posts/page/10/index.html
+++ b/docs/posts/page/10/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/2/index.html b/docs/posts/page/2/index.html
index ff006163c..b8495f933 100644
--- a/docs/posts/page/2/index.html
+++ b/docs/posts/page/2/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/3/index.html b/docs/posts/page/3/index.html
index 69a58f6fa..e8cc13af4 100644
--- a/docs/posts/page/3/index.html
+++ b/docs/posts/page/3/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/4/index.html b/docs/posts/page/4/index.html
index 0bf5f2071..ee100a6f5 100644
--- a/docs/posts/page/4/index.html
+++ b/docs/posts/page/4/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/5/index.html b/docs/posts/page/5/index.html
index e6d0f9d43..4ce4be95e 100644
--- a/docs/posts/page/5/index.html
+++ b/docs/posts/page/5/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/6/index.html b/docs/posts/page/6/index.html
index bda2f205d..2378351e4 100644
--- a/docs/posts/page/6/index.html
+++ b/docs/posts/page/6/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/7/index.html b/docs/posts/page/7/index.html
index 6b43b77eb..86201e88d 100644
--- a/docs/posts/page/7/index.html
+++ b/docs/posts/page/7/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/8/index.html b/docs/posts/page/8/index.html
index b65029752..82bbe8521 100644
--- a/docs/posts/page/8/index.html
+++ b/docs/posts/page/8/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/posts/page/9/index.html b/docs/posts/page/9/index.html
index 1f0d91b62..00cc9c5fc 100644
--- a/docs/posts/page/9/index.html
+++ b/docs/posts/page/9/index.html
@@ -10,7 +10,7 @@
-
+
diff --git a/docs/sitemap.xml b/docs/sitemap.xml
index d171f8983..1e1866172 100644
--- a/docs/sitemap.xml
+++ b/docs/sitemap.xml
@@ -3,19 +3,19 @@
xmlns:xhtml="http://www.w3.org/1999/xhtml">
https://alanorth.github.io/cgspace-notes/categories/
- 2023-03-22T08:28:33+03:00
+ 2023-03-24T13:19:13+03:00
https://alanorth.github.io/cgspace-notes/
- 2023-03-22T08:28:33+03:00
+ 2023-03-24T13:19:13+03:00
https://alanorth.github.io/cgspace-notes/2023-03/
- 2023-03-22T08:28:33+03:00
+ 2023-03-24T13:19:13+03:00
https://alanorth.github.io/cgspace-notes/categories/notes/
- 2023-03-22T08:28:33+03:00
+ 2023-03-24T13:19:13+03:00
https://alanorth.github.io/cgspace-notes/posts/
- 2023-03-22T08:28:33+03:00
+ 2023-03-24T13:19:13+03:00
https://alanorth.github.io/cgspace-notes/2023-02/
2023-03-01T08:30:25+03:00