diff --git a/content/posts/2018-11.md b/content/posts/2018-11.md index 801643063..448f32fb2 100644 --- a/content/posts/2018-11.md +++ b/content/posts/2018-11.md @@ -240,6 +240,18 @@ $ ./add-dc-rights.py -i /tmp/marlo.csv -db dspace -u dspace -p 'fuuu' - The file `marlo.csv` was cleaned up and formatted in Open Refine - 165 of the items in their 2017 data are from CGSpace! -- I will add the data to CGSpace this week +- I will add the data to CGSpace this week (done!) +- Jesus, is Facebook *trying* to be annoying? + +``` +# zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "05/Nov/2018" | grep -c "2a03:2880:11ff:" +29889 +# grep -c -E 'session_id=[A-Z0-9]{32}:ip_addr=2a03:2880:11ff' dspace.log.2018-11-05 | sort | uniq +29156 +# zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "05/Nov/2018" | grep "2a03:2880:11ff:" | grep -c -E "(handle|bitstream)" +29896 +``` + +- 29,000 requests from Facebook, 29,000 Tomcat sessions, and none of the requests are to the dynamic pages I rate limited yesterday! diff --git a/docs/2018-11/index.html b/docs/2018-11/index.html index 2e21f5487..e370258f0 100644 --- a/docs/2018-11/index.html +++ b/docs/2018-11/index.html @@ -23,7 +23,7 @@ Today these are the top 10 IPs: " /> - + @@ -52,9 +52,9 @@ Today these are the top 10 IPs: "@type": "BlogPosting", "headline": "November, 2018", "url": "https://alanorth.github.io/cgspace-notes/2018-11/", - "wordCount": "1057", + "wordCount": "1129", "datePublished": "2018-11-01T16:41:30+02:00", - "dateModified": "2018-11-04T22:45:00+02:00", + "dateModified": "2018-11-05T17:45:39+02:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -377,7 +377,20 @@ Today these are the top 10 IPs: + +
# zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "05/Nov/2018" | grep -c "2a03:2880:11ff:"
+29889
+# grep -c -E 'session_id=[A-Z0-9]{32}:ip_addr=2a03:2880:11ff' dspace.log.2018-11-05 | sort | uniq
+29156
+# zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "05/Nov/2018" | grep "2a03:2880:11ff:" | grep -c -E "(handle|bitstream)"
+29896
+
+ + diff --git a/docs/sitemap.xml b/docs/sitemap.xml index b12d8ddcc..18edea762 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,7 +4,7 @@ https://alanorth.github.io/cgspace-notes/2018-11/ - 2018-11-04T22:45:00+02:00 + 2018-11-05T17:45:39+02:00 @@ -194,7 +194,7 @@ https://alanorth.github.io/cgspace-notes/ - 2018-11-04T22:45:00+02:00 + 2018-11-05T17:45:39+02:00 0 @@ -205,7 +205,7 @@ https://alanorth.github.io/cgspace-notes/tags/notes/ - 2018-11-04T22:45:00+02:00 + 2018-11-05T17:45:39+02:00 0 @@ -217,13 +217,13 @@ https://alanorth.github.io/cgspace-notes/posts/ - 2018-11-04T22:45:00+02:00 + 2018-11-05T17:45:39+02:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2018-11-04T22:45:00+02:00 + 2018-11-05T17:45:39+02:00 0