From 0a112d16bf89fed4fd8b891236fcc299d52ab411 Mon Sep 17 00:00:00 2001 From: Alan Orth Date: Thu, 24 Jan 2019 10:59:03 +0200 Subject: [PATCH] Add notes for 2019-01-24 --- content/posts/2019-01.md | 58 +++++++++++++++++++++++++++++++++ docs/2019-01/index.html | 70 ++++++++++++++++++++++++++++++++++++++-- docs/robots.txt | 2 +- docs/sitemap.xml | 20 ++++++------ 4 files changed, 136 insertions(+), 14 deletions(-) diff --git a/content/posts/2019-01.md b/content/posts/2019-01.md index cb2bbcba2..4bc9df365 100644 --- a/content/posts/2019-01.md +++ b/content/posts/2019-01.md @@ -835,4 +835,62 @@ $ schedtool -D -e ionice -c2 -n7 nice -n19 /home/cgspace.cgiar.org/bin/dspace fi - I think this Launchpad discussion is relevant: https://bugs.launchpad.net/ubuntu/+source/ghostscript/+bug/1806517 - As well as the original Ghostscript bug report: https://bugs.ghostscript.com/show_bug.cgi?id=699815 +## 2019-01-24 + +- I noticed Ubuntu's Ghostscript 9.26 works on some troublesome PDFs where Arch's Ghostscript 9.26 doesn't, so the fix for the first/last page crash is not the patch I found yesterday +- Ubuntu's Ghostscript uses another [patch from Ghostscript git](http://git.ghostscript.com/?p=ghostpdl.git;h=fae21f1668d2b44b18b84cf0923a1d5f3008a696) ([upstream bug report](https://bugs.ghostscript.com/show_bug.cgi?id=700315)) +- I re-compiled Arch's ghostscript with the patch and then I was able to generate a thumbnail from one of the [troublesome PDFs](https://cgspace.cgiar.org/handle/10568/98390) +- Before and after: + +``` +$ identify Food\ safety\ Kenya\ fruits.pdf\[0\] +zsh: abort (core dumped) identify Food\ safety\ Kenya\ fruits.pdf\[0\] +$ identify Food\ safety\ Kenya\ fruits.pdf\[0\] +Food safety Kenya fruits.pdf[0]=>Food safety Kenya fruits.pdf PDF 612x792 612x792+0+0 16-bit sRGB 64626B 0.000u 0:00.000 +identify: CorruptImageProfile `xmp' @ warning/profile.c/SetImageProfileInternal/1747. 
+``` + +- I reported it to the Arch Linux bug tracker ([61513](https://bugs.archlinux.org/task/61513)) +- I told Atmire to go ahead with the Metadata Quality Module addition based on our `5_x-dev` branch ([657](https://tracker.atmire.com/tickets-cgiar-ilri/view-ticket?id=657)) +- Linode sent alerts last night to say that CGSpace (linode18) was using high CPU; here are the top ten IPs from the nginx logs around that time: + +``` +# zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "23/Jan/2019:(18|19|20)" | awk '{print $1}' | sort | uniq -c | sort -n | tail -n 10 + 305 3.81.136.184 + 306 3.83.14.11 + 306 52.54.252.47 + 325 54.221.57.180 + 378 66.249.64.157 + 424 54.70.40.11 + 497 47.29.247.74 + 783 35.237.175.180 + 1108 66.249.64.155 + 2378 45.5.186.2 +``` + +- 45.5.186.2 is CIAT and 66.249.64.155 is Google... hmmm. +- Linode sent another alert this morning, here are the top ten IPs active during that time: + +``` +# zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "24/Jan/2019:0(4|5|6)" | awk '{print $1}' | sort | uniq -c | sort -n | tail -n 10 + 360 3.89.134.93 + 362 34.230.15.139 + 366 100.24.48.177 + 369 18.212.208.240 + 377 3.81.136.184 + 404 54.221.57.180 + 506 66.249.64.155 + 4642 70.32.83.92 + 4643 205.186.128.185 + 8593 45.5.186.2 +``` + +- Just double checking what CIAT is doing, they are mainly hitting the REST API: + +``` +# zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "24/Jan/2019:" | grep 45.5.186.2 | grep -Eo "GET /(handle|bitstream|rest|oai)/" | sort | uniq -c | sort -n +``` + +- CIAT's community currently has 12,000 items in it so this is normal + diff --git a/docs/2019-01/index.html b/docs/2019-01/index.html index 372826780..f06777952 100644 --- a/docs/2019-01/index.html +++ b/docs/2019-01/index.html @@ -27,7 +27,7 @@ I don’t see anything interesting in the web server logs around that time t " /> - + @@ -60,9 +60,9 @@ I don’t see anything interesting in the web server logs around 
that time t "@type": "BlogPosting", "headline": "January, 2019", "url": "https://alanorth.github.io/cgspace-notes/2019-01/", - "wordCount": "4210", + "wordCount": "4540", "datePublished": "2019-01-02T09:48:30+02:00", - "dateModified": "2019-01-23T17:27:09+02:00", + "dateModified": "2019-01-23T18:21:06+02:00", "author": { "@type": "Person", "name": "Alan Orth" @@ -1122,6 +1122,70 @@ $ schedtool -D -e ionice -c2 -n7 nice -n19 /home/cgspace.cgiar.org/bin/dspace fi
  • As well as the original Ghostscript bug report: https://bugs.ghostscript.com/show_bug.cgi?id=699815
  • +

    2019-01-24

    + + + +
    $ identify Food\ safety\ Kenya\ fruits.pdf\[0\]
    +zsh: abort (core dumped)  identify Food\ safety\ Kenya\ fruits.pdf\[0\]
    +$ identify Food\ safety\ Kenya\ fruits.pdf\[0\]
    +Food safety Kenya fruits.pdf[0]=>Food safety Kenya fruits.pdf PDF 612x792 612x792+0+0 16-bit sRGB 64626B 0.000u 0:00.000
    +identify: CorruptImageProfile `xmp' @ warning/profile.c/SetImageProfileInternal/1747.
    +
    + + + +
    # zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "23/Jan/2019:(18|19|20)" | awk '{print $1}' | sort | uniq -c | sort -n | tail -n 10
    +    305 3.81.136.184
    +    306 3.83.14.11
    +    306 52.54.252.47
    +    325 54.221.57.180
    +    378 66.249.64.157
    +    424 54.70.40.11
    +    497 47.29.247.74
    +    783 35.237.175.180
    +   1108 66.249.64.155
    +   2378 45.5.186.2
    +
    + + + +
    # zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "24/Jan/2019:0(4|5|6)" | awk '{print $1}' | sort | uniq -c | sort -n | tail -n 10
    +    360 3.89.134.93
    +    362 34.230.15.139
    +    366 100.24.48.177
    +    369 18.212.208.240
    +    377 3.81.136.184
    +    404 54.221.57.180
    +    506 66.249.64.155
    +   4642 70.32.83.92
    +   4643 205.186.128.185
    +   8593 45.5.186.2
    +
    + + + +
    # zcat --force /var/log/nginx/*.log /var/log/nginx/*.log.1 | grep -E "24/Jan/2019:" | grep 45.5.186.2 | grep -Eo "GET /(handle|bitstream|rest|oai)/" | sort | uniq -c | sort -n
    +
    + + + diff --git a/docs/robots.txt b/docs/robots.txt index c454234ec..1405dffd5 100644 --- a/docs/robots.txt +++ b/docs/robots.txt @@ -43,7 +43,7 @@ Disallow: /cgspace-notes/2015-12/ Disallow: /cgspace-notes/2015-11/ Disallow: /cgspace-notes/ Disallow: /cgspace-notes/categories/ -Disallow: /cgspace-notes/categories/notes/ Disallow: /cgspace-notes/tags/notes/ +Disallow: /cgspace-notes/categories/notes/ Disallow: /cgspace-notes/posts/ Disallow: /cgspace-notes/tags/ diff --git a/docs/sitemap.xml b/docs/sitemap.xml index 11bb1dbfe..215d52d81 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -4,7 +4,7 @@ https://alanorth.github.io/cgspace-notes/2019-01/ - 2019-01-23T17:27:09+02:00 + 2019-01-23T18:21:06+02:00 @@ -204,7 +204,7 @@ https://alanorth.github.io/cgspace-notes/ - 2019-01-23T17:27:09+02:00 + 2019-01-23T18:21:06+02:00 0 @@ -213,27 +213,27 @@ 0 + + https://alanorth.github.io/cgspace-notes/tags/notes/ + 2019-01-23T18:21:06+02:00 + 0 + + https://alanorth.github.io/cgspace-notes/categories/notes/ 2018-03-09T22:10:33+02:00 0 - - https://alanorth.github.io/cgspace-notes/tags/notes/ - 2019-01-23T17:27:09+02:00 - 0 - - https://alanorth.github.io/cgspace-notes/posts/ - 2019-01-23T17:27:09+02:00 + 2019-01-23T18:21:06+02:00 0 https://alanorth.github.io/cgspace-notes/tags/ - 2019-01-23T17:27:09+02:00 + 2019-01-23T18:21:06+02:00 0