mirror of
https://github.com/alanorth/cgspace-notes.git
synced 2024-12-26 06:54:30 +01:00
Add notes for 2017-08-12
This commit is contained in:
parent
fcd67161f4
commit
7d675f93f8
@ -94,3 +94,24 @@ dspace#= \copy (select distinct text_value, count(*) from metadatavalue where me
|
||||
## 2017-08-12
|
||||
|
||||
- I sent a message to the mailing list about the duplicate content issue with `/rest` and `/bitstream` URLs
|
||||
- Looking at the logs for the REST API on `/rest`, it looks like someone is hammering it, doing testing or something...
|
||||
|
||||
```
|
||||
# awk '{print $1}' /var/log/nginx/rest.log.1 | sort -n | uniq -c | sort -h | tail -n 5
|
||||
140 66.249.66.91
|
||||
404 66.249.66.90
|
||||
1479 50.116.102.77
|
||||
9794 45.5.184.196
|
||||
85736 70.32.83.92
|
||||
```
|
||||
|
||||
- The top offender is 70.32.83.92 which is actually the same IP as ccafs.cgiar.org, so I will email the Macaroni Bros to see if they can test on DSpace Test instead
|
||||
- I've enabled logging of `/oai` requests on nginx as well so we can potentially determine bad actors here (also to see if anyone is actually using OAI!)
|
||||
|
||||
```
|
||||
# log oai requests
|
||||
location /oai {
|
||||
access_log /var/log/nginx/oai.log;
|
||||
proxy_pass http://tomcat_http;
|
||||
}
|
||||
```
|
||||
|
@ -37,7 +37,7 @@ Then I cleaned up the author authorities and HTML characters in OpenRefine and s
|
||||
|
||||
|
||||
<meta property="article:published_time" content="2017-08-01T11:51:52+03:00"/>
|
||||
<meta property="article:modified_time" content="2017-08-12T08:40:59+03:00"/>
|
||||
<meta property="article:modified_time" content="2017-08-12T09:29:02+03:00"/>
|
||||
|
||||
|
||||
|
||||
@ -85,9 +85,9 @@ Then I cleaned up the author authorities and HTML characters in OpenRefine and s
|
||||
"@type": "BlogPosting",
|
||||
"headline": "August, 2017",
|
||||
"url": "https://alanorth.github.io/cgspace-notes/2017-08/",
|
||||
"wordCount": "1207",
|
||||
"wordCount": "1327",
|
||||
"datePublished": "2017-08-01T11:51:52+03:00",
|
||||
"dateModified": "2017-08-12T08:40:59+03:00",
|
||||
"dateModified": "2017-08-12T09:29:02+03:00",
|
||||
"author": {
|
||||
"@type": "Person",
|
||||
"name": "Alan Orth"
|
||||
@ -268,8 +268,29 @@ Then I cleaned up the author authorities and HTML characters in OpenRefine and s
|
||||
|
||||
<ul>
|
||||
<li>I sent a message to the mailing list about the duplicate content issue with <code>/rest</code> and <code>/bitstream</code> URLs</li>
|
||||
<li>Looking at the logs for the REST API on <code>/rest</code>, it looks like someone is hammering it, doing testing or something…</li>
|
||||
</ul>
|
||||
|
||||
<pre><code># awk '{print $1}' /var/log/nginx/rest.log.1 | sort -n | uniq -c | sort -h | tail -n 5
|
||||
140 66.249.66.91
|
||||
404 66.249.66.90
|
||||
1479 50.116.102.77
|
||||
9794 45.5.184.196
|
||||
85736 70.32.83.92
|
||||
</code></pre>
|
||||
|
||||
<ul>
|
||||
<li>The top offender is 70.32.83.92 which is actually the same IP as ccafs.cgiar.org, so I will email the Macaroni Bros to see if they can test on DSpace Test instead</li>
|
||||
<li>I’ve enabled logging of <code>/oai</code> requests on nginx as well so we can potentially determine bad actors here (also to see if anyone is actually using OAI!)</li>
|
||||
</ul>
|
||||
|
||||
<pre><code> # log oai requests
|
||||
location /oai {
|
||||
access_log /var/log/nginx/oai.log;
|
||||
proxy_pass http://tomcat_http;
|
||||
}
|
||||
</code></pre>
|
||||
|
||||
|
||||
|
||||
|
||||
|
@ -4,7 +4,7 @@
|
||||
|
||||
<url>
|
||||
<loc>https://alanorth.github.io/cgspace-notes/2017-08/</loc>
|
||||
<lastmod>2017-08-12T08:40:59+03:00</lastmod>
|
||||
<lastmod>2017-08-12T09:29:02+03:00</lastmod>
|
||||
</url>
|
||||
|
||||
<url>
|
||||
@ -114,7 +114,7 @@
|
||||
|
||||
<url>
|
||||
<loc>https://alanorth.github.io/cgspace-notes/</loc>
|
||||
<lastmod>2017-08-12T08:40:59+03:00</lastmod>
|
||||
<lastmod>2017-08-12T09:29:02+03:00</lastmod>
|
||||
<priority>0</priority>
|
||||
</url>
|
||||
|
||||
@ -125,19 +125,19 @@
|
||||
|
||||
<url>
|
||||
<loc>https://alanorth.github.io/cgspace-notes/tags/notes/</loc>
|
||||
<lastmod>2017-08-12T08:40:59+03:00</lastmod>
|
||||
<lastmod>2017-08-12T09:29:02+03:00</lastmod>
|
||||
<priority>0</priority>
|
||||
</url>
|
||||
|
||||
<url>
|
||||
<loc>https://alanorth.github.io/cgspace-notes/post/</loc>
|
||||
<lastmod>2017-08-12T08:40:59+03:00</lastmod>
|
||||
<lastmod>2017-08-12T09:29:02+03:00</lastmod>
|
||||
<priority>0</priority>
|
||||
</url>
|
||||
|
||||
<url>
|
||||
<loc>https://alanorth.github.io/cgspace-notes/tags/</loc>
|
||||
<lastmod>2017-08-12T08:40:59+03:00</lastmod>
|
||||
<lastmod>2017-08-12T09:29:02+03:00</lastmod>
|
||||
<priority>0</priority>
|
||||
</url>
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user