mirror of
https://github.com/alanorth/cgspace-notes.git
synced 2025-01-27 05:49:12 +01:00
Add notes for 2017-03-01
This commit is contained in:
@ -12,7 +12,7 @@
|
||||
|
||||
|
||||
|
||||
<meta property="og:updated_time" content="2017-02-07T07:04:52-08:00"/>
|
||||
<meta property="og:updated_time" content="2017-03-01T17:08:52+02:00"/>
|
||||
|
||||
|
||||
|
||||
@ -40,7 +40,7 @@
|
||||
},
|
||||
|
||||
|
||||
"dateModified": "2017-02-07T07:04:52-08:00",
|
||||
"dateModified": "2017-03-01T17:08:52+02:00",
|
||||
|
||||
|
||||
|
||||
@ -103,6 +103,28 @@
|
||||
|
||||
|
||||
|
||||
<article class="blog-post">
|
||||
<header>
|
||||
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2017-03/">March, 2017</a></h2>
|
||||
<p class="blog-post-meta"><time datetime="2017-03-01T17:08:52+02:00">Wed Mar 01, 2017</time> by Alan Orth in
|
||||
|
||||
<i class="fa fa-tag" aria-hidden="true"></i> <a href="/cgspace-notes/tags/notes" rel="tag">Notes</a>
|
||||
|
||||
</p>
|
||||
</header>
|
||||
<h2 id="2017-03-01">2017-03-01</h2>
|
||||
|
||||
<ul>
|
||||
<li>Run the 279 CIAT author corrections on CGSpace</li>
|
||||
</ul>
|
||||
|
||||
<p></p>
|
||||
<a href='https://alanorth.github.io/cgspace-notes/2017-03/'>Read more →</a>
|
||||
</article>
|
||||
|
||||
|
||||
|
||||
|
||||
<article class="blog-post">
|
||||
<header>
|
||||
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2017-02/">February, 2017</a></h2>
|
||||
@ -379,34 +401,6 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
|
||||
|
||||
|
||||
|
||||
<article class="blog-post">
|
||||
<header>
|
||||
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-05/">May, 2016</a></h2>
|
||||
<p class="blog-post-meta"><time datetime="2016-05-01T23:06:00+03:00">Sun May 01, 2016</time> by Alan Orth in
|
||||
|
||||
<i class="fa fa-tag" aria-hidden="true"></i> <a href="/cgspace-notes/tags/notes" rel="tag">Notes</a>
|
||||
|
||||
</p>
|
||||
</header>
|
||||
<h2 id="2016-05-01">2016-05-01</h2>
|
||||
|
||||
<ul>
|
||||
<li>Since yesterday there have been 10,000 REST errors and the site has been unstable again</li>
|
||||
<li>I have blocked access to the API now</li>
|
||||
<li>There are 3,000 IPs accessing the REST API in a 24-hour period!</li>
|
||||
</ul>
|
||||
|
||||
<pre><code># awk '{print $1}' /var/log/nginx/rest.log | uniq | wc -l
|
||||
3168
|
||||
</code></pre>
|
||||
|
||||
<p></p>
|
||||
<a href='https://alanorth.github.io/cgspace-notes/2016-05/'>Read more →</a>
|
||||
</article>
|
||||
|
||||
|
||||
|
||||
|
||||
<nav class="blog-pagination">
|
||||
|
||||
|
||||
@ -431,6 +425,8 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
|
||||
<h4>Recent Posts</h4>
|
||||
<ol class="list-unstyled">
|
||||
|
||||
<li><a href="/cgspace-notes/2017-03/">March, 2017</a></li>
|
||||
|
||||
<li><a href="/cgspace-notes/2017-02/">February, 2017</a></li>
|
||||
|
||||
<li><a href="/cgspace-notes/2017-01/">January, 2017</a></li>
|
||||
@ -439,8 +435,6 @@ dspacetest=# select text_value from metadatavalue where metadata_field_id=3 and
|
||||
|
||||
<li><a href="/cgspace-notes/2016-11/">November, 2016</a></li>
|
||||
|
||||
<li><a href="/cgspace-notes/2016-10/">October, 2016</a></li>
|
||||
|
||||
</ol>
|
||||
</section>
|
||||
|
||||
|
@ -6,9 +6,24 @@
|
||||
<description>Recent content in Posts on CGSpace Notes</description>
|
||||
<generator>Hugo -- gohugo.io</generator>
|
||||
<language>en-us</language>
|
||||
<lastBuildDate>Tue, 07 Feb 2017 07:04:52 -0800</lastBuildDate>
|
||||
<lastBuildDate>Wed, 01 Mar 2017 17:08:52 +0200</lastBuildDate>
|
||||
<atom:link href="https://alanorth.github.io/cgspace-notes/post/index.xml" rel="self" type="application/rss+xml" />
|
||||
|
||||
<item>
|
||||
<title>March, 2017</title>
|
||||
<link>https://alanorth.github.io/cgspace-notes/2017-03/</link>
|
||||
<pubDate>Wed, 01 Mar 2017 17:08:52 +0200</pubDate>
|
||||
|
||||
<guid>https://alanorth.github.io/cgspace-notes/2017-03/</guid>
|
||||
<description><h2 id="2017-03-01">2017-03-01</h2>
|
||||
|
||||
<ul>
|
||||
<li>Run the 279 CIAT author corrections on CGSpace</li>
|
||||
</ul>
|
||||
|
||||
<p></p></description>
|
||||
</item>
|
||||
|
||||
<item>
|
||||
<title>February, 2017</title>
|
||||
<link>https://alanorth.github.io/cgspace-notes/2017-02/</link>
|
||||
@ -5379,174 +5394,5 @@ $ find SimpleArchiveForBio/ -iname &ldquo;*.pdf&rdquo; -exec basename {}
|
||||
<p><img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2016/01/xmlui-subjects-after.png" alt="XMLUI subjects after" /></p></description>
|
||||
</item>
|
||||
|
||||
<item>
|
||||
<title>December, 2015</title>
|
||||
<link>https://alanorth.github.io/cgspace-notes/2015-12/</link>
|
||||
<pubDate>Wed, 02 Dec 2015 13:18:00 +0300</pubDate>
|
||||
|
||||
<guid>https://alanorth.github.io/cgspace-notes/2015-12/</guid>
|
||||
<description><h2 id="2015-12-02">2015-12-02</h2>
|
||||
|
||||
<ul>
|
||||
<li>Replace <code>lzop</code> with <code>xz</code> in log compression cron jobs on DSpace Test—it uses less space:</li>
|
||||
</ul>
|
||||
|
||||
<pre><code># cd /home/dspacetest.cgiar.org/log
|
||||
# ls -lh dspace.log.2015-11-18*
|
||||
-rw-rw-r-- 1 tomcat7 tomcat7 2.0M Nov 18 23:59 dspace.log.2015-11-18
|
||||
-rw-rw-r-- 1 tomcat7 tomcat7 387K Nov 18 23:59 dspace.log.2015-11-18.lzo
|
||||
-rw-rw-r-- 1 tomcat7 tomcat7 169K Nov 18 23:59 dspace.log.2015-11-18.xz
|
||||
</code></pre>
|
||||
|
||||
<p></p>
|
||||
|
||||
<ul>
|
||||
<li>I had used lrzip once, but it needs more memory and is harder to use as it requires the lrztar wrapper</li>
|
||||
<li>Need to remember to go check if everything is ok in a few days and then change CGSpace</li>
|
||||
<li>CGSpace went down again (due to PostgreSQL idle connections of course)</li>
|
||||
<li>Current database settings for DSpace are <code>db.maxconnections = 30</code> and <code>db.maxidle = 8</code>, yet idle connections are exceeding this:</li>
|
||||
</ul>
|
||||
|
||||
<pre><code>$ psql -c 'SELECT * from pg_stat_activity;' | grep cgspace | grep -c idle
|
||||
39
|
||||
</code></pre>
|
||||
|
||||
<ul>
|
||||
<li>I restarted PostgreSQL and Tomcat and it&rsquo;s back</li>
|
||||
<li>On a related note of why CGSpace is so slow, I decided to finally try the <code>pgtune</code> script to tune the postgres settings:</li>
|
||||
</ul>
|
||||
|
||||
<pre><code># apt-get install pgtune
|
||||
# pgtune -i /etc/postgresql/9.3/main/postgresql.conf -o postgresql.conf-pgtune
|
||||
# mv /etc/postgresql/9.3/main/postgresql.conf /etc/postgresql/9.3/main/postgresql.conf.orig
|
||||
# mv postgresql.conf-pgtune /etc/postgresql/9.3/main/postgresql.conf
|
||||
</code></pre>
|
||||
|
||||
<ul>
|
||||
<li>It introduced the following new settings:</li>
|
||||
</ul>
|
||||
|
||||
<pre><code>default_statistics_target = 50
|
||||
maintenance_work_mem = 480MB
|
||||
constraint_exclusion = on
|
||||
checkpoint_completion_target = 0.9
|
||||
effective_cache_size = 5632MB
|
||||
work_mem = 48MB
|
||||
wal_buffers = 8MB
|
||||
checkpoint_segments = 16
|
||||
shared_buffers = 1920MB
|
||||
max_connections = 80
|
||||
</code></pre>
|
||||
|
||||
<ul>
|
||||
<li>Now I need to go read PostgreSQL docs about these options, and watch memory settings in munin etc</li>
|
||||
<li>For what it&rsquo;s worth, now the REST API should be faster (because of these PostgreSQL tweaks):</li>
|
||||
</ul>
|
||||
|
||||
<pre><code>$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
1.474
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
2.141
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
1.685
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
1.995
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
1.786
|
||||
</code></pre>
|
||||
|
||||
<ul>
|
||||
<li>Last week it was an average of 8 seconds&hellip; now this is <sup>1</sup>&frasl;<sub>4</sub> of that</li>
|
||||
<li>CCAFS noticed that one of their items displays only the Atmire statlets: <a href="https://cgspace.cgiar.org/handle/10568/42445">https://cgspace.cgiar.org/handle/10568/42445</a></li>
|
||||
</ul>
|
||||
|
||||
<p><img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2015/12/ccafs-item-no-metadata.png" alt="CCAFS item" /></p>
|
||||
|
||||
<ul>
|
||||
<li>The authorizations for the item are all public READ, and I don&rsquo;t see any errors in dspace.log when browsing that item</li>
|
||||
<li>I filed a ticket on Atmire&rsquo;s issue tracker</li>
|
||||
<li>I also filed a ticket on Atmire&rsquo;s issue tracker for the PostgreSQL stuff</li>
|
||||
</ul>
|
||||
|
||||
<h2 id="2015-12-03">2015-12-03</h2>
|
||||
|
||||
<ul>
|
||||
<li>CGSpace very slow, and monitoring is emailing me to say it&rsquo;s down, even though I can load the page (very slowly)</li>
|
||||
<li>Idle postgres connections look like this (with no change in DSpace db settings lately):</li>
|
||||
</ul>
|
||||
|
||||
<pre><code>$ psql -c 'SELECT * from pg_stat_activity;' | grep cgspace | grep -c idle
|
||||
29
|
||||
</code></pre>
|
||||
|
||||
<ul>
|
||||
<li>I restarted Tomcat and postgres&hellip;</li>
|
||||
<li>Atmire commented that we should raise the JVM heap size by ~500M, so it is now <code>-Xms3584m -Xmx3584m</code></li>
|
||||
<li>We weren&rsquo;t out of heap yet, but it&rsquo;s probably fair enough that the DSpace 5 upgrade (and new Atmire modules) requires more memory so it&rsquo;s ok</li>
|
||||
<li>A possible side effect is that I see that the REST API is twice as fast for the request above now:</li>
|
||||
</ul>
|
||||
|
||||
<pre><code>$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
1.368
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.968
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
1.006
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.849
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.806
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.854
|
||||
</code></pre>
|
||||
|
||||
<h2 id="2015-12-05">2015-12-05</h2>
|
||||
|
||||
<ul>
|
||||
<li>CGSpace has been up and down all day and REST API is completely unresponsive</li>
|
||||
<li>PostgreSQL idle connections are currently:</li>
|
||||
</ul>
|
||||
|
||||
<pre><code>postgres@linode01:~$ psql -c 'SELECT * from pg_stat_activity;' | grep cgspace | grep -c idle
|
||||
28
|
||||
</code></pre>
|
||||
|
||||
<ul>
|
||||
<li>I have reverted all the pgtune tweaks from the other day, as they didn&rsquo;t fix the stability issues, so I&rsquo;d rather not have them introducing more variables into the equation</li>
|
||||
<li>The PostgreSQL stats from Munin all point to something database-related with the DSpace 5 upgrade around mid–late November</li>
|
||||
</ul>
|
||||
|
||||
<p><img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2015/12/postgres_bgwriter-year.png" alt="PostgreSQL bgwriter (year)" />
|
||||
<img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2015/12/postgres_cache_cgspace-year.png" alt="PostgreSQL cache (year)" />
|
||||
<img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2015/12/postgres_locks_cgspace-year.png" alt="PostgreSQL locks (year)" />
|
||||
<img src="https://alanorth.github.io/cgspace-notes/cgspace-notes/2015/12/postgres_scans_cgspace-year.png" alt="PostgreSQL scans (year)" /></p>
|
||||
|
||||
<h2 id="2015-12-07">2015-12-07</h2>
|
||||
|
||||
<ul>
|
||||
<li>Atmire sent <a href="https://github.com/ilri/DSpace/pull/161">some fixes</a> to DSpace&rsquo;s REST API code that was leaving contexts open (causing the slow performance and database issues)</li>
|
||||
<li>After deploying the fix to CGSpace the REST API is consistently faster:</li>
|
||||
</ul>
|
||||
|
||||
<pre><code>$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.675
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.599
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.588
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.566
|
||||
$ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle/10568/32802?expand=all
|
||||
0.497
|
||||
</code></pre>
|
||||
|
||||
<h2 id="2015-12-08">2015-12-08</h2>
|
||||
|
||||
<ul>
|
||||
<li>Switch CGSpace log compression cron jobs from using lzop to xz—the compression isn&rsquo;t as good, but it&rsquo;s much faster and causes less IO/CPU load</li>
|
||||
<li>Since we figured out (and fixed) the cause of the performance issue, I reverted Google Bot&rsquo;s crawl rate to the &ldquo;Let Google optimize&rdquo; setting</li>
|
||||
</ul></description>
|
||||
</item>
|
||||
|
||||
</channel>
|
||||
</rss>
|
@ -12,7 +12,7 @@
|
||||
|
||||
|
||||
|
||||
<meta property="og:updated_time" content="2016-04-04T11:06:00+03:00"/>
|
||||
<meta property="og:updated_time" content="2016-05-01T23:06:00+03:00"/>
|
||||
|
||||
|
||||
|
||||
@ -40,7 +40,7 @@
|
||||
},
|
||||
|
||||
|
||||
"dateModified": "2016-04-04T11:06:00+03:00",
|
||||
"dateModified": "2016-05-01T23:06:00+03:00",
|
||||
|
||||
|
||||
|
||||
@ -103,6 +103,34 @@
|
||||
|
||||
|
||||
|
||||
<article class="blog-post">
|
||||
<header>
|
||||
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-05/">May, 2016</a></h2>
|
||||
<p class="blog-post-meta"><time datetime="2016-05-01T23:06:00+03:00">Sun May 01, 2016</time> by Alan Orth in
|
||||
|
||||
<i class="fa fa-tag" aria-hidden="true"></i> <a href="/cgspace-notes/tags/notes" rel="tag">Notes</a>
|
||||
|
||||
</p>
|
||||
</header>
|
||||
<h2 id="2016-05-01">2016-05-01</h2>
|
||||
|
||||
<ul>
|
||||
<li>Since yesterday there have been 10,000 REST errors and the site has been unstable again</li>
|
||||
<li>I have blocked access to the API now</li>
|
||||
<li>There are 3,000 IPs accessing the REST API in a 24-hour period!</li>
|
||||
</ul>
|
||||
|
||||
<pre><code># awk '{print $1}' /var/log/nginx/rest.log | uniq | wc -l
|
||||
3168
|
||||
</code></pre>
|
||||
|
||||
<p></p>
|
||||
<a href='https://alanorth.github.io/cgspace-notes/2016-05/'>Read more →</a>
|
||||
</article>
|
||||
|
||||
|
||||
|
||||
|
||||
<article class="blog-post">
|
||||
<header>
|
||||
<h2 class="blog-post-title"><a href="https://alanorth.github.io/cgspace-notes/2016-04/">April, 2016</a></h2>
|
||||
@ -289,6 +317,8 @@
|
||||
<h4>Recent Posts</h4>
|
||||
<ol class="list-unstyled">
|
||||
|
||||
<li><a href="/cgspace-notes/2017-03/">March, 2017</a></li>
|
||||
|
||||
<li><a href="/cgspace-notes/2017-02/">February, 2017</a></li>
|
||||
|
||||
<li><a href="/cgspace-notes/2017-01/">January, 2017</a></li>
|
||||
@ -297,8 +327,6 @@
|
||||
|
||||
<li><a href="/cgspace-notes/2016-11/">November, 2016</a></li>
|
||||
|
||||
<li><a href="/cgspace-notes/2016-10/">October, 2016</a></li>
|
||||
|
||||
</ol>
|
||||
</section>
|
||||
|
||||
|
Reference in New Issue
Block a user