diff --git a/docs/2015-11/index.html b/docs/2015-11/index.html index 9f4275886..d3247d591 100644 --- a/docs/2015-11/index.html +++ b/docs/2015-11/index.html @@ -297,6 +297,8 @@ db.statementpool = true
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -305,8 +307,6 @@ db.statementpool = true
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2015-12/index.html b/docs/2015-12/index.html index affc7cc79..4fdf4f6f5 100644 --- a/docs/2015-12/index.html +++ b/docs/2015-12/index.html @@ -314,6 +314,8 @@ $ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -322,8 +324,6 @@ $ curl -o /dev/null -s -w %{time_total}\\n https://cgspace.cgiar.org/rest/handle
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-01/index.html b/docs/2016-01/index.html index 9064b2f7c..fd95f5080 100644 --- a/docs/2016-01/index.html +++ b/docs/2016-01/index.html @@ -229,6 +229,8 @@ $ find SimpleArchiveForBio/ -iname “*.pdf” -exec basename {} \; | so
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -237,8 +239,6 @@ $ find SimpleArchiveForBio/ -iname “*.pdf” -exec basename {} \; | so
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-02/index.html b/docs/2016-02/index.html index 17406d2a9..e79fe7eb8 100644 --- a/docs/2016-02/index.html +++ b/docs/2016-02/index.html @@ -482,6 +482,8 @@ Bitstream: tést señora alimentación.pdf
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -490,8 +492,6 @@ Bitstream: tést señora alimentación.pdf
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-03/index.html b/docs/2016-03/index.html index a86a44f41..9ddd7f068 100644 --- a/docs/2016-03/index.html +++ b/docs/2016-03/index.html @@ -382,6 +382,8 @@ Reinstall my local (Mac OS X) DSpace stack with Tomcat 7, PostgreSQL 9.3, and Ja
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -390,8 +392,6 @@ Reinstall my local (Mac OS X) DSpace stack with Tomcat 7, PostgreSQL 9.3, and Ja
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-04/index.html b/docs/2016-04/index.html index 728f1c57b..d405f2a78 100644 --- a/docs/2016-04/index.html +++ b/docs/2016-04/index.html @@ -599,6 +599,8 @@ dspace.log.2016-04-27:7271
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -607,8 +609,6 @@ dspace.log.2016-04-27:7271
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-05/index.html b/docs/2016-05/index.html index 477f866a7..282c73e0f 100644 --- a/docs/2016-05/index.html +++ b/docs/2016-05/index.html @@ -449,6 +449,8 @@ sys 0m20.540s
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -457,8 +459,6 @@ sys 0m20.540s
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-06/index.html b/docs/2016-06/index.html index 6266e23d9..34471feb0 100644 --- a/docs/2016-06/index.html +++ b/docs/2016-06/index.html @@ -494,6 +494,8 @@ $ ./delete-metadata-values.py -f dc.contributor.corporate -i Corporate-Authors-D
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -502,8 +504,6 @@ $ ./delete-metadata-values.py -f dc.contributor.corporate -i Corporate-Authors-D
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-07/index.html b/docs/2016-07/index.html index 7eb6625d1..e898588d6 100644 --- a/docs/2016-07/index.html +++ b/docs/2016-07/index.html @@ -412,6 +412,8 @@ discovery.index.authority.ignore-variants=true
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -420,8 +422,6 @@ discovery.index.authority.ignore-variants=true
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-08/index.html b/docs/2016-08/index.html index aa4d5d644..65f06dea1 100644 --- a/docs/2016-08/index.html +++ b/docs/2016-08/index.html @@ -485,6 +485,8 @@ $ JAVA_OPTS="-Dfile.encoding=UTF-8 -Xmx512m" /home/cgspace.cgiar.org/b
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -493,8 +495,6 @@ $ JAVA_OPTS="-Dfile.encoding=UTF-8 -Xmx512m" /home/cgspace.cgiar.org/b
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-09/index.html b/docs/2016-09/index.html index 7638d8a23..bbc0568ca 100644 --- a/docs/2016-09/index.html +++ b/docs/2016-09/index.html @@ -785,6 +785,8 @@ $ ./delete-metadata-values.py -i ilrisubjects-delete-13.csv -f cg.subject.ilri -
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -793,8 +795,6 @@ $ ./delete-metadata-values.py -i ilrisubjects-delete-13.csv -f cg.subject.ilri -
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-10/index.html b/docs/2016-10/index.html index f6613c7cb..bec36fd00 100644 --- a/docs/2016-10/index.html +++ b/docs/2016-10/index.html @@ -470,6 +470,8 @@ dspace=# update metadatavalue set text_value = regexp_replace(text_value, 'http:
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -478,8 +480,6 @@ dspace=# update metadatavalue set text_value = regexp_replace(text_value, 'http:
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-11/index.html b/docs/2016-11/index.html index 6169e985e..a111ad567 100644 --- a/docs/2016-11/index.html +++ b/docs/2016-11/index.html @@ -687,6 +687,8 @@ org.dspace.discovery.SearchServiceException: Error executing query
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -695,8 +697,6 @@ org.dspace.discovery.SearchServiceException: Error executing query
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2016-12/index.html b/docs/2016-12/index.html index b92ff6a76..e353e6fc6 100644 --- a/docs/2016-12/index.html +++ b/docs/2016-12/index.html @@ -923,6 +923,8 @@ $ exit
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -931,8 +933,6 @@ $ exit
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-01/index.html b/docs/2017-01/index.html index 0b3d61765..c1e1d3977 100644 --- a/docs/2017-01/index.html +++ b/docs/2017-01/index.html @@ -468,6 +468,8 @@ $ gs -sDEVICE=pdfwrite -dCompatibilityLevel=1.4 -dPDFSETTINGS=/ebook -dNOPAUSE -
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -476,8 +478,6 @@ $ gs -sDEVICE=pdfwrite -dCompatibilityLevel=1.4 -dPDFSETTINGS=/ebook -dNOPAUSE -
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-02/index.html b/docs/2017-02/index.html index 3692cfe16..294ad80a3 100644 --- a/docs/2017-02/index.html +++ b/docs/2017-02/index.html @@ -540,6 +540,8 @@ COPY 1968
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -548,8 +550,6 @@ COPY 1968
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-03/index.html b/docs/2017-03/index.html index 24cfb68fc..c90fab597 100644 --- a/docs/2017-03/index.html +++ b/docs/2017-03/index.html @@ -454,6 +454,8 @@ $ ./delete-metadata-values.py -i Investors-Delete-121.csv -f dc.description.spon
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -462,8 +464,6 @@ $ ./delete-metadata-values.py -i Investors-Delete-121.csv -f dc.description.spon
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-04/index.html b/docs/2017-04/index.html index 66cb5c521..0ea1948fe 100644 --- a/docs/2017-04/index.html +++ b/docs/2017-04/index.html @@ -733,6 +733,8 @@ $ gem install compass -v 1.0.3
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -741,8 +743,6 @@ $ gem install compass -v 1.0.3
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-05/index.html b/docs/2017-05/index.html index 34570ff2c..edc94ffc4 100644 --- a/docs/2017-05/index.html +++ b/docs/2017-05/index.html @@ -487,6 +487,8 @@ UPDATE 187
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -495,8 +497,6 @@ UPDATE 187
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-06/index.html b/docs/2017-06/index.html index 067b1070c..16f0c0202 100644 --- a/docs/2017-06/index.html +++ b/docs/2017-06/index.html @@ -305,6 +305,8 @@ $ JAVA_OPTS="-Xmx1024m -Dfile.encoding=UTF-8" [dspace]/bin/dspace impo
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -313,8 +315,6 @@ $ JAVA_OPTS="-Xmx1024m -Dfile.encoding=UTF-8" [dspace]/bin/dspace impo
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-07/index.html b/docs/2017-07/index.html index 5dd91eacf..fd876cc0d 100644 --- a/docs/2017-07/index.html +++ b/docs/2017-07/index.html @@ -340,6 +340,8 @@ delete from metadatavalue where resource_type_id=2 and metadata_field_id=235 and
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -348,8 +350,6 @@ delete from metadatavalue where resource_type_id=2 and metadata_field_id=235 and
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-08/index.html b/docs/2017-08/index.html index 22e372a9d..4e3674c3b 100644 --- a/docs/2017-08/index.html +++ b/docs/2017-08/index.html @@ -626,6 +626,8 @@ org.apache.commons.dbcp.SQLNestedException: Cannot get a connection, pool error
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -634,8 +636,6 @@ org.apache.commons.dbcp.SQLNestedException: Cannot get a connection, pool error
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-09/index.html b/docs/2017-09/index.html index 29c2c7c56..0ae4a5bd1 100644 --- a/docs/2017-09/index.html +++ b/docs/2017-09/index.html @@ -798,6 +798,8 @@ Cert Status: good
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -806,8 +808,6 @@ Cert Status: good
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-10/index.html b/docs/2017-10/index.html index ee264909d..5917eb6dc 100644 --- a/docs/2017-10/index.html +++ b/docs/2017-10/index.html @@ -563,6 +563,8 @@ session_id=6C30F10B4351A4ED83EC6ED50AFD6B6A
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -571,8 +573,6 @@ session_id=6C30F10B4351A4ED83EC6ED50AFD6B6A
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-11/index.html b/docs/2017-11/index.html index f50f95908..bf7aa1bde 100644 --- a/docs/2017-11/index.html +++ b/docs/2017-11/index.html @@ -1207,6 +1207,8 @@ $ cat dspace.log.2017-11-28 | grep -o -E 'session_id=[A-Z0-9]{32}' | sort -n | u
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -1215,8 +1217,6 @@ $ cat dspace.log.2017-11-28 | grep -o -E 'session_id=[A-Z0-9]{32}' | sort -n | u
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2017-12/index.html b/docs/2017-12/index.html index 3cf21646a..e44573a16 100644 --- a/docs/2017-12/index.html +++ b/docs/2017-12/index.html @@ -972,6 +972,8 @@ DELETE 20
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -980,8 +982,6 @@ DELETE 20
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2018-01/index.html b/docs/2018-01/index.html index 4869c123f..45c89539e 100644 --- a/docs/2018-01/index.html +++ b/docs/2018-01/index.html @@ -1799,6 +1799,8 @@ Catalina:type=Manager,context=/,host=localhost activeSessions 8
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -1807,8 +1809,6 @@ Catalina:type=Manager,context=/,host=localhost activeSessions 8
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2018-02/index.html b/docs/2018-02/index.html index f6350e7e8..d030fc3bb 100644 --- a/docs/2018-02/index.html +++ b/docs/2018-02/index.html @@ -1317,6 +1317,8 @@ UPDATE 3
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -1325,8 +1327,6 @@ UPDATE 3
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2018-03/index.html b/docs/2018-03/index.html index ce40b9178..c4e21086c 100644 --- a/docs/2018-03/index.html +++ b/docs/2018-03/index.html @@ -745,6 +745,8 @@ Fixed 5 occurences of: GENEBANKS
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -753,8 +755,6 @@ Fixed 5 occurences of: GENEBANKS
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2018-04/index.html b/docs/2018-04/index.html index 1943c2cdd..8f2e89832 100644 --- a/docs/2018-04/index.html +++ b/docs/2018-04/index.html @@ -742,6 +742,8 @@ $ pg_restore -O -U dspacetest -d dspacetest -W -h localhost /tmp/dspace_2018-04-
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -750,8 +752,6 @@ $ pg_restore -O -U dspacetest -d dspacetest -W -h localhost /tmp/dspace_2018-04-
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/2018-05/index.html b/docs/2018-05/index.html new file mode 100644 index 000000000..9f500247b --- /dev/null +++ b/docs/2018-05/index.html @@ -0,0 +1,221 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + May, 2018 | CGSpace Notes + + + + + + + + + + + + + + + + + +
+
+ +
+
+ + + +
+
+

CGSpace Notes

+

Documenting day-to-day work on the CGSpace repository.

+
+
+ + + +
+
+
+ + + + +
+
+

May, 2018

+ +
+

2018-05-01

+ + + +

+ + + + + +
+ + + +
+ + + + +
+
+ + + + + + + + + diff --git a/docs/404.html b/docs/404.html index 549aabfd2..4c9cdea2c 100644 --- a/docs/404.html +++ b/docs/404.html @@ -98,6 +98,8 @@
    +
  1. May, 2018
  2. +
  3. April, 2018
  4. March, 2018
  5. @@ -106,8 +108,6 @@
  6. January, 2018
  7. -
  8. December, 2017
  9. -
diff --git a/docs/categories/index.html b/docs/categories/index.html index 6c9e2c002..74199fc60 100644 --- a/docs/categories/index.html +++ b/docs/categories/index.html @@ -100,6 +100,37 @@ +
+
+

May, 2018

+ +
+

2018-05-01

+ + + +

+ Read more → +
+ + + + + +

April, 2018

@@ -422,48 +453,6 @@ COPY 54701 - -
-
-

August, 2017

- -
-

2017-08-01

- -
    -
  • Linode sent an alert that CGSpace (linode18) was using 350% CPU for the past two hours
  • -
  • I looked in the Activity pane of the Admin Control Panel and it seems that Google, Baidu, Yahoo, and Bing are all crawling with massive numbers of bots concurrently (~100 total, mostly Baidu and Google)
  • -
  • The good thing is that, according to dspace.log.2017-08-01, they are all using the same Tomcat session
  • -
  • This means our Tomcat Crawler Session Valve is working
  • -
  • But many of the bots are browsing dynamic URLs like: - -
      -
    • /handle/10568/3353/discover
    • -
    • /handle/10568/16510/browse
    • -
  • -
  • The robots.txt only blocks the top-level /discover and /browse URLs… we will need to find a way to forbid them from accessing these!
  • -
  • Relevant issue from DSpace Jira (semi resolved in DSpace 6.0): https://jira.duraspace.org/browse/DS-2962
  • -
  • It turns out that we’re already adding the X-Robots-Tag "none" HTTP header, but this only forbids the search engine from indexing the page, not crawling it!
  • -
  • Also, the bot has to successfully browse the page first so it can receive the HTTP header…
  • -
  • We might actually have to block these requests with HTTP 403 depending on the user agent
  • -
  • Abenet pointed out that the CGIAR Library Historical Archive collection I sent July 20th only had ~100 entries, instead of 2415
  • -
  • This was due to newline characters in the dc.description.abstract column, which caused OpenRefine to choke when exporting the CSV
  • -
  • I exported a new CSV from the collection on DSpace Test and then manually removed the characters in vim using g/^$/d
  • -
  • Then I cleaned up the author authorities and HTML characters in OpenRefine and sent the file back to Abenet
  • -
- -

- Read more → -
- - - - -