diff --git a/docs/2024-08/index.html b/docs/2024-08/index.html new file mode 100644 index 000000000..81cffb89e --- /dev/null +++ b/docs/2024-08/index.html @@ -0,0 +1,243 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + August, 2024 | CGSpace Notes + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+
+ + + + +
+
+

CGSpace Notes

+

Documenting day-to-day work on the CGSpace repository.

+
+
+ + + + +
+
+
+ + + + +
+
+

August, 2024

+ +
+

2024-08-08

+
    +
  • While working on the CGIAR Climate Change Synthesis I learned some new tricks with OpenRefine
  • +
+
    +
  • The first was to retrieve affiliations from OpenAlex and extract them from JSON with this GREL:
  • +
+
forEach(
+  value.parseJson()['authorships'],
+  a,
+  forEach(
+    a.parseJson()['institutions'],
+    i,
+    i['display_name']
+  ).join("||")
+).join("||")
+
    +
  • It is a nested forEach to extract all institutions for all authors
  • +
  • Second was a better way to deduplicate lists in Jython while preserving list order:
  • +
+
# better dedupe preserves order
+seen = set()
+deduped_list = [x for x in value.split("||") if x not in seen and not seen.add(x)]
+
+return "||".join(deduped_list)
+

2024-08-20

+ +

2024-08-22

+ +
dspace=# \COPY (SELECT m.text_value AS handle_from, h.handle AS handle_to FROM metadatavalue m JOIN handle h on m.dspace_object_id = h.resource_id WHERE m.metadata_field_id=181 AND h.resource_type_id=2 AND h.resource_id IN (SELECT uuid FROM item WHERE in_archive AND NOT withdrawn)) to /tmp/handle-redirects.csv CSV HEADER;
+COPY 400
+
    +
  • Export list of IFPRI CONTENTdm redirects:
  • +
+
dspace-# \COPY (SELECT m.text_value, h.handle FROM metadatavalue m JOIN handle h on m.dspace_object_id = h.resource_id WHERE m.metadata_field_id=28 AND m.text_value LIKE '%URL from IFPRI CONTENTdm%' AND h.resource_type_id=2 AND m.dspace_object_id IN (SELECT uuid FROM item WHERE in_archive AND NOT withdrawn)) to /tmp/ifpri.csv CSV HEADER;
+COPY 10794
+
    +
  • I filed an issue on DSpace Angular for anonymous users to be able to export search results to CSV
  • +
+

2024-08-26

+
    +
  • Spent some time trying to rebase our DSpace Angular themes on top of the massive header/navbar rework from DSpace 7.6.2
  • +
  • Spent some time getting missing bibliographic metadata (issue dates, licenses, pages, volume, issue, publisher, etc) from Crossref for CGSpace
  • +
+ + + + + + +
+ + + +
+ + + + +
+
+ + + + + + + + +