1
0
mirror of https://github.com/ilri/csv-metadata-quality.git synced 2024-11-17 11:37:03 +01:00

Check comma space on bibliographicCitation too

The regex only matched a lowercase `citation`, so it caught
`dc.identifier.citation` but missed `dcterms.bibliographicCitation`
(capital "C"). Match `[Cc]itation` so that both fields are covered.
This commit is contained in:
Alan Orth 2023-03-10 16:13:16 +03:00
parent 45a310387a
commit d661ffe439
Signed by: alanorth
GPG Key ID: 0FB860CC9C45B1B9

View File

@@ -102,7 +102,7 @@ def run(argv):
# Fix: missing space after comma. Only run on author and citation
# fields for now, as this problem is mostly an issue in names.
if args.unsafe_fixes:
-match = re.match(r"^.*?(author|citation).*$", column)
+match = re.match(r"^.*?(author|[Cc]itation).*$", column)
if match is not None:
df[column] = df[column].apply(fix.comma_space, field_name=column)