mirror of
https://github.com/ilri/csv-metadata-quality.git
synced 2025-06-06 09:08:40 +02:00
csv_metadata_quality/app.py: disable whitespace fix on abstracts
The whitespace fix is too aggressive on abstracts. Text pasted in from a PDF often contains newlines, and most of the time people want to keep them.
This commit is contained in:
@ -90,11 +90,13 @@ def run(argv):
|
||||
|
||||
continue
|
||||
|
||||
if args.unsafe_fixes:
|
||||
match = re.match(r"^.*?abstract.*$", column)
|
||||
if match is None:
|
||||
# Fix: whitespace
|
||||
df[column] = df[column].apply(fix.whitespace, field_name=column)
|
||||
|
||||
# Fix: newlines
|
||||
if args.unsafe_fixes:
|
||||
df[column] = df[column].apply(fix.newlines, field_name=column)
|
||||
|
||||
# Fix: missing space after comma. Only run on author and citation
|
||||
|
Reference in New Issue
Block a user