mirror of
https://github.com/ilri/csv-metadata-quality.git
synced 2024-12-22 04:02:19 +01:00
csv_metadata_quality/fix.py: minor update to DOI fix
Normalize www.doi.org to doi.org in DOI field.
This commit is contained in:
parent
c1f630c298
commit
ae38a826ec
@@ -441,6 +441,13 @@ def normalize_dois(field):
|
|||||||
pattern = re.compile(r"dx\.doi\.org")
|
pattern = re.compile(r"dx\.doi\.org")
|
||||||
match = re.findall(pattern, new_value)
|
match = re.findall(pattern, new_value)
|
||||||
|
|
||||||
|
if match:
|
||||||
|
new_value = re.sub(pattern, "doi.org", new_value)
|
||||||
|
|
||||||
|
# Convert www.doi.org to doi.org
|
||||||
|
pattern = re.compile(r"www\.doi\.org")
|
||||||
|
match = re.findall(pattern, new_value)
|
||||||
|
|
||||||
if match:
|
if match:
|
||||||
new_value = re.sub(pattern, "doi.org", new_value)
|
new_value = re.sub(pattern, "doi.org", new_value)
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user