mirror of
https://github.com/ilri/csv-metadata-quality.git
synced 2025-11-01 21:19:09 +01:00
Compare commits
1 Commit
master
...
renovate/l
| Author | SHA1 | Date | |
|---|---|---|---|
| | 97e603fc87 | | |
@@ -7,7 +7,6 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
|
||||
## Unreleased
|
||||
### Changed
|
||||
- New AGROVOC REST API URL
|
||||
- Use urllib from Python stdlib instead of manual replacement for unquoting URLs
|
||||
|
||||
## [0.7.0] - 2025-01-31
|
||||
### Added
|
||||
|
||||
@@ -49,7 +49,6 @@ dev = [
|
||||
"isort~=6.0",
|
||||
"csvkit~=2.0",
|
||||
"ipython~=8.31",
|
||||
"black~=25.9",
|
||||
]
|
||||
|
||||
[tool.isort]
|
||||
|
||||
@@ -3,7 +3,6 @@
|
||||
import logging
|
||||
import re
|
||||
from unicodedata import normalize
|
||||
from urllib.parse import unquote
|
||||
|
||||
import country_converter as coco
|
||||
import pandas as pd
|
||||
@@ -452,8 +451,12 @@ def normalize_dois(field):
|
||||
if match:
|
||||
new_value = re.sub(pattern, "doi.org", new_value)
|
||||
|
||||
# Replace %xx escapes with their single-character equivalent.
|
||||
new_value = unquote(new_value)
|
||||
# Convert erroneous %2f to /
|
||||
pattern = re.compile("%2f")
|
||||
match = re.findall(pattern, new_value)
|
||||
|
||||
if match:
|
||||
new_value = re.sub(pattern, "/", new_value)
|
||||
|
||||
# Replace values like doi: 10.11648/j.jps.20140201.14
|
||||
pattern = re.compile(r"^doi: 10\.")
|
||||
|
||||
Reference in New Issue
Block a user