1
0
mirror of https://github.com/ilri/csv-metadata-quality.git synced 2024-11-22 05:45:02 +01:00

csv_metadata_quality/check.py: Prune requests cache once

We only need to prune the requests cache once before using it, not
for every value we check.
This commit is contained in:
Alan Orth 2020-07-06 13:41:51 +03:00
parent aa9e23b46c
commit 5fcaa63bd5
Signed by: alanorth
GPG Key ID: 0FB860CC9C45B1B9

View File

@@ -221,23 +221,23 @@ def agrovoc(field, field_name):
if pd.isna(field):
return
# Try to split multi-value field on "||" separator
for value in field.split("||"):
request_url = (
f"http://agrovoc.uniroma2.it/agrovoc/rest/v1/agrovoc/search?query={value}"
)
# enable transparent request cache with thirty days expiry
expire_after = timedelta(days=30)
requests_cache.install_cache(
"agrovoc-response-cache", expire_after=expire_after
)
request = requests.get(request_url)
# prune old cache entries
requests_cache.core.remove_expired_responses()
# Try to split multi-value field on "||" separator
for value in field.split("||"):
request_url = (
f"http://agrovoc.uniroma2.it/agrovoc/rest/v1/agrovoc/search?query={value}"
)
request = requests.get(request_url)
if request.status_code == requests.codes.ok:
data = request.json()