From 0941f171bbd4665e0eef5956b2f8c87acb8fc3a4 Mon Sep 17 00:00:00 2001 From: Pierre Choffet Date: Tue, 9 Jun 2026 11:03:26 -0400 Subject: [PATCH] Make RDFs merging a bit more solid and verbose --- scripts/get_merged_all.sh | 1 + scripts/rdf.sh | 7 +++++-- 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/scripts/get_merged_all.sh b/scripts/get_merged_all.sh index 548a1c3..99c9cdd 100755 --- a/scripts/get_merged_all.sh +++ b/scripts/get_merged_all.sh @@ -50,6 +50,7 @@ cp "${WDEF_PATH}" "${LAST_ITERATION_PATH}" for qid in "${WDIDS[@]}" do + echo "Processing element with QID ${qid}…" >&2 NEW_WDEF_PATH="$(mktemp)" "${SCRIPT_DIR}/get_merged_element.sh" "${LAST_ITERATION_PATH}" "${qid}" > "${NEW_WDEF_PATH}" diff --git a/scripts/rdf.sh b/scripts/rdf.sh index 7679251..811a49e 100644 --- a/scripts/rdf.sh +++ b/scripts/rdf.sh @@ -33,7 +33,10 @@ function cacheRDF() { # Create cache dir mkdir -p "${RDFS_CACHE_DIR}" - curl "${rdf_url}" > "${rdf_path}" + curl --fail --silent --retry 10 "${rdf_url}" > "${rdf_path}" + + # Crude workaround to avoid flooding the Wikidata server + sleep 1 echo "${rdf_path}" } @@ -50,7 +53,7 @@ function cacheRDFMaxAge() { local -r rdf_path="${RDFS_CACHE_DIR}${element_qid}.xml" - if [ ! -f "${rdf_path}" ]||[[ $(find "${rdf_path}" -mmin "+${max_age}") ]] + if [ ! -s "${rdf_path}" ]||[[ $(find "${rdf_path}" -mmin "+${max_age}") ]] then cacheRDF "${element_qid}" else -- 2.54.0