From 32a91b9ce6b208943a3498ef8be526daf91ccbd8 Mon Sep 17 00:00:00 2001
From: avdata99
Date: Tue, 28 Oct 2025 16:24:28 -0300
Subject: [PATCH] start proposal

---
 ckanext/datapusher_plus/jobs.py | 17 +++++++++++++++++
 1 file changed, 17 insertions(+)

diff --git a/ckanext/datapusher_plus/jobs.py b/ckanext/datapusher_plus/jobs.py
index 6e3f7831..e26d693e 100644
--- a/ckanext/datapusher_plus/jobs.py
+++ b/ckanext/datapusher_plus/jobs.py
@@ -1174,6 +1174,23 @@ def _push_to_datastore(task_id, input, dry_run=False, temp_dir=None):
             if conf.AUTO_INDEX_THRESHOLD:
                 headers_cardinality.append(int(fr.get("cardinality") or 0))
 
+    # Write a cleaned copy of the qsv stats CSV in which the "mean" field is
+    # empty for fields of type "Date" or "DateTime", and use that copy from
+    # here on. newline="" lets the csv module manage line endings itself.
+    new_qsv_stats_csv = os.path.join(temp_dir, "qsv_stats_cleaned.csv")
+    with open(qsv_stats_csv, mode="r", newline="") as inp, open(
+        new_qsv_stats_csv, mode="w", newline=""
+    ) as outp:
+        reader = csv.DictReader(inp)
+        writer = csv.DictWriter(outp, fieldnames=reader.fieldnames)
+        writer.writeheader()
+        for row in reader:
+            if row["type"] in ("Date", "DateTime"):
+                row["mean"] = ""
+            writer.writerow(row)
+    qsv_stats_csv = new_qsv_stats_csv
+    logger.info(f"New qsv_stats_csv types for {qsv_stats_csv}")
+
     # Get the field stats for each field in the headers list
     existing = datastore_resource_exists(resource_id)
     existing_info = None