From c559150d40a9a7d61e3c099dce7fd81736a0283e Mon Sep 17 00:00:00 2001 From: Marton Vago Date: Thu, 28 May 2026 09:19:22 +0100 Subject: [PATCH 1/5] feat: :sparkles: stage raw data --- justfile | 4 ++ scripts/stage_data.py | 133 ++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 137 insertions(+) create mode 100644 scripts/stage_data.py diff --git a/justfile b/justfile index dfe00d4..f85dfc8 100644 --- a/justfile +++ b/justfile @@ -86,3 +86,7 @@ download-data-dict: # Download data from REDCap download-data: uv run python scripts/redcap_data.py + +# Stage raw data +stage-data: + uv run python scripts/stage_data.py diff --git a/scripts/stage_data.py b/scripts/stage_data.py new file mode 100644 index 0000000..dbfe35a --- /dev/null +++ b/scripts/stage_data.py @@ -0,0 +1,133 @@ +import re +from datetime import datetime +from operator import itemgetter +from pathlib import Path +from typing import cast + +import polars as pl +import seedcase_soil as so + +VAS_TIME_FIELD_PATTERN = re.compile( + r"^vas_(?P.+?)(_fasted)?_(?P