{ "cells": [ { "cell_type": "markdown", "id": "55d5d6bb-d84c-4d62-8e99-56ce527e7f5e", "metadata": {}, "source": [ "# Imports" ] }, { "cell_type": "code", "execution_count": 1, "id": "375c7877-61c1-42f9-8123-317de9f71946", "metadata": {}, "outputs": [], "source": [ "from datetime import datetime\n", "import pandas as pd\n", "\n", "from diive.core.io.files import load_parquet, save_parquet\n", "from diive.pkgs.gapfilling.xgboost_ts import XGBoostTS" ] }, { "cell_type": "markdown", "id": "00e071a1-ccde-4b4c-80fc-e5d384327f36", "metadata": {}, "source": [ "# Load data" ] }, { "cell_type": "code", "execution_count": 2, "id": "2b4be116-7da5-4772-b830-4fa5e872e5e7", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Loaded .parquet file 17.3_CH-CHA_meteo10_2005-2024.parquet (0.355 seconds).\n", " --> Detected time resolution of <30 * Minutes> / 30min \n" ] }, { "data": { "text/html": [ "
\n", " | LW_IN_T1_2_1 | \n", "PA_GF1_0.9_1 | \n", "FLAG_PA_GF1_0.9_1_ISFILLED | \n", "PPFD_IN_T1_2_2 | \n", "FLAG_PPFD_IN_T1_2_2_ISFILLED | \n", "VPD_T1_2_1 | \n", "... | \n", "TS_GF1_0.04_1_gfXG | \n", "FLAG_TS_GF1_0.04_1_gfXG_ISFILLED | \n", "TS_GF1_0.15_1_gfXG | \n", "FLAG_TS_GF1_0.15_1_gfXG_ISFILLED | \n", "TS_GF1_0.4_1_gfXG | \n", "FLAG_TS_GF1_0.4_1_gfXG_ISFILLED | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
TIMESTAMP_MIDDLE | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
2005-01-01 00:15:00 | \n", "NaN | \n", "978.100000 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.099893 | \n", "... | \n", "1.014525 | \n", "1 | \n", "2.907254 | \n", "1 | \n", "4.007686 | \n", "1 | \n", "
2005-01-01 00:45:00 | \n", "NaN | \n", "977.933333 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.097606 | \n", "... | \n", "1.029936 | \n", "1 | \n", "2.907254 | \n", "1 | \n", "4.007686 | \n", "1 | \n", "
2005-01-01 01:15:00 | \n", "NaN | \n", "977.900000 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.091683 | \n", "... | \n", "1.003078 | \n", "1 | \n", "2.903765 | \n", "1 | \n", "4.077782 | \n", "1 | \n", "
2005-01-01 01:45:00 | \n", "NaN | \n", "977.833333 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.071157 | \n", "... | \n", "1.056877 | \n", "1 | \n", "2.903765 | \n", "1 | \n", "4.077782 | \n", "1 | \n", "
2005-01-01 02:15:00 | \n", "NaN | \n", "977.833333 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.058333 | \n", "... | \n", "0.963062 | \n", "1 | \n", "2.932330 | \n", "1 | \n", "3.979915 | \n", "1 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2024-12-31 21:45:00 | \n", "304.613900 | \n", "983.370890 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000011 | \n", "... | \n", "3.474346 | \n", "0 | \n", "4.437078 | \n", "0 | \n", "5.528727 | \n", "0 | \n", "
2024-12-31 22:15:00 | \n", "303.039890 | \n", "983.052160 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000011 | \n", "... | \n", "3.428224 | \n", "0 | \n", "4.440415 | \n", "0 | \n", "5.521962 | \n", "0 | \n", "
2024-12-31 22:45:00 | \n", "302.093633 | \n", "982.851140 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000011 | \n", "... | \n", "3.384733 | \n", "0 | \n", "4.443751 | \n", "0 | \n", "5.523991 | \n", "0 | \n", "
2024-12-31 23:15:00 | \n", "302.217307 | \n", "982.896827 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000010 | \n", "... | \n", "3.349179 | \n", "0 | \n", "4.439747 | \n", "0 | \n", "5.528050 | \n", "0 | \n", "
2024-12-31 23:45:00 | \n", "298.392973 | \n", "982.856613 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000010 | \n", "... | \n", "3.316919 | \n", "0 | \n", "4.442417 | \n", "0 | \n", "5.523991 | \n", "0 | \n", "
350640 rows × 29 columns
\n", "\n", " | SWC_GF1_0.05_1 | \n", "SWC_GF1_0.15_1 | \n", "SWC_GF1_0.75_1 | \n", "
---|---|---|---|
TIMESTAMP_MIDDLE | \n", "\n", " | \n", " | \n", " |
2005-12-31 | \n", "3213 | \n", "3213 | \n", "3213 | \n", "
2006-12-31 | \n", "17452 | \n", "17428 | \n", "17434 | \n", "
2007-12-31 | \n", "17501 | \n", "17503 | \n", "17502 | \n", "
2008-12-31 | \n", "17560 | \n", "17554 | \n", "17558 | \n", "
2009-12-31 | \n", "17504 | \n", "17505 | \n", "17506 | \n", "
2010-12-31 | \n", "10879 | \n", "16539 | \n", "16536 | \n", "
2011-12-31 | \n", "17021 | \n", "17018 | \n", "17013 | \n", "
2012-12-31 | \n", "17267 | \n", "17268 | \n", "17267 | \n", "
2013-12-31 | \n", "17513 | \n", "17512 | \n", "17514 | \n", "
2014-12-31 | \n", "17503 | \n", "17507 | \n", "17507 | \n", "
2015-12-31 | \n", "17496 | \n", "17496 | \n", "17493 | \n", "
2016-12-31 | \n", "16075 | \n", "16101 | \n", "16092 | \n", "
2017-12-31 | \n", "17413 | \n", "17413 | \n", "17413 | \n", "
2018-12-31 | \n", "17085 | \n", "17085 | \n", "17085 | \n", "
2019-12-31 | \n", "17394 | \n", "17394 | \n", "17394 | \n", "
2020-12-31 | \n", "16867 | \n", "16867 | \n", "16867 | \n", "
2021-12-31 | \n", "14497 | \n", "14497 | \n", "17466 | \n", "
2022-12-31 | \n", "17516 | \n", "17517 | \n", "17515 | \n", "
2023-12-31 | \n", "17520 | \n", "17520 | \n", "17515 | \n", "
2024-12-31 | \n", "17540 | \n", "17540 | \n", "17534 | \n", "