{ "cells": [ { "cell_type": "markdown", "id": "55d5d6bb-d84c-4d62-8e99-56ce527e7f5e", "metadata": {}, "source": [ "# Imports" ] }, { "cell_type": "code", "execution_count": 1, "id": "375c7877-61c1-42f9-8123-317de9f71946", "metadata": {}, "outputs": [], "source": [ "from datetime import datetime\n", "import pandas as pd\n", "\n", "from diive.core.io.files import load_parquet, save_parquet\n", "from diive.pkgs.gapfilling.xgboost_ts import XGBoostTS" ] }, { "cell_type": "markdown", "id": "00e071a1-ccde-4b4c-80fc-e5d384327f36", "metadata": {}, "source": [ "# Load data" ] }, { "cell_type": "code", "execution_count": 2, "id": "2b4be116-7da5-4772-b830-4fa5e872e5e7", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Loaded .parquet file 17.1_CH-CHA_meteo10_2005-2024.parquet (0.048 seconds).\n", " --> Detected time resolution of <30 * Minutes> / 30min \n" ] }, { "data": { "text/html": [ "
\n", " | LW_IN_T1_2_1 | \n", "PA_GF1_0.9_1 | \n", "FLAG_PA_GF1_0.9_1_ISFILLED | \n", "PPFD_IN_T1_2_2 | \n", "FLAG_PPFD_IN_T1_2_2_ISFILLED | \n", "VPD_T1_2_1 | \n", "... | \n", "SWC_GF1_0.75_1 | \n", "TS_GF1_0.04_1 | \n", "TS_GF1_0.15_1 | \n", "TS_GF1_0.4_1 | \n", "FLAG_PREC_RAIN_TOT_GF1_0.5_1_FLUXNET_ISFILLED | \n", "TIMESINCE_PREC_RAIN_TOT_GF1_0.5_1 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
TIMESTAMP_MIDDLE | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
2005-01-01 00:15:00 | \n", "NaN | \n", "978.100000 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.099893 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "1 | \n", "
2005-01-01 00:45:00 | \n", "NaN | \n", "977.933333 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.097606 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "2 | \n", "
2005-01-01 01:15:00 | \n", "NaN | \n", "977.900000 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.091683 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0 | \n", "
2005-01-01 01:45:00 | \n", "NaN | \n", "977.833333 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.071157 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "1 | \n", "
2005-01-01 02:15:00 | \n", "NaN | \n", "977.833333 | \n", "1.0 | \n", "0.0 | \n", "0 | \n", "0.058333 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2024-12-31 21:45:00 | \n", "304.613900 | \n", "983.370890 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000011 | \n", "... | \n", "45.120877 | \n", "3.474346 | \n", "4.437078 | \n", "5.528727 | \n", "NaN | \n", "380 | \n", "
2024-12-31 22:15:00 | \n", "303.039890 | \n", "983.052160 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000011 | \n", "... | \n", "45.144937 | \n", "3.428224 | \n", "4.440415 | \n", "5.521962 | \n", "NaN | \n", "381 | \n", "
2024-12-31 22:45:00 | \n", "302.093633 | \n", "982.851140 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000011 | \n", "... | \n", "45.152280 | \n", "3.384733 | \n", "4.443751 | \n", "5.523991 | \n", "NaN | \n", "382 | \n", "
2024-12-31 23:15:00 | \n", "302.217307 | \n", "982.896827 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000010 | \n", "... | \n", "45.095043 | \n", "3.349179 | \n", "4.439747 | \n", "5.528050 | \n", "NaN | \n", "383 | \n", "
2024-12-31 23:45:00 | \n", "298.392973 | \n", "982.856613 | \n", "NaN | \n", "0.0 | \n", "0 | \n", "0.000010 | \n", "... | \n", "45.278093 | \n", "3.316919 | \n", "4.442417 | \n", "5.523991 | \n", "NaN | \n", "384 | \n", "
350640 rows × 23 columns
\n", "