{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "a59b5d8f-1845-4015-9b52-d372b2c9bb5a", "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import time\n", "import normet as nm\n", "import matplotlib.pyplot as plt\n", "import matplotlib\n", "from pylab import savefig" ] }, { "cell_type": "code", "execution_count": 2, "id": "e57ad0c9-8c5f-40ca-a98d-109676b91612", "metadata": {}, "outputs": [], "source": [ "df1=pd.read_csv(r'data/MY1_data.csv',parse_dates=['date'],index_col='date')" ] }, { "cell_type": "code", "execution_count": 3, "id": "dddce35f-4638-4b5c-84d2-a7bda5ef4c36", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | O3 | \n", "NO | \n", "NO2 | \n", "NOXasNO2 | \n", "SO2 | \n", "CO | \n", "PM10 | \n", "NV10 | \n", "V10 | \n", "PM2.5 | \n", "... | \n", "d2m | \n", "t2m | \n", "blh | \n", "sp | \n", "ssrd | \n", "tcc | \n", "tp | \n", "rh2m | \n", "lat | \n", "lon | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| date | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
| 2020-01-01 00:00:00 | \n", "1.72961 | \n", "78.38595 | \n", "45.77784 | \n", "165.96796 | \n", "4.75424 | \n", "NaN | \n", "69.0 | \n", "60.0 | \n", "9.0 | \n", "58.1 | \n", "... | \n", "277.183465 | \n", "278.394725 | \n", "384.209053 | \n", "102252.303312 | \n", "-1.164153e-10 | \n", "0.650958 | \n", "0.000008 | \n", "91.884130 | \n", "51.52253 | \n", "-0.154611 | \n", "
| 2020-01-01 01:00:00 | \n", "1.92918 | \n", "88.61587 | \n", "52.64325 | \n", "188.51903 | \n", "4.84394 | \n", "0.397528 | \n", "45.0 | \n", "38.4 | \n", "6.6 | \n", "43.2 | \n", "... | \n", "276.695430 | \n", "277.772899 | \n", "353.220263 | \n", "102211.168636 | \n", "-1.164153e-10 | \n", "0.603699 | \n", "0.000002 | \n", "92.715877 | \n", "51.52253 | \n", "-0.154611 | \n", "
| 2020-01-01 02:00:00 | \n", "1.99570 | \n", "70.02935 | \n", "44.76870 | \n", "152.14554 | \n", "3.09474 | \n", "0.346417 | \n", "46.2 | \n", "39.1 | \n", "7.1 | \n", "43.0 | \n", "... | \n", "276.505662 | \n", "277.463419 | \n", "255.911846 | \n", "102174.855967 | \n", "-1.164153e-10 | \n", "0.710378 | \n", "0.000005 | \n", "93.485560 | \n", "51.52253 | \n", "-0.154611 | \n", "
| 2020-01-01 03:00:00 | \n", "2.04559 | \n", "67.58589 | \n", "40.20699 | \n", "143.83725 | \n", "2.96019 | \n", "0.335059 | \n", "45.1 | \n", "38.8 | \n", "6.3 | \n", "42.8 | \n", "... | \n", "276.412816 | \n", "277.305813 | \n", "191.375560 | \n", "102166.786485 | \n", "-1.164153e-10 | \n", "0.837765 | \n", "0.000005 | \n", "93.906363 | \n", "51.52253 | \n", "-0.154611 | \n", "
| 2020-01-01 04:00:00 | \n", "2.99355 | \n", "72.03298 | \n", "47.26010 | \n", "157.70912 | \n", "3.83478 | \n", "0.349257 | \n", "40.8 | \n", "34.2 | \n", "6.6 | \n", "36.8 | \n", "... | \n", "276.553051 | \n", "277.478941 | \n", "151.780210 | \n", "102142.578039 | \n", "-1.164153e-10 | \n", "0.819103 | \n", "0.000003 | \n", "93.696878 | \n", "51.52253 | \n", "-0.154611 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2020-12-31 19:00:00 | \n", "20.70539 | \n", "12.46950 | \n", "30.47461 | \n", "49.59424 | \n", "1.12164 | \n", "0.129904 | \n", "13.9 | \n", "11.8 | \n", "2.1 | \n", "11.7 | \n", "... | \n", "272.197565 | \n", "273.557442 | \n", "476.945688 | \n", "99902.506413 | \n", "-5.820766e-11 | \n", "0.918149 | \n", "0.000000 | \n", "90.582979 | \n", "51.52253 | \n", "-0.154611 | \n", "
| 2020-12-31 20:00:00 | \n", "24.14797 | \n", "9.65279 | \n", "26.51175 | \n", "41.31249 | \n", "1.12164 | \n", "0.094180 | \n", "14.6 | \n", "11.3 | \n", "3.3 | \n", "11.0 | \n", "... | \n", "272.171041 | \n", "273.629146 | \n", "486.665851 | \n", "99947.625909 | \n", "-5.820766e-11 | \n", "0.839639 | \n", "0.000000 | \n", "89.939908 | \n", "51.52253 | \n", "-0.154611 | \n", "
| 2020-12-31 21:00:00 | \n", "25.69464 | \n", "12.46950 | \n", "28.45232 | \n", "47.57196 | \n", "1.36199 | \n", "0.087685 | \n", "16.6 | \n", "13.0 | \n", "3.6 | \n", "15.3 | \n", "... | \n", "272.087408 | \n", "273.470592 | \n", "489.355002 | \n", "100000.215520 | \n", "-5.820766e-11 | \n", "0.739354 | \n", "0.000000 | \n", "90.422188 | \n", "51.52253 | \n", "-0.154611 | \n", "
| 2020-12-31 22:00:00 | \n", "26.39313 | \n", "6.45629 | \n", "25.05721 | \n", "34.95672 | \n", "0.88129 | \n", "0.084437 | \n", "19.1 | \n", "16.0 | \n", "3.1 | \n", "17.1 | \n", "... | \n", "272.235319 | \n", "272.926062 | \n", "40.714872 | \n", "100042.844978 | \n", "-5.820766e-11 | \n", "0.643753 | \n", "0.000000 | \n", "95.088677 | \n", "51.52253 | \n", "-0.154611 | \n", "
| 2020-12-31 23:00:00 | \n", "27.93980 | \n", "6.61453 | \n", "22.07004 | \n", "32.21218 | \n", "0.88129 | \n", "0.087685 | \n", "17.6 | \n", "13.2 | \n", "4.4 | \n", "15.2 | \n", "... | \n", "272.020979 | \n", "272.681367 | \n", "55.617254 | \n", "100053.601944 | \n", "-5.820766e-11 | \n", "0.549403 | \n", "0.000000 | \n", "95.290673 | \n", "51.52253 | \n", "-0.154611 | \n", "
8784 rows × 65 columns
\n", "AutoML(append_log=False, auto_augment=True, custom_hp={},\n",
" cv_score_agg_func=None, early_stop=False, ensemble=False,\n",
" estimator_list='auto', eval_method='auto', fit_kwargs_by_estimator={},\n",
" force_cancel=False, free_mem_ratio=0, hpo_method='auto',\n",
" keep_search_state=False, learner_selector='sample', log_file_name='',\n",
" log_training_metric=False, log_type='better', max_iter=None,\n",
" mem_thres=4294967296, metric='auto', metric_constraints=[],\n",
" min_sample_size=10000, mlflow_logging=True, model_history=False,\n",
" n_concurrent_trials=1, n_jobs=-1, n_splits=5, pred_time_limit=inf,\n",
" preserve_checkpoint=True, retrain_full=True, ...)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. AutoML(append_log=False, auto_augment=True, custom_hp={},\n",
" cv_score_agg_func=None, early_stop=False, ensemble=False,\n",
" estimator_list='auto', eval_method='auto', fit_kwargs_by_estimator={},\n",
" force_cancel=False, free_mem_ratio=0, hpo_method='auto',\n",
" keep_search_state=False, learner_selector='sample', log_file_name='',\n",
" log_training_metric=False, log_type='better', max_iter=None,\n",
" mem_thres=4294967296, metric='auto', metric_constraints=[],\n",
" min_sample_size=10000, mlflow_logging=True, model_history=False,\n",
" n_concurrent_trials=1, n_jobs=-1, n_splits=5, pred_time_limit=inf,\n",
" preserve_checkpoint=True, retrain_full=True, ...)| H2O_cluster_uptime: | \n", "3 hours 59 mins |
| H2O_cluster_timezone: | \n", "Europe/London |
| H2O_data_parsing_timezone: | \n", "UTC |
| H2O_cluster_version: | \n", "3.46.0.5 |
| H2O_cluster_version_age: | \n", "26 days |
| H2O_cluster_name: | \n", "H2O_from_python_n94921cs_5qrqdn |
| H2O_cluster_total_nodes: | \n", "1 |
| H2O_cluster_free_memory: | \n", "7.572 Gb |
| H2O_cluster_total_cores: | \n", "8 |
| H2O_cluster_allowed_cores: | \n", "1 |
| H2O_cluster_status: | \n", "locked, healthy |
| H2O_connection_url: | \n", "http://localhost:54321 |
| H2O_connection_proxy: | \n", "{\"http\": null, \"https\": null} |
| H2O_internal_security: | \n", "False |
| Python_version: | \n", "3.12.2 final |
Model Details\n",
"=============\n",
"H2OGradientBoostingEstimator : Gradient Boosting Machine\n",
"Model Key: GBM_grid_1_AutoML_4_20240924_162158_model_2\n",
"\n",
"| \n", " | number_of_trees | \n", "number_of_internal_trees | \n", "model_size_in_bytes | \n", "min_depth | \n", "max_depth | \n", "mean_depth | \n", "min_leaves | \n", "max_leaves | \n", "mean_leaves |
|---|---|---|---|---|---|---|---|---|---|
| \n", " | 69.0 | \n", "69.0 | \n", "1189276.0 | \n", "13.0 | \n", "13.0 | \n", "13.0 | \n", "625.0 | \n", "1942.0 | \n", "1369.2754 |
ModelMetricsRegression: gbm\n",
"** Reported on train data. **\n",
"\n",
"MSE: 0.011242541344013361\n",
"RMSE: 0.10603085090676846\n",
"MAE: 0.07893400538333294\n",
"RMSLE: NaN\n",
"Mean Residual Deviance: 0.011242541344013361ModelMetricsRegression: gbm\n",
"** Reported on cross-validation data. **\n",
"\n",
"MSE: 8.126360199772725\n",
"RMSE: 2.850677147586644\n",
"MAE: 1.9222905950632483\n",
"RMSLE: NaN\n",
"Mean Residual Deviance: 8.126360199772725| \n", " | mean | \n", "sd | \n", "cv_1_valid | \n", "cv_2_valid | \n", "cv_3_valid | \n", "cv_4_valid | \n", "cv_5_valid |
|---|---|---|---|---|---|---|---|
| aic | \n", "nan | \n", "0.0 | \n", "nan | \n", "nan | \n", "nan | \n", "nan | \n", "nan |
| loglikelihood | \n", "nan | \n", "0.0 | \n", "nan | \n", "nan | \n", "nan | \n", "nan | \n", "nan |
| mae | \n", "1.9222906 | \n", "0.0324555 | \n", "1.9084675 | \n", "1.9052794 | \n", "1.888859 | \n", "1.9710108 | \n", "1.9378362 |
| mean_residual_deviance | \n", "8.12636 | \n", "0.6548642 | \n", "8.182448 | \n", "7.1749625 | \n", "7.8459816 | \n", "8.850865 | \n", "8.577542 |
| mse | \n", "8.12636 | \n", "0.6548642 | \n", "8.182448 | \n", "7.1749625 | \n", "7.8459816 | \n", "8.850865 | \n", "8.577542 |
| r2 | \n", "0.8793102 | \n", "0.0095628 | \n", "0.8805432 | \n", "0.8902119 | \n", "0.8867002 | \n", "0.8692322 | \n", "0.8698634 |
| residual_deviance | \n", "8.12636 | \n", "0.6548642 | \n", "8.182448 | \n", "7.1749625 | \n", "7.8459816 | \n", "8.850865 | \n", "8.577542 |
| rmse | \n", "2.8487926 | \n", "0.1158737 | \n", "2.860498 | \n", "2.678612 | \n", "2.801068 | \n", "2.9750404 | \n", "2.928744 |
| rmsle | \n", "nan | \n", "0.0 | \n", "nan | \n", "nan | \n", "nan | \n", "nan | \n", "nan |
| \n", " | timestamp | \n", "duration | \n", "number_of_trees | \n", "training_rmse | \n", "training_mae | \n", "training_deviance |
|---|---|---|---|---|---|---|
| \n", " | 2024-09-24 16:22:28 | \n", "7.661 sec | \n", "0.0 | \n", "8.2062346 | \n", "5.4746640 | \n", "67.3422868 |
| \n", " | 2024-09-24 16:22:28 | \n", "7.723 sec | \n", "5.0 | \n", "5.0442433 | \n", "3.4151840 | \n", "25.4443903 |
| \n", " | 2024-09-24 16:22:28 | \n", "7.779 sec | \n", "10.0 | \n", "3.1914116 | \n", "2.2053144 | \n", "10.1851080 |
| \n", " | 2024-09-24 16:22:28 | \n", "7.835 sec | \n", "15.0 | \n", "2.0162629 | \n", "1.4358716 | \n", "4.0653160 |
| \n", " | 2024-09-24 16:22:28 | \n", "7.892 sec | \n", "20.0 | \n", "1.3258726 | \n", "0.9765391 | \n", "1.7579382 |
| \n", " | 2024-09-24 16:22:28 | \n", "7.957 sec | \n", "25.0 | \n", "0.8801164 | \n", "0.6675258 | \n", "0.7746049 |
| \n", " | 2024-09-24 16:22:28 | \n", "8.014 sec | \n", "30.0 | \n", "0.6213492 | \n", "0.4796348 | \n", "0.3860749 |
| \n", " | 2024-09-24 16:22:28 | \n", "8.067 sec | \n", "35.0 | \n", "0.4578002 | \n", "0.3572500 | \n", "0.2095810 |
| \n", " | 2024-09-24 16:22:28 | \n", "8.132 sec | \n", "40.0 | \n", "0.3379802 | \n", "0.2647451 | \n", "0.1142306 |
| \n", " | 2024-09-24 16:22:28 | \n", "8.191 sec | \n", "45.0 | \n", "0.2648459 | \n", "0.2051404 | \n", "0.0701433 |
| \n", " | 2024-09-24 16:22:28 | \n", "8.251 sec | \n", "50.0 | \n", "0.2069501 | \n", "0.1595394 | \n", "0.0428284 |
| \n", " | 2024-09-24 16:22:28 | \n", "8.305 sec | \n", "55.0 | \n", "0.1663724 | \n", "0.1275311 | \n", "0.0276798 |
| \n", " | 2024-09-24 16:22:28 | \n", "8.354 sec | \n", "60.0 | \n", "0.1397592 | \n", "0.1064105 | \n", "0.0195326 |
| \n", " | 2024-09-24 16:22:28 | \n", "8.408 sec | \n", "65.0 | \n", "0.1167263 | \n", "0.0878304 | \n", "0.0136250 |
| \n", " | 2024-09-24 16:22:29 | \n", "8.495 sec | \n", "69.0 | \n", "0.1060309 | \n", "0.0789340 | \n", "0.0112425 |
| variable | \n", "relative_importance | \n", "scaled_importance | \n", "percentage |
|---|---|---|---|
| u10 | \n", "251463.8437500 | \n", "1.0 | \n", "0.1484518 |
| blh | \n", "210509.4843750 | \n", "0.8371362 | \n", "0.1242744 |
| d2m | \n", "202005.6875000 | \n", "0.8033190 | \n", "0.1192542 |
| day_julian | \n", "201374.0937500 | \n", "0.8008073 | \n", "0.1188813 |
| sp | \n", "158984.7187500 | \n", "0.6322369 | \n", "0.0938567 |
| date_unix | \n", "130323.0937500 | \n", "0.5182578 | \n", "0.0769363 |
| t2m | \n", "108348.5078125 | \n", "0.4308711 | \n", "0.0639636 |
| v10 | \n", "87987.5078125 | \n", "0.3499012 | \n", "0.0519435 |
| weekday | \n", "81752.5156250 | \n", "0.3251064 | \n", "0.0482626 |
| rh2m | \n", "80490.9296875 | \n", "0.3200895 | \n", "0.0475179 |
| hour | \n", "61422.0507812 | \n", "0.2442580 | \n", "0.0362605 |
| tcc | \n", "57315.1562500 | \n", "0.2279260 | \n", "0.0338360 |
| ssrd | \n", "46235.0937500 | \n", "0.1838638 | \n", "0.0272949 |
| tp | \n", "15695.9404297 | \n", "0.0624183 | \n", "0.0092661 |
\n",
"\n",
"[tips]\n",
"Use `model.explain()` to inspect the model.\n",
"--\n",
"Use `h2o.display.toggle_user_tips()` to switch on/off this section."
],
"text/plain": [
"Model Details\n",
"=============\n",
"H2OGradientBoostingEstimator : Gradient Boosting Machine\n",
"Model Key: GBM_grid_1_AutoML_4_20240924_162158_model_2\n",
"\n",
"\n",
"Model Summary: \n",
" number_of_trees number_of_internal_trees model_size_in_bytes min_depth max_depth mean_depth min_leaves max_leaves mean_leaves\n",
"-- ----------------- -------------------------- --------------------- ----------- ----------- ------------ ------------ ------------ -------------\n",
" 69 69 1.18928e+06 13 13 13 625 1942 1369.28\n",
"\n",
"ModelMetricsRegression: gbm\n",
"** Reported on train data. **\n",
"\n",
"MSE: 0.011242541344013361\n",
"RMSE: 0.10603085090676846\n",
"MAE: 0.07893400538333294\n",
"RMSLE: NaN\n",
"Mean Residual Deviance: 0.011242541344013361\n",
"\n",
"ModelMetricsRegression: gbm\n",
"** Reported on cross-validation data. **\n",
"\n",
"MSE: 8.126360199772725\n",
"RMSE: 2.850677147586644\n",
"MAE: 1.9222905950632483\n",
"RMSLE: NaN\n",
"Mean Residual Deviance: 8.126360199772725\n",
"\n",
"Cross-Validation Metrics Summary: \n",
" mean sd cv_1_valid cv_2_valid cv_3_valid cv_4_valid cv_5_valid\n",
"---------------------- ------- ---------- ------------ ------------ ------------ ------------ ------------\n",
"aic nan 0 nan nan nan nan nan\n",
"loglikelihood nan 0 nan nan nan nan nan\n",
"mae 1.92229 0.0324555 1.90847 1.90528 1.88886 1.97101 1.93784\n",
"mean_residual_deviance 8.12636 0.654864 8.18245 7.17496 7.84598 8.85087 8.57754\n",
"mse 8.12636 0.654864 8.18245 7.17496 7.84598 8.85087 8.57754\n",
"r2 0.87931 0.00956279 0.880543 0.890212 0.8867 0.869232 0.869863\n",
"residual_deviance 8.12636 0.654864 8.18245 7.17496 7.84598 8.85087 8.57754\n",
"rmse 2.84879 0.115874 2.8605 2.67861 2.80107 2.97504 2.92874\n",
"rmsle nan 0 nan nan nan nan nan\n",
"\n",
"Scoring History: \n",
" timestamp duration number_of_trees training_rmse training_mae training_deviance\n",
"-- ------------------- ---------- ----------------- --------------- -------------- -------------------\n",
" 2024-09-24 16:22:28 7.661 sec 0 8.20623 5.47466 67.3423\n",
" 2024-09-24 16:22:28 7.723 sec 5 5.04424 3.41518 25.4444\n",
" 2024-09-24 16:22:28 7.779 sec 10 3.19141 2.20531 10.1851\n",
" 2024-09-24 16:22:28 7.835 sec 15 2.01626 1.43587 4.06532\n",
" 2024-09-24 16:22:28 7.892 sec 20 1.32587 0.976539 1.75794\n",
" 2024-09-24 16:22:28 7.957 sec 25 0.880116 0.667526 0.774605\n",
" 2024-09-24 16:22:28 8.014 sec 30 0.621349 0.479635 0.386075\n",
" 2024-09-24 16:22:28 8.067 sec 35 0.4578 0.35725 0.209581\n",
" 2024-09-24 16:22:28 8.132 sec 40 0.33798 0.264745 0.114231\n",
" 2024-09-24 16:22:28 8.191 sec 45 0.264846 0.20514 0.0701433\n",
" 2024-09-24 16:22:28 8.251 sec 50 0.20695 0.159539 0.0428284\n",
" 2024-09-24 16:22:28 8.305 sec 55 0.166372 0.127531 0.0276798\n",
" 2024-09-24 16:22:28 8.354 sec 60 0.139759 0.10641 0.0195326\n",
" 2024-09-24 16:22:28 8.408 sec 65 0.116726 0.0878304 0.013625\n",
" 2024-09-24 16:22:29 8.495 sec 69 0.106031 0.078934 0.0112425\n",
"\n",
"Variable Importances: \n",
"variable relative_importance scaled_importance percentage\n",
"---------- --------------------- ------------------- ------------\n",
"u10 251464 1 0.148452\n",
"blh 210509 0.837136 0.124274\n",
"d2m 202006 0.803319 0.119254\n",
"day_julian 201374 0.800807 0.118881\n",
"sp 158985 0.632237 0.0938567\n",
"date_unix 130323 0.518258 0.0769363\n",
"t2m 108349 0.430871 0.0639636\n",
"v10 87987.5 0.349901 0.0519435\n",
"weekday 81752.5 0.325106 0.0482626\n",
"rh2m 80490.9 0.320089 0.0475179\n",
"hour 61422.1 0.244258 0.0362605\n",
"tcc 57315.2 0.227926 0.033836\n",
"ssrd 46235.1 0.183864 0.0272949\n",
"tp 15695.9 0.0624183 0.00926611\n",
"\n",
"[tips]\n",
"Use `model.explain()` to inspect the model.\n",
"--\n",
"Use `h2o.display.toggle_user_tips()` to switch on/off this section."
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"model2"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "82a03561-0d6a-42b1-9fc4-f02d9db67a3e",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"\u001b[0;31mSignature:\u001b[0m\n",
"\u001b[0mnm\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtrain_model\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m \u001b[0mdf\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m \u001b[0mvalue\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m'value'\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m \u001b[0mautoml_pkg\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m'flaml'\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m \u001b[0mmodel_config\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m \u001b[0mseed\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m7654321\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m \u001b[0mn_cores\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m \u001b[0mverbose\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
"\u001b[0;34m\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;31mDocstring:\u001b[0m\n",
"Trains a machine learning model using either FLAML or H2O AutoML.\n",
"\n",
"Parameters:\n",
" df (pandas.DataFrame): Input dataset to train the model.\n",
" value (str): The name of the target column in the dataset. Default is \"value\".\n",
" automl_pkg (str): The AutoML package to use (\"flaml\" or \"h2o\").\n",
" variables (list, optional): List of feature variables to use for training.\n",
" model_config (dict, optional): Configuration settings for the model training.\n",
" seed (int, optional): Random seed for reproducibility. Default is 7654321.\n",
" n_cores (int, optional): Number of CPU cores to use for training. Default is None.\n",
" verbose (bool, optional): Whether to print detailed logs. Default is True.\n",
"\n",
"Returns:\n",
" model: Trained machine learning model with a custom attribute `_model_type` indicating the package used.\n",
"\u001b[0;31mFile:\u001b[0m ~/anaconda3/envs/normet/lib/python3.12/site-packages/normet/normet.py\n",
"\u001b[0;31mType:\u001b[0m function"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"?nm.train_model"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "050656cc-fb2e-499c-95cf-79583f6c7935",
"metadata": {},
"outputs": [],
"source": [
"# Compute model statistics for model1 on df1a via normet's modStats.\n",
"mod_stats1 = nm.modStats(df1a, model1)"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "75312c50-9ebd-4adc-ab80-60dedad38611",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"| \n", " | n | \n", "FAC2 | \n", "MB | \n", "MGE | \n", "NMB | \n", "NMGE | \n", "RMSE | \n", "r | \n", "p_level | \n", "COE | \n", "IOA | \n", "R2 | \n", "set | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "4780 | \n", "0.987238 | \n", "-0.000007 | \n", "0.268328 | \n", "-7.437997e-07 | \n", "0.029447 | \n", "0.351283 | \n", "0.999110 | \n", "*** | \n", "0.950987 | \n", "0.975494 | \n", "0.998222 | \n", "training | \n", "
| 1 | \n", "1593 | \n", "0.907721 | \n", "0.090223 | \n", "1.920277 | \n", "9.806910e-03 | \n", "0.208727 | \n", "2.699133 | \n", "0.940890 | \n", "*** | \n", "0.650259 | \n", "0.825129 | \n", "0.885274 | \n", "testing | \n", "
| 2 | \n", "6373 | \n", "0.967362 | \n", "0.022547 | \n", "0.681250 | \n", "2.468418e-03 | \n", "0.074582 | \n", "1.383329 | \n", "0.985535 | \n", "*** | \n", "0.875668 | \n", "0.937834 | \n", "0.971279 | \n", "all | \n", "
| \n", " | n | \n", "FAC2 | \n", "MB | \n", "MGE | \n", "NMB | \n", "NMGE | \n", "RMSE | \n", "r | \n", "p_level | \n", "COE | \n", "IOA | \n", "R2 | \n", "set | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "4780 | \n", "0.994142 | \n", "2.145110e-08 | \n", "0.078934 | \n", "2.354070e-09 | \n", "0.008662 | \n", "0.106031 | \n", "0.999923 | \n", "*** | \n", "0.985582 | \n", "0.992791 | \n", "0.999846 | \n", "training | \n", "
| 1 | \n", "1593 | \n", "0.901444 | \n", "1.458128e-01 | \n", "1.952102 | \n", "1.584932e-02 | \n", "0.212186 | \n", "2.753047 | \n", "0.939557 | \n", "*** | \n", "0.644462 | \n", "0.822231 | \n", "0.882767 | \n", "testing | \n", "
| 2 | \n", "6373 | \n", "0.970971 | \n", "3.644749e-02 | \n", "0.547153 | \n", "3.990205e-03 | \n", "0.059901 | \n", "1.379475 | \n", "0.985645 | \n", "*** | \n", "0.900142 | \n", "0.950071 | \n", "0.971496 | \n", "all | \n", "
| \n", " | date | \n", "observed | \n", "normalised | \n", "seed | \n", "
|---|---|---|---|---|
| 0 | \n", "2020-01-01 00:00:00 | \n", "58.1 | \n", "17.221536 | \n", "979812 | \n", "
| 1 | \n", "2020-01-01 01:00:00 | \n", "43.2 | \n", "32.937436 | \n", "979812 | \n", "
| 2 | \n", "2020-01-01 02:00:00 | \n", "43.0 | \n", "24.423807 | \n", "979812 | \n", "
| 3 | \n", "2020-01-01 03:00:00 | \n", "42.8 | \n", "23.372347 | \n", "979812 | \n", "
| 4 | \n", "2020-01-01 04:00:00 | \n", "36.8 | \n", "26.478917 | \n", "979812 | \n", "
| \n", " | u10 | \n", "v10 | \n", "d2m | \n", "t2m | \n", "blh | \n", "sp | \n", "ssrd | \n", "tcc | \n", "tp | \n", "rh2m | \n", "
|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "-2.720528 | \n", "1.545010 | \n", "277.183465 | \n", "278.394725 | \n", "384.209053 | \n", "102252.303312 | \n", "-1.164153e-10 | \n", "0.650958 | \n", "0.000008 | \n", "91.884130 | \n", "
| 1 | \n", "-2.308789 | \n", "1.282742 | \n", "276.695430 | \n", "277.772899 | \n", "353.220263 | \n", "102211.168636 | \n", "-1.164153e-10 | \n", "0.603699 | \n", "0.000002 | \n", "92.715877 | \n", "
| 2 | \n", "-2.216471 | \n", "0.758730 | \n", "276.505662 | \n", "277.463419 | \n", "255.911846 | \n", "102174.855967 | \n", "-1.164153e-10 | \n", "0.710378 | \n", "0.000005 | \n", "93.485560 | \n", "
| 3 | \n", "-1.928623 | \n", "0.509013 | \n", "276.412816 | \n", "277.305813 | \n", "191.375560 | \n", "102166.786485 | \n", "-1.164153e-10 | \n", "0.837765 | \n", "0.000005 | \n", "93.906363 | \n", "
| 4 | \n", "-1.700043 | \n", "0.607069 | \n", "276.553051 | \n", "277.478941 | \n", "151.780210 | \n", "102142.578039 | \n", "-1.164153e-10 | \n", "0.819103 | \n", "0.000003 | \n", "93.696878 | \n", "
| \n", " | observed | \n", "normalised_979812 | \n", "normalised_378829 | \n", "normalised_120727 | \n", "normalised_541475 | \n", "normalised_488292 | \n", "mean | \n", "std | \n", "median | \n", "lower_bound | \n", "upper_bound | \n", "weighted | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| date | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
| 2020-01-01 00:00:00 | \n", "58.1 | \n", "30.252205 | \n", "26.007282 | \n", "21.472511 | \n", "13.609010 | \n", "13.521217 | \n", "20.972445 | \n", "6.655142 | \n", "21.472511 | \n", "13.529996 | \n", "29.827713 | \n", "20.220786 | \n", "
| 2020-01-01 01:00:00 | \n", "43.2 | \n", "30.718119 | \n", "22.379913 | \n", "22.043467 | \n", "11.979618 | \n", "14.756184 | \n", "20.375460 | \n", "6.570192 | \n", "22.043467 | \n", "12.257275 | \n", "29.884298 | \n", "18.638353 | \n", "
| 2020-01-01 02:00:00 | \n", "43.0 | \n", "30.120009 | \n", "21.627895 | \n", "20.220487 | \n", "13.131916 | \n", "14.394936 | \n", "19.899048 | \n", "6.060521 | \n", "20.220487 | \n", "13.258218 | \n", "29.270797 | \n", "18.202305 | \n", "
| 2020-01-01 03:00:00 | \n", "42.8 | \n", "28.591281 | \n", "21.836566 | \n", "22.887696 | \n", "11.813100 | \n", "12.544112 | \n", "19.534551 | \n", "6.435126 | \n", "21.836566 | \n", "11.886201 | \n", "28.020922 | \n", "18.432641 | \n", "
| 2020-01-01 04:00:00 | \n", "36.8 | \n", "30.390922 | \n", "21.896232 | \n", "21.653471 | \n", "12.113235 | \n", "12.944652 | \n", "19.799702 | \n", "6.724275 | \n", "21.653471 | \n", "12.196376 | \n", "29.541453 | \n", "18.257228 | \n", "
| \n", " | observed | \n", "base | \n", "date_unix | \n", "day_julian | \n", "weekday | \n", "hour | \n", "deweathered | \n", "emi_noise | \n", "
|---|---|---|---|---|---|---|---|---|
| date | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
| 2020-01-01 00:00:00 | \n", "58.1 | \n", "9.834232 | \n", "18.762883 | \n", "3.617389 | \n", "0.991752 | \n", "0.271323 | \n", "24.320077 | \n", "0.676729 | \n", "
| 2020-01-01 01:00:00 | \n", "43.2 | \n", "9.211363 | \n", "19.549169 | \n", "3.381027 | \n", "0.795226 | \n", "0.420953 | \n", "24.200235 | \n", "0.053860 | \n", "
| 2020-01-01 02:00:00 | \n", "43.0 | \n", "8.740657 | \n", "18.760258 | \n", "4.192777 | \n", "0.800782 | \n", "-0.187559 | \n", "23.149413 | \n", "-0.416846 | \n", "
| 2020-01-01 03:00:00 | \n", "42.8 | \n", "8.869214 | \n", "18.804496 | \n", "3.959970 | \n", "0.529601 | \n", "-0.208110 | \n", "22.797669 | \n", "-0.288289 | \n", "
| 2020-01-01 04:00:00 | \n", "36.8 | \n", "8.184215 | \n", "19.394484 | \n", "3.038679 | \n", "0.761000 | \n", "0.107604 | \n", "22.328479 | \n", "-0.973288 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2020-12-31 19:00:00 | \n", "11.7 | \n", "8.621910 | \n", "12.759990 | \n", "0.336607 | \n", "-0.046839 | \n", "0.406496 | \n", "12.920661 | \n", "-0.535593 | \n", "
| 2020-12-31 20:00:00 | \n", "11.0 | \n", "8.749583 | \n", "12.430059 | \n", "0.528524 | \n", "-0.321991 | \n", "0.086078 | \n", "12.314750 | \n", "-0.407920 | \n", "
| 2020-12-31 21:00:00 | \n", "15.3 | \n", "8.957951 | \n", "12.361814 | \n", "0.078852 | \n", "-0.219580 | \n", "0.304223 | \n", "12.325758 | \n", "-0.199552 | \n", "
| 2020-12-31 22:00:00 | \n", "17.1 | \n", "11.150086 | \n", "10.425434 | \n", "0.642186 | \n", "-0.419770 | \n", "0.013659 | \n", "12.654092 | \n", "1.992583 | \n", "
| 2020-12-31 23:00:00 | \n", "15.2 | \n", "8.579548 | \n", "12.403958 | \n", "0.512501 | \n", "0.115038 | \n", "-0.705544 | \n", "11.747998 | \n", "-0.577955 | \n", "
6373 rows × 8 columns
\n", "| \n", " | observed | \n", "deweathered | \n", "v10 | \n", "blh | \n", "u10 | \n", "sp | \n", "rh2m | \n", "tcc | \n", "d2m | \n", "t2m | \n", "ssrd | \n", "tp | \n", "met_noise | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| date | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
| 2020-01-01 00:00:00 | \n", "58.1 | \n", "23.775707 | \n", "2.803204 | \n", "2.690817 | \n", "10.533843 | \n", "14.459222 | \n", "6.452000 | \n", "5.053862 | \n", "4.216987 | \n", "5.003190 | \n", "4.792167 | \n", "5.521003 | \n", "1.596199 | \n", "
| 2020-01-01 01:00:00 | \n", "43.2 | \n", "23.712904 | \n", "1.546627 | \n", "4.394804 | \n", "11.799731 | \n", "10.566854 | \n", "1.769647 | \n", "1.297532 | \n", "1.966014 | \n", "2.295684 | \n", "1.542771 | \n", "1.862642 | \n", "-0.930420 | \n", "
| 2020-01-01 02:00:00 | \n", "43.0 | \n", "23.308907 | \n", "1.740158 | \n", "6.840758 | \n", "12.729884 | \n", "8.339736 | \n", "1.449420 | \n", "1.877752 | \n", "2.321789 | \n", "0.919309 | \n", "-0.113854 | \n", "2.106147 | \n", "-0.392609 | \n", "
| 2020-01-01 03:00:00 | \n", "42.8 | \n", "21.808085 | \n", "2.402217 | \n", "10.777716 | \n", "12.743709 | \n", "5.307592 | \n", "1.729576 | \n", "2.229663 | \n", "2.012881 | \n", "0.785298 | \n", "0.305861 | \n", "1.625649 | \n", "0.265997 | \n", "
| 2020-01-01 04:00:00 | \n", "36.8 | \n", "22.173301 | \n", "1.698096 | \n", "8.612109 | \n", "9.510499 | \n", "3.318336 | \n", "1.694841 | \n", "2.583169 | \n", "2.313238 | \n", "0.499432 | \n", "-0.465211 | \n", "1.463167 | \n", "-1.849514 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2020-12-31 19:00:00 | \n", "11.7 | \n", "12.869070 | \n", "0.146833 | \n", "-0.498743 | \n", "-0.443972 | \n", "0.866222 | \n", "0.683517 | \n", "-0.338941 | \n", "-0.219422 | \n", "-0.602156 | \n", "-1.466656 | \n", "-0.560928 | \n", "-0.034524 | \n", "
| 2020-12-31 20:00:00 | \n", "11.0 | \n", "12.018398 | \n", "0.320049 | \n", "-0.056764 | \n", "-0.113305 | \n", "0.966535 | \n", "0.720601 | \n", "-0.261063 | \n", "-0.324155 | \n", "-1.152303 | \n", "-1.581597 | \n", "-0.370613 | \n", "-0.144190 | \n", "
| 2020-12-31 21:00:00 | \n", "15.3 | \n", "12.231738 | \n", "0.397497 | \n", "-0.242102 | \n", "-0.911311 | \n", "0.589118 | \n", "0.786209 | \n", "-0.246796 | \n", "-0.040521 | \n", "-0.713239 | \n", "-1.326826 | \n", "-0.321144 | \n", "4.002425 | \n", "
| 2020-12-31 22:00:00 | \n", "17.1 | \n", "12.514066 | \n", "0.676143 | \n", "4.688038 | \n", "1.570879 | \n", "-1.779531 | \n", "1.186440 | \n", "0.857997 | \n", "1.715646 | \n", "0.982372 | \n", "-0.903092 | \n", "-0.228862 | \n", "0.065919 | \n", "
| 2020-12-31 23:00:00 | \n", "15.2 | \n", "11.770696 | \n", "0.539106 | \n", "5.628566 | \n", "2.067334 | \n", "-2.426622 | \n", "0.414002 | \n", "0.017931 | \n", "1.326883 | \n", "0.882671 | \n", "-0.988648 | \n", "-0.456333 | \n", "-0.216909 | \n", "
6373 rows × 13 columns
\n", "| \n", " | observed | \n", "base | \n", "date_unix | \n", "day_julian | \n", "weekday | \n", "hour | \n", "deweathered | \n", "emi_noise | \n", "
|---|---|---|---|---|---|---|---|---|
| date | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
| 2020-01-01 00:00:00 | \n", "58.1 | \n", "9.636890 | \n", "18.471507 | \n", "3.981692 | \n", "1.373361 | \n", "-0.159863 | \n", "24.146201 | \n", "0.479505 | \n", "
| 2020-01-01 01:00:00 | \n", "43.2 | \n", "9.560233 | \n", "18.945920 | \n", "3.962606 | \n", "0.950994 | \n", "-0.031199 | \n", "24.231168 | \n", "0.402847 | \n", "
| 2020-01-01 02:00:00 | \n", "43.0 | \n", "9.457613 | \n", "18.446638 | \n", "3.478760 | \n", "1.149818 | \n", "-0.735301 | \n", "22.640142 | \n", "0.300227 | \n", "
| 2020-01-01 03:00:00 | \n", "42.8 | \n", "9.553435 | \n", "17.988441 | \n", "4.450814 | \n", "0.201102 | \n", "-0.431935 | \n", "22.604472 | \n", "0.396050 | \n", "
| 2020-01-01 04:00:00 | \n", "36.8 | \n", "8.259178 | \n", "18.887683 | \n", "3.579915 | \n", "1.171948 | \n", "-0.676739 | \n", "22.064599 | \n", "-0.898208 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2020-12-31 19:00:00 | \n", "11.7 | \n", "8.791405 | \n", "12.619534 | \n", "0.570769 | \n", "-0.282182 | \n", "0.277319 | \n", "12.819460 | \n", "-0.365980 | \n", "
| 2020-12-31 20:00:00 | \n", "11.0 | \n", "8.768305 | \n", "12.125637 | \n", "0.483223 | \n", "0.000221 | \n", "-0.067327 | \n", "12.152672 | \n", "-0.389080 | \n", "
| 2020-12-31 21:00:00 | \n", "15.3 | \n", "8.492577 | \n", "12.543496 | \n", "0.251146 | \n", "0.147919 | \n", "-0.081575 | \n", "12.196178 | \n", "-0.664809 | \n", "
| 2020-12-31 22:00:00 | \n", "17.1 | \n", "9.704561 | \n", "12.125288 | \n", "0.186412 | \n", "-0.348574 | \n", "0.029269 | \n", "12.539570 | \n", "0.547175 | \n", "
| 2020-12-31 23:00:00 | \n", "15.2 | \n", "8.273833 | \n", "12.567619 | \n", "0.757832 | \n", "-0.068558 | \n", "-0.986782 | \n", "11.386559 | \n", "-0.883552 | \n", "
6373 rows × 8 columns
\n", "| \n", " | observed | \n", "rolling_0 | \n", "rolling_1 | \n", "rolling_2 | \n", "rolling_3 | \n", "rolling_4 | \n", "rolling_5 | \n", "rolling_6 | \n", "rolling_7 | \n", "rolling_8 | \n", "... | \n", "rolling_35 | \n", "rolling_36 | \n", "rolling_37 | \n", "rolling_38 | \n", "rolling_39 | \n", "rolling_40 | \n", "rolling_41 | \n", "rolling_42 | \n", "rolling_43 | \n", "rolling_44 | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| date | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
| 2020-01-01 00:00:00 | \n", "58.1 | \n", "20.207316 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 2020-01-01 01:00:00 | \n", "43.2 | \n", "20.131948 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 2020-01-01 02:00:00 | \n", "43.0 | \n", "19.247751 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 2020-01-01 03:00:00 | \n", "42.8 | \n", "19.310005 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 2020-01-01 04:00:00 | \n", "36.8 | \n", "20.072632 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
5 rows × 46 columns
\n", "| \n", " | rowid | \n", "d2m | \n", "blh | \n", "ssrd | \n", "t2m | \n", "v10 | \n", "u10 | \n", "sp | \n", "tp | \n", "tcc | \n", "rh2m | \n", "date | \n", "value | \n", "date_unix | \n", "day_julian | \n", "weekday | \n", "hour | \n", "set | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "0 | \n", "277.183465 | \n", "384.209053 | \n", "-1.164153e-10 | \n", "278.394725 | \n", "1.545010 | \n", "-2.720528 | \n", "102252.303312 | \n", "0.000008 | \n", "0.650958 | \n", "91.884130 | \n", "2020-01-01 00:00:00 | \n", "58.1 | \n", "1.577837e+09 | \n", "1 | \n", "3 | \n", "0 | \n", "training | \n", "
| 1 | \n", "1 | \n", "276.695430 | \n", "353.220263 | \n", "-1.164153e-10 | \n", "277.772899 | \n", "1.282742 | \n", "-2.308789 | \n", "102211.168636 | \n", "0.000002 | \n", "0.603699 | \n", "92.715877 | \n", "2020-01-01 01:00:00 | \n", "43.2 | \n", "1.577840e+09 | \n", "1 | \n", "3 | \n", "1 | \n", "training | \n", "
| 2 | \n", "2 | \n", "276.505662 | \n", "255.911846 | \n", "-1.164153e-10 | \n", "277.463419 | \n", "0.758730 | \n", "-2.216471 | \n", "102174.855967 | \n", "0.000005 | \n", "0.710378 | \n", "93.485560 | \n", "2020-01-01 02:00:00 | \n", "43.0 | \n", "1.577844e+09 | \n", "1 | \n", "3 | \n", "2 | \n", "testing | \n", "
| 3 | \n", "3 | \n", "276.412816 | \n", "191.375560 | \n", "-1.164153e-10 | \n", "277.305813 | \n", "0.509013 | \n", "-1.928623 | \n", "102166.786485 | \n", "0.000005 | \n", "0.837765 | \n", "93.906363 | \n", "2020-01-01 03:00:00 | \n", "42.8 | \n", "1.577848e+09 | \n", "1 | \n", "3 | \n", "3 | \n", "training | \n", "
| 4 | \n", "4 | \n", "276.553051 | \n", "151.780210 | \n", "-1.164153e-10 | \n", "277.478941 | \n", "0.607069 | \n", "-1.700043 | \n", "102142.578039 | \n", "0.000003 | \n", "0.819103 | \n", "93.696878 | \n", "2020-01-01 04:00:00 | \n", "36.8 | \n", "1.577851e+09 | \n", "1 | \n", "3 | \n", "4 | \n", "testing | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 6368 | \n", "6368 | \n", "272.197565 | \n", "476.945688 | \n", "-5.820766e-11 | \n", "273.557442 | \n", "-1.945195 | \n", "1.380939 | \n", "99902.506413 | \n", "0.000000 | \n", "0.918149 | \n", "90.582979 | \n", "2020-12-31 19:00:00 | \n", "11.7 | \n", "1.609441e+09 | \n", "366 | \n", "4 | \n", "19 | \n", "training | \n", "
| 6369 | \n", "6369 | \n", "272.171041 | \n", "486.665851 | \n", "-5.820766e-11 | \n", "273.629146 | \n", "-2.102732 | \n", "0.987925 | \n", "99947.625909 | \n", "0.000000 | \n", "0.839639 | \n", "89.939908 | \n", "2020-12-31 20:00:00 | \n", "11.0 | \n", "1.609445e+09 | \n", "366 | \n", "4 | \n", "20 | \n", "training | \n", "
| 6370 | \n", "6370 | \n", "272.087408 | \n", "489.355002 | \n", "-5.820766e-11 | \n", "273.470592 | \n", "-1.933668 | \n", "0.681543 | \n", "100000.215520 | \n", "0.000000 | \n", "0.739354 | \n", "90.422188 | \n", "2020-12-31 21:00:00 | \n", "15.3 | \n", "1.609448e+09 | \n", "366 | \n", "4 | \n", "21 | \n", "testing | \n", "
| 6371 | \n", "6371 | \n", "272.235319 | \n", "40.714872 | \n", "-5.820766e-11 | \n", "272.926062 | \n", "-0.583816 | \n", "1.020793 | \n", "100042.844978 | \n", "0.000000 | \n", "0.643753 | \n", "95.088677 | \n", "2020-12-31 22:00:00 | \n", "17.1 | \n", "1.609452e+09 | \n", "366 | \n", "4 | \n", "22 | \n", "training | \n", "
| 6372 | \n", "6372 | \n", "272.020979 | \n", "55.617254 | \n", "-5.820766e-11 | \n", "272.681367 | \n", "-0.377511 | \n", "0.959517 | \n", "100053.601944 | \n", "0.000000 | \n", "0.549403 | \n", "95.290673 | \n", "2020-12-31 23:00:00 | \n", "15.2 | \n", "1.609456e+09 | \n", "366 | \n", "4 | \n", "23 | \n", "training | \n", "
6373 rows × 18 columns
\n", "| \n", " | variable | \n", "value | \n", "pdp_mean | \n", "pdp_std | \n", "
|---|---|---|---|---|
| 0 | \n", "blh | \n", "73.415911 | \n", "15.742461 | \n", "8.358786 | \n", "
| 1 | \n", "blh | \n", "88.917320 | \n", "15.359839 | \n", "8.271418 | \n", "
| 2 | \n", "blh | \n", "104.418730 | \n", "14.966788 | \n", "8.354652 | \n", "
| 3 | \n", "blh | \n", "119.920140 | \n", "15.582338 | \n", "8.428540 | \n", "
| 4 | \n", "blh | \n", "135.421549 | \n", "13.699515 | \n", "7.471944 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 95 | \n", "blh | \n", "1546.049822 | \n", "6.940856 | \n", "4.955734 | \n", "
| 96 | \n", "blh | \n", "1561.551231 | \n", "6.955089 | \n", "4.957737 | \n", "
| 97 | \n", "blh | \n", "1577.052641 | \n", "6.960697 | \n", "4.952725 | \n", "
| 98 | \n", "blh | \n", "1592.554051 | \n", "7.132266 | \n", "4.943666 | \n", "
| 99 | \n", "blh | \n", "1608.055460 | \n", "7.126766 | \n", "4.943877 | \n", "
100 rows × 4 columns
\n", "| \n", " | variable | \n", "value | \n", "pdp_mean | \n", "pdp_std | \n", "
|---|---|---|---|---|
| 0 | \n", "blh | \n", "73.415911 | \n", "15.742461 | \n", "8.358786 | \n", "
| 1 | \n", "blh | \n", "88.917320 | \n", "15.359839 | \n", "8.271418 | \n", "
| 2 | \n", "blh | \n", "104.418730 | \n", "14.966788 | \n", "8.354652 | \n", "
| 3 | \n", "blh | \n", "119.920140 | \n", "15.582338 | \n", "8.428540 | \n", "
| 4 | \n", "blh | \n", "135.421549 | \n", "13.699515 | \n", "7.471944 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 195 | \n", "t2m | \n", "294.518468 | \n", "10.544835 | \n", "7.865555 | \n", "
| 196 | \n", "t2m | \n", "294.715875 | \n", "10.532480 | \n", "7.856032 | \n", "
| 197 | \n", "t2m | \n", "294.913281 | \n", "10.565610 | \n", "7.847180 | \n", "
| 198 | \n", "t2m | \n", "295.110688 | \n", "10.527926 | \n", "7.840150 | \n", "
| 199 | \n", "t2m | \n", "295.308095 | \n", "10.515571 | \n", "7.841594 | \n", "
200 rows × 4 columns
\n", "| \n", " | variable | \n", "value | \n", "pdp_mean | \n", "pdp_std | \n", "
|---|---|---|---|---|
| 0 | \n", "weekday | \n", "1.0 | \n", "8.808568 | \n", "7.348096 | \n", "
| 1 | \n", "weekday | \n", "2.0 | \n", "8.975131 | \n", "7.397715 | \n", "
| 2 | \n", "weekday | \n", "3.0 | \n", "9.519126 | \n", "7.803357 | \n", "
| 3 | \n", "weekday | \n", "4.0 | \n", "9.178989 | \n", "7.852847 | \n", "
| 4 | \n", "weekday | \n", "5.0 | \n", "9.756207 | \n", "7.741670 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 1226 | \n", "hour | \n", "19.0 | \n", "9.648269 | \n", "7.468077 | \n", "
| 1227 | \n", "hour | \n", "20.0 | \n", "9.583308 | \n", "7.474737 | \n", "
| 1228 | \n", "hour | \n", "21.0 | \n", "9.275591 | \n", "7.467640 | \n", "
| 1229 | \n", "hour | \n", "22.0 | \n", "9.089483 | \n", "7.493595 | \n", "
| 1230 | \n", "hour | \n", "23.0 | \n", "8.733808 | \n", "7.531601 | \n", "
1231 rows × 4 columns
\n", "