{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "name": "UltimateJupiterNotebookCAIC-1_AF.ipynb", "provenance": [], "collapsed_sections": [] }, "kernelspec": { "display_name": "Python 3", "name": "python3" }, "widgets": { "application/vnd.jupyter.widget-state+json": { "499d8582265046e2970e453489ba6031": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_fbf81571f4cb4c059a3e5a66b7ef2221", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 3, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 3, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_4347d82e97784a83a087906c398d0e1f" } }, "fbf81571f4cb4c059a3e5a66b7ef2221": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "4347d82e97784a83a087906c398d0e1f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": 
"LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "a6c8551cb31645318ee511bd4a1e3859": { "model_module": "@jupyter-widgets/controls", "model_name": "TextModel", "state": { "_view_name": "TextView", "style": "IPY_MODEL_7630cddea594473e9538bef58294d8c2", "_dom_classes": [], "description": "", "_model_name": "TextModel", "placeholder": "​", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": "Following data types have been inferred automatically, if they are correct press enter to continue or type 'quit' otherwise.", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "continuous_update": true, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_169d6da9acf647d6bd4f509a5fdd50ba" } }, "7630cddea594473e9538bef58294d8c2": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "state": { "_view_name": "StyleView", "_model_name": "DescriptionStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "169d6da9acf647d6bd4f509a5fdd50ba": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": "100%", "min_width": null, "border": null, 
"align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "0e9ab74349ab43df8d009f7bd46b034f": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_935ed9dc79c34b8ebd029281bfdcc6f8", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 79, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 79, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_c7560dbc634b435a8b54faaa681f63c9" } }, "935ed9dc79c34b8ebd029281bfdcc6f8": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "c7560dbc634b435a8b54faaa681f63c9": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, 
"_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "73622256dba84671bcab7e329b378818": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_81f4ba27c56546f48f4c958c203d9ff0", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_4a04ba961a454ceda4d285771d7567a2" } }, "81f4ba27c56546f48f4c958c203d9ff0": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "4a04ba961a454ceda4d285771d7567a2": { 
"model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "f49794a0e9f54c26a7d7f84c0f3344e4": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_8adc97a7aeff4c6da935b5f1b7855696", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_d490a6b4780f436685e43fd6614510ed" } }, "8adc97a7aeff4c6da935b5f1b7855696": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": 
"1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "d490a6b4780f436685e43fd6614510ed": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "6a21aea1e810435582c37b3aace35901": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_63588303eaf74b1b8351bce44c98dec8", "_model_module": "@jupyter-widgets/controls", "children": [ "IPY_MODEL_8eb369ace554446aa838a50afd0bf50e", "IPY_MODEL_c762527fa7374891b97f5d50430d5dd8" ] } }, "63588303eaf74b1b8351bce44c98dec8": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, 
"right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "8eb369ace554446aa838a50afd0bf50e": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", "Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_9e49a094eca748aa9286b42c7bf180ed", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 0, "button_style": "", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_2994bc88f7624637ab65cef6e500da32" } }, "c762527fa7374891b97f5d50430d5dd8": { 
"model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
Parameters
objectivebinary:logistic
use_label_encoderTrue
base_score0.5
boostergbtree
colsample_bylevel1
colsample_bynode1
colsample_bytree1
gamma0
gpu_id-1
importance_typegain
interaction_constraints
learning_rate0.300000012
max_delta_step0
max_depth6
min_child_weight1
missingnan
monotone_constraints()
n_estimators100
n_jobs-1
num_parallel_tree1
random_state1506
reg_alpha0
reg_lambda1
scale_pos_weight1
subsample1
tree_methodauto
validate_parameters1
verbosity0
\n
", "text/plain": " Parameters\nobjective binary:logistic\nuse_label_encoder True\nbase_score 0.5\nbooster gbtree\ncolsample_bylevel 1\ncolsample_bynode 1\ncolsample_bytree 1\ngamma 0\ngpu_id -1\nimportance_type gain\ninteraction_constraints \nlearning_rate 0.300000012\nmax_delta_step 0\nmax_depth 6\nmin_child_weight 1\nmissing nan\nmonotone_constraints ()\nn_estimators 100\nn_jobs -1\nnum_parallel_tree 1\nrandom_state 1506\nreg_alpha 0\nreg_lambda 1\nscale_pos_weight 1\nsubsample 1\ntree_method auto\nvalidate_parameters 1\nverbosity 0" } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_e75c29fbbf504123a6518d12d501f3ab", "_model_module": "@jupyter-widgets/output" } }, "9e49a094eca748aa9286b42c7bf180ed": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "2994bc88f7624637ab65cef6e500da32": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": 
null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "e75c29fbbf504123a6518d12d501f3ab": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "03350dd1e5214f3aabc48b7565ae4b49": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_de314b3f0f544c61acf5fd33e99c911c", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, 
"_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_4550376ea6bd45b9af276503dfbf6a90" } }, "a463af2b79b94ecd9365cc4ba0ee1641": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_db9f6b4f028741f8bd5f4d93803b5e67", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_43c55b638f584647aaefcf3b9cfcee29" } }, "db9f6b4f028741f8bd5f4d93803b5e67": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "43c55b638f584647aaefcf3b9cfcee29": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, 
"padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "bce1c8fe885d45608d740beaadec1033": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_7034122a4ff1489e9d7d26af63ce6af4", "_model_module": "@jupyter-widgets/controls", "children": [ "IPY_MODEL_bf891634e154429f9e7a228e21d84a2d", "IPY_MODEL_2e407875db904ec0ae0a9b9ede4cd9ca" ] } }, "7034122a4ff1489e9d7d26af63ce6af4": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "bf891634e154429f9e7a228e21d84a2d": 
{ "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", "Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_55475be2cb3343bdac82821b1e7dc07b", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 0, "button_style": "", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_3ab14392cd464feca63d9f5bc7c721cf" } }, "2e407875db904ec0ae0a9b9ede4cd9ca": { "model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
Parameters
C1.0
class_weightNone
dualFalse
fit_interceptTrue
intercept_scaling1
l1_ratioNone
max_iter1000
multi_classauto
n_jobsNone
penaltyl2
random_state1506
solverlbfgs
tol0.0001
verbose0
warm_startFalse
\n
", "text/plain": " Parameters\nC 1.0\nclass_weight None\ndual False\nfit_intercept True\nintercept_scaling 1\nl1_ratio None\nmax_iter 1000\nmulti_class auto\nn_jobs None\npenalty l2\nrandom_state 1506\nsolver lbfgs\ntol 0.0001\nverbose 0\nwarm_start False" } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_25ff3ee0e3ba4ac59b4b968455e6ffd1", "_model_module": "@jupyter-widgets/output" } }, "55475be2cb3343bdac82821b1e7dc07b": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "3ab14392cd464feca63d9f5bc7c721cf": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, 
"margin": null, "display": null, "left": null } }, "25ff3ee0e3ba4ac59b4b968455e6ffd1": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "465c097926b74791b7ed2dfeb41366e8": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_26fb1c534a0f4c32850a5704b197684f", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_729905d4b2234c8d9895a1fa6713748f" } }, "26fb1c534a0f4c32850a5704b197684f": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", 
"description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "729905d4b2234c8d9895a1fa6713748f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "cc14420b2b9241d3b51fcf513404de1e": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_108169e47ebe4b9bac95b4a38214dd1e", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_ca04ad074d944f4daf5860fdd0393732" } }, 
"108169e47ebe4b9bac95b4a38214dd1e": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "ca04ad074d944f4daf5860fdd0393732": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "392d9d1a9fa146ab90b0a9e5949d6b61": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_65706dd29fe5457bb1f2201f38b98161", "_model_module": "@jupyter-widgets/controls", 
"children": [ "IPY_MODEL_6e27df66c8244d3f8506606169a712e3", "IPY_MODEL_d3f96bd6691643239b6757383587be54" ] } }, "65706dd29fe5457bb1f2201f38b98161": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "6e27df66c8244d3f8506606169a712e3": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", "Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_9e08f8f4343a441ab290545c679533cf", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 0, "button_style": "", "_view_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_e14d0ac066224518ac2eaef551c70c10" } }, "d3f96bd6691643239b6757383587be54": { "model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
Parameters
nan_modeMin
eval_metricLogloss
iterations1000
sampling_frequencyPerTree
leaf_estimation_methodNewton
grow_policySymmetricTree
penalties_coefficient1
boosting_typePlain
model_shrink_modeConstant
feature_border_typeGreedyLogSum
bayesian_matrix_reg0.10000000149011612
l2_leaf_reg3
random_strength1
rsm1
boost_from_averageFalse
model_size_reg0.5
subsample0.800000011920929
use_best_modelFalse
class_names[0, 1]
random_seed1506
depth6
posterior_samplingFalse
border_count254
classes_count0
auto_class_weightsNone
sparse_features_conflict_fraction0
leaf_estimation_backtrackingAnyImprovement
best_model_min_trees1
model_shrink_rate0
min_data_in_leaf1
loss_functionLogloss
learning_rate0.015088999643921852
score_functionCosine
task_typeCPU
leaf_estimation_iterations10
bootstrap_typeMVS
max_leaves64
\n
", "text/plain": " Parameters\nnan_mode Min\neval_metric Logloss\niterations 1000\nsampling_frequency PerTree\nleaf_estimation_method Newton\ngrow_policy SymmetricTree\npenalties_coefficient 1\nboosting_type Plain\nmodel_shrink_mode Constant\nfeature_border_type GreedyLogSum\nbayesian_matrix_reg 0.10000000149011612\nl2_leaf_reg 3\nrandom_strength 1\nrsm 1\nboost_from_average False\nmodel_size_reg 0.5\nsubsample 0.800000011920929\nuse_best_model False\nclass_names [0, 1]\nrandom_seed 1506\ndepth 6\nposterior_sampling False\nborder_count 254\nclasses_count 0\nauto_class_weights None\nsparse_features_conflict_fraction 0\nleaf_estimation_backtracking AnyImprovement\nbest_model_min_trees 1\nmodel_shrink_rate 0\nmin_data_in_leaf 1\nloss_function Logloss\nlearning_rate 0.015088999643921852\nscore_function Cosine\ntask_type CPU\nleaf_estimation_iterations 10\nbootstrap_type MVS\nmax_leaves 64" } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_a7a1a6b7f72e4a12bd574eb45c801b39", "_model_module": "@jupyter-widgets/output" } }, "9e08f8f4343a441ab290545c679533cf": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "e14d0ac066224518ac2eaef551c70c10": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": 
null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "a7a1a6b7f72e4a12bd574eb45c801b39": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "afd584fbc8a24f1baaf7ffd336839df5": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": 
"IPY_MODEL_9e412e3be60c4a65a00a62cc0900524c", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 3, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 3, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_650fd903437f42138427259ae89385c0" } }, "9e412e3be60c4a65a00a62cc0900524c": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "650fd903437f42138427259ae89385c0": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } 
}, "adc3728c289f4410b594a4212f5e729c": { "model_module": "@jupyter-widgets/controls", "model_name": "TextModel", "state": { "_view_name": "TextView", "style": "IPY_MODEL_dd30b884e50b47caa2c7eb30d7d5b397", "_dom_classes": [], "description": "", "_model_name": "TextModel", "placeholder": "​", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": "Following data types have been inferred automatically, if they are correct press enter to continue or type 'quit' otherwise.", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "continuous_update": true, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_eb3d75a11c1c4575a621c248ccfe0f52" } }, "dd30b884e50b47caa2c7eb30d7d5b397": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "state": { "_view_name": "StyleView", "_model_name": "DescriptionStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "eb3d75a11c1c4575a621c248ccfe0f52": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": "100%", "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, 
"grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "60bb4204212e4b65b4e7fdf846790952": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_7ea62fdec17144158b7fb4cfe3c83b21", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 79, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 79, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_cf5589d70daf40ed94c7ffd89dac990e" } }, "7ea62fdec17144158b7fb4cfe3c83b21": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "cf5589d70daf40ed94c7ffd89dac990e": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", 
"justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "5f54753abe0e4486b04eb8d273109b4c": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_87522b28665f4055afc2762b6d60ebe0", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_547856fc003e480eb9533f7541f11b61" } }, "87522b28665f4055afc2762b6d60ebe0": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "547856fc003e480eb9533f7541f11b61": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, 
"grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "5505c035740744dba23dce1750ea4c06": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_f48ed8a89f0a463eabd3c02d11807c26", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_e3346fce67b341a189e271ae4dbbf637" } }, "f48ed8a89f0a463eabd3c02d11807c26": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "e3346fce67b341a189e271ae4dbbf637": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", 
"_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "289080f92a784987bf9803c808c86b2f": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_c00d0d4f76cf4b3ba143096fcabd9160", "_model_module": "@jupyter-widgets/controls", "children": [ "IPY_MODEL_1278fb36784f41728b5aed0c522375eb", "IPY_MODEL_a391a8969f7044ddbb8f996f2ae9d841" ] } }, "c00d0d4f76cf4b3ba143096fcabd9160": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": 
null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "1278fb36784f41728b5aed0c522375eb": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", "Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_5983e5d1fcca4214afeeb0b6e3e9f01b", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 0, "button_style": "", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_5654c6ccc5e94fe5b4b6015c80437afd" } }, "a391a8969f7044ddbb8f996f2ae9d841": { "model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
Parameters
objectivebinary:logistic
use_label_encoderTrue
base_score0.5
boostergbtree
colsample_bylevel1
colsample_bynode1
colsample_bytree1
gamma0
gpu_id-1
importance_typegain
interaction_constraints
learning_rate0.300000012
max_delta_step0
max_depth6
min_child_weight1
missingnan
monotone_constraints()
n_estimators100
n_jobs-1
num_parallel_tree1
random_state4581
reg_alpha0
reg_lambda1
scale_pos_weight1
subsample1
tree_methodauto
validate_parameters1
verbosity0
\n
", "text/plain": " Parameters\nobjective binary:logistic\nuse_label_encoder True\nbase_score 0.5\nbooster gbtree\ncolsample_bylevel 1\ncolsample_bynode 1\ncolsample_bytree 1\ngamma 0\ngpu_id -1\nimportance_type gain\ninteraction_constraints \nlearning_rate 0.300000012\nmax_delta_step 0\nmax_depth 6\nmin_child_weight 1\nmissing nan\nmonotone_constraints ()\nn_estimators 100\nn_jobs -1\nnum_parallel_tree 1\nrandom_state 4581\nreg_alpha 0\nreg_lambda 1\nscale_pos_weight 1\nsubsample 1\ntree_method auto\nvalidate_parameters 1\nverbosity 0" } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_be8e6cd719384b719d8e05c54eab3225", "_model_module": "@jupyter-widgets/output" } }, "5983e5d1fcca4214afeeb0b6e3e9f01b": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "5654c6ccc5e94fe5b4b6015c80437afd": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": 
null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "be8e6cd719384b719d8e05c54eab3225": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "3f094aa3d2e34e2b988d99c742f9d393": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_aa757b9ea18c486cac397ec90631be22", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 5, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 5, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, 
"_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_2800e9fa0fa84f899598d83083a9f37f" } }, "aa757b9ea18c486cac397ec90631be22": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "2800e9fa0fa84f899598d83083a9f37f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "19bfaa8c92624fc49d00fb576eb168a0": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_209a2ebbe1af4fc498e7ba114ccc3878", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_3eb1e382648f4b47b0b31c76152573bd" } }, "209a2ebbe1af4fc498e7ba114ccc3878": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "3eb1e382648f4b47b0b31c76152573bd": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "6e579c53f5154dcc9f288f98732dfda5": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": 
"IPY_MODEL_4a8be249ec484581994f11a00c835fd7", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_224cb2b4e86f479d91d9fca0a4cff63b" } }, "4a8be249ec484581994f11a00c835fd7": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "224cb2b4e86f479d91d9fca0a4cff63b": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } 
}, "8f6833e896f24ce1b691f340f19acbf3": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_4a39820fd6e34def9e7df8b60b827dd4", "_model_module": "@jupyter-widgets/controls", "children": [ "IPY_MODEL_3745871b9e9d4960b65954a97c83eff2", "IPY_MODEL_4a103d29196a45ddb2be13242dc5948d" ] } }, "4a39820fd6e34def9e7df8b60b827dd4": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "3745871b9e9d4960b65954a97c83eff2": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", 
"Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_d4177e6dc2a34c94850207968293f112", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 14, "button_style": "", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_e8ffa2e43da84377803186697fdf7bd6" } }, "4a103d29196a45ddb2be13242dc5948d": { "model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "application/vnd.jupyter.widget-view+json": { "model_id": "70b3c58232134d9cac7db23f5b62bfda", "version_minor": 0, "version_major": 2 }, "text/plain": "IntProgress(value=0, description='Processing: ', max=5)" }, { "output_type": "pyerr", "metadata": { "tags": [] }, "ename": "ValueError", "evalue": "ignored", "traceback": [ "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", "\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/ipywidgets/widgets/interaction.py\u001b[0m in \u001b[0;36mupdate\u001b[0;34m(self, *args)\u001b[0m\n\u001b[1;32m 254\u001b[0m \u001b[0mvalue\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mwidget\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mget_interact_value\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 255\u001b[0m 
\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mwidget\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_kwarg\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mvalue\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 256\u001b[0;31m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mresult\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mf\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m**\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 257\u001b[0m \u001b[0mshow_inline_matplotlib_plots\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 258\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mauto_display\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mresult\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pycaret/internal/tabular.py\u001b[0m in \u001b[0;36mplot_model\u001b[0;34m(estimator, plot, scale, save, fold, fit_kwargs, groups, feature_name, label, use_train_data, verbose, system, display)\u001b[0m\n\u001b[1;32m 7167\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7168\u001b[0m \u001b[0;31m# execute the plot method\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 7169\u001b[0;31m \u001b[0mret\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mlocals\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mplot\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 
7170\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mret\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7171\u001b[0m \u001b[0mplot_filename\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mret\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pycaret/internal/tabular.py\u001b[0m in \u001b[0;36mfeature_all\u001b[0;34m()\u001b[0m\n\u001b[1;32m 7100\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7101\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mfeature_all\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 7102\u001b[0;31m \u001b[0m_feature\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdata_X\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcolumns\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 7103\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7104\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0m_feature\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mn\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mint\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pycaret/internal/tabular.py\u001b[0m in \u001b[0;36m_feature\u001b[0;34m(n)\u001b[0m\n\u001b[1;32m 7128\u001b[0m \u001b[0mmy_range\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msorted_df\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7129\u001b[0m 
\u001b[0mdisplay\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmove_progress\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 7130\u001b[0;31m \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfigure\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfigsize\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m8\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m5\u001b[0m \u001b[0;34m*\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mn\u001b[0m \u001b[0;34m//\u001b[0m \u001b[0;36m10\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdpi\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0m_base_dpi\u001b[0m \u001b[0;34m*\u001b[0m \u001b[0mscale\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 7131\u001b[0m plt.hlines(\n\u001b[1;32m 7132\u001b[0m \u001b[0my\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mmy_range\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mxmin\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mxmax\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0msorted_df\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"Value\"\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcolor\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m\"skyblue\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/matplotlib/pyplot.py\u001b[0m in \u001b[0;36mfigure\u001b[0;34m(num, figsize, dpi, facecolor, edgecolor, frameon, FigureClass, clear, **kwargs)\u001b[0m\n\u001b[1;32m 544\u001b[0m \u001b[0mframeon\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mframeon\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 545\u001b[0m \u001b[0mFigureClass\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mFigureClass\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 546\u001b[0;31m **kwargs)\n\u001b[0m\u001b[1;32m 547\u001b[0m 
\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 548\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mfigLabel\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/matplotlib/backend_bases.py\u001b[0m in \u001b[0;36mnew_figure_manager\u001b[0;34m(cls, num, *args, **kwargs)\u001b[0m\n\u001b[1;32m 3355\u001b[0m \u001b[0;32mfrom\u001b[0m \u001b[0mmatplotlib\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfigure\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mFigure\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 3356\u001b[0m \u001b[0mfig_cls\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mkwargs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpop\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'FigureClass'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mFigure\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 3357\u001b[0;31m \u001b[0mfig\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mfig_cls\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 3358\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mcls\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnew_figure_manager_given_figure\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnum\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mfig\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 3359\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/matplotlib/figure.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, figsize, dpi, facecolor, edgecolor, linewidth, frameon, subplotpars, tight_layout, constrained_layout)\u001b[0m\n\u001b[1;32m 347\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 348\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0;32mnot\u001b[0m 
\u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0misfinite\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfigsize\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mall\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0marray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfigsize\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m<=\u001b[0m \u001b[0;36m0\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0many\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 349\u001b[0;31m raise ValueError('figure size must be positive finite not '\n\u001b[0m\u001b[1;32m 350\u001b[0m f'{figsize}')\n\u001b[1;32m 351\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbbox_inches\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mBbox\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfrom_bounds\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0mfigsize\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;31mValueError\u001b[0m: figure size must be positive finite not (8, 0)" ] } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_61900fd657354669ac47d7fc218f0e63", "_model_module": "@jupyter-widgets/output" } }, "d4177e6dc2a34c94850207968293f112": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, 
"e8ffa2e43da84377803186697fdf7bd6": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "61900fd657354669ac47d7fc218f0e63": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, 
"max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "e5653ef1f4ac4568af5ca682912df39c": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_bc82ef6f0b8f49f6a44179bd6b853445", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 5, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 3, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_e05532a49de54883a2776a4ce69ff02e" } }, "bc82ef6f0b8f49f6a44179bd6b853445": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "e05532a49de54883a2776a4ce69ff02e": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, 
"max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "70b3c58232134d9cac7db23f5b62bfda": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_c4db2e658ea54e1f896d3695a75fb0f8", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 5, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_0edb902376534a8fbd01c22af54b7c27" } }, "c4db2e658ea54e1f896d3695a75fb0f8": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "0edb902376534a8fbd01c22af54b7c27": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, 
"overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "3659c16a4759447f9c8b2e9e1bd7860f": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_ea4bd0ed110e4818a61de5d741d65792", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_ab3daf44e84e407f89d82424587c45d2" } }, "ea4bd0ed110e4818a61de5d741d65792": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "ab3daf44e84e407f89d82424587c45d2": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": 
null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "9c93b53066f449cabffe42495002ff2b": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_84de493313c4416ba147b8514bdf5ccd", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_e8696e757e9140d38d0dec51809b5a37" } }, "84de493313c4416ba147b8514bdf5ccd": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "e8696e757e9140d38d0dec51809b5a37": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": 
null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "679526b38f8c47ad9a8759d066aabb5c": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_4bb43807c6ed4bbb8bc7a1de36170aad", "_model_module": "@jupyter-widgets/controls", "children": [ "IPY_MODEL_15bacfbd614c48e7ac46997961421489", "IPY_MODEL_9d221ee267124302b6aac1bab99db046" ] } }, "4bb43807c6ed4bbb8bc7a1de36170aad": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, 
"grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "15bacfbd614c48e7ac46997961421489": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", "Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_c0a39ef9ad4c46bca8299fb6a5fffec8", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 0, "button_style": "", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_29af3b998a664828a5afa4b9f7dda07c" } }, "9d221ee267124302b6aac1bab99db046": { "model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
Parameters
nan_modeMin
eval_metricLogloss
iterations1000
sampling_frequencyPerTree
leaf_estimation_methodNewton
grow_policySymmetricTree
penalties_coefficient1
boosting_typePlain
model_shrink_modeConstant
feature_border_typeGreedyLogSum
bayesian_matrix_reg0.10000000149011612
l2_leaf_reg3
random_strength1
rsm1
boost_from_averageFalse
model_size_reg0.5
subsample0.800000011920929
use_best_modelFalse
class_names[0, 1]
random_seed4581
depth6
posterior_samplingFalse
border_count254
classes_count0
auto_class_weightsNone
sparse_features_conflict_fraction0
leaf_estimation_backtrackingAnyImprovement
best_model_min_trees1
model_shrink_rate0
min_data_in_leaf1
loss_functionLogloss
learning_rate0.014127999544143677
score_functionCosine
task_typeCPU
leaf_estimation_iterations10
bootstrap_typeMVS
max_leaves64
\n
", "text/plain": " Parameters\nnan_mode Min\neval_metric Logloss\niterations 1000\nsampling_frequency PerTree\nleaf_estimation_method Newton\ngrow_policy SymmetricTree\npenalties_coefficient 1\nboosting_type Plain\nmodel_shrink_mode Constant\nfeature_border_type GreedyLogSum\nbayesian_matrix_reg 0.10000000149011612\nl2_leaf_reg 3\nrandom_strength 1\nrsm 1\nboost_from_average False\nmodel_size_reg 0.5\nsubsample 0.800000011920929\nuse_best_model False\nclass_names [0, 1]\nrandom_seed 4581\ndepth 6\nposterior_sampling False\nborder_count 254\nclasses_count 0\nauto_class_weights None\nsparse_features_conflict_fraction 0\nleaf_estimation_backtracking AnyImprovement\nbest_model_min_trees 1\nmodel_shrink_rate 0\nmin_data_in_leaf 1\nloss_function Logloss\nlearning_rate 0.014127999544143677\nscore_function Cosine\ntask_type CPU\nleaf_estimation_iterations 10\nbootstrap_type MVS\nmax_leaves 64" } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_bc3075446d0348bcb00f9a672dcc8ad1", "_model_module": "@jupyter-widgets/output" } }, "c0a39ef9ad4c46bca8299fb6a5fffec8": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "29af3b998a664828a5afa4b9f7dda07c": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": 
null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "bc3075446d0348bcb00f9a672dcc8ad1": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "69bbea89321f407eae6f435e00728d9d": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": 
"IPY_MODEL_5facd9a5cac94c8d87e51d5d79cc6aca", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 5, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_75c2ebf71ba14b8da324d470fde6096b" } }, "5facd9a5cac94c8d87e51d5d79cc6aca": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "75c2ebf71ba14b8da324d470fde6096b": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } 
}, "8707725331314861821ce500a3eeffac": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_4be5360cabe647d5849b88f489b6cd20", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 3, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 3, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_eb95926f6a4944c292da60aa0213e396" } }, "4be5360cabe647d5849b88f489b6cd20": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "eb95926f6a4944c292da60aa0213e396": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, 
"_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "8395d1cb9e454d068dd6a3db160fc9c6": { "model_module": "@jupyter-widgets/controls", "model_name": "TextModel", "state": { "_view_name": "TextView", "style": "IPY_MODEL_b8d139ba355646888a39dfaa52bb6c36", "_dom_classes": [], "description": "", "_model_name": "TextModel", "placeholder": "​", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": "Following data types have been inferred automatically, if they are correct press enter to continue or type 'quit' otherwise.", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "continuous_update": true, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_6d74e458826c4bd1aed9dca2760c8ca0" } }, "b8d139ba355646888a39dfaa52bb6c36": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "state": { "_view_name": "StyleView", "_model_name": "DescriptionStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "6d74e458826c4bd1aed9dca2760c8ca0": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": "100%", "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", 
"justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "c24b28b804be4c248eba0b3eb3099673": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_5737d68310e24f188f9a1c8844aa4831", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 79, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 79, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_0df65d85f8fc4afd845d8a8346d0ac00" } }, "5737d68310e24f188f9a1c8844aa4831": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "0df65d85f8fc4afd845d8a8346d0ac00": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, 
"grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "8dd10b0c4c8e4c2d899ca98ddf26f19f": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_4cf7d8abf42d43239a03e760182abacd", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_46c96d3cfe814a7fb86366bdf21700ea" } }, "4cf7d8abf42d43239a03e760182abacd": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "46c96d3cfe814a7fb86366bdf21700ea": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", 
"_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "3516024e5141494ba968244737483245": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_4885cdb5a3d2483e924c0cc0d75f97e5", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_dfb224af140240ecb4e4b055a3238bf8" } }, "4885cdb5a3d2483e924c0cc0d75f97e5": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "dfb224af140240ecb4e4b055a3238bf8": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": 
"LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "5238ac85157f48ebbef40b4332450a4d": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_3e4c48f925694b4992df24d3db4cd08d", "_model_module": "@jupyter-widgets/controls", "children": [ "IPY_MODEL_90305a6b029b4002915d714b18d2dc6a", "IPY_MODEL_36efa56b78d848e18fc9d8ff5248025b" ] } }, "3e4c48f925694b4992df24d3db4cd08d": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, 
"_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "90305a6b029b4002915d714b18d2dc6a": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", "Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_cbb0a03436964633b5fb8378022b6af0", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 0, "button_style": "", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_389e9955fa29468eb796fe3c1421b4cb" } }, "36efa56b78d848e18fc9d8ff5248025b": { "model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
Parameters
objectivebinary:logistic
use_label_encoderTrue
base_score0.5
boostergbtree
colsample_bylevel1
colsample_bynode1
colsample_bytree1
gamma0
gpu_id-1
importance_typegain
interaction_constraints
learning_rate0.300000012
max_delta_step0
max_depth6
min_child_weight1
missingnan
monotone_constraints()
n_estimators100
n_jobs-1
num_parallel_tree1
random_state5221
reg_alpha0
reg_lambda1
scale_pos_weight1
subsample1
tree_methodauto
validate_parameters1
verbosity0
\n
", "text/plain": " Parameters\nobjective binary:logistic\nuse_label_encoder True\nbase_score 0.5\nbooster gbtree\ncolsample_bylevel 1\ncolsample_bynode 1\ncolsample_bytree 1\ngamma 0\ngpu_id -1\nimportance_type gain\ninteraction_constraints \nlearning_rate 0.300000012\nmax_delta_step 0\nmax_depth 6\nmin_child_weight 1\nmissing nan\nmonotone_constraints ()\nn_estimators 100\nn_jobs -1\nnum_parallel_tree 1\nrandom_state 5221\nreg_alpha 0\nreg_lambda 1\nscale_pos_weight 1\nsubsample 1\ntree_method auto\nvalidate_parameters 1\nverbosity 0" } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_da0fead6fe0547549f7d21c109295c78", "_model_module": "@jupyter-widgets/output" } }, "cbb0a03436964633b5fb8378022b6af0": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "389e9955fa29468eb796fe3c1421b4cb": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": 
null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "3e279ee794e54f74b1af69f76a966a31": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_1d64432c0de54747a4373d2055e990ea", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 5, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 3, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_20959362abf54f809bbc9279cfeda188" } }, "da0fead6fe0547549f7d21c109295c78": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, 
"object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "1d64432c0de54747a4373d2055e990ea": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "20959362abf54f809bbc9279cfeda188": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "738bda43761e444481ea74b6c2da8022": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_fe521331d9a64ddb94d82c0b68616d84", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_63bc1fbd946143a28334f9a2237178fd" } }, "fe521331d9a64ddb94d82c0b68616d84": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "63bc1fbd946143a28334f9a2237178fd": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "2ed584d9e8da4f5da346b1e8d581efc2": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": 
"IPY_MODEL_f46001a0e4914f3db48a84f7987d6b5b", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_33bad682059a4e12839d36d0913169a9" } }, "f46001a0e4914f3db48a84f7987d6b5b": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "33bad682059a4e12839d36d0913169a9": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } 
}, "77c8ccd8bd8f425cb99be8e58ee3d931": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_72ee822a95ed4232bdc1c1ce909333ee", "_model_module": "@jupyter-widgets/controls", "children": [ "IPY_MODEL_dde01c732630412ba04e143c691fef50", "IPY_MODEL_802bef155bd8481cbdfe9220094b971e" ] } }, "72ee822a95ed4232bdc1c1ce909333ee": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "dde01c732630412ba04e143c691fef50": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", 
"Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_940b0b4b95b547e8847918ae1d4c1ee6", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 0, "button_style": "", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_fdbb8e58e39a4ee3a4b53252a2a17dd6" } }, "802bef155bd8481cbdfe9220094b971e": { "model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
Parameters
C1.0
class_weightNone
dualFalse
fit_interceptTrue
intercept_scaling1
l1_ratioNone
max_iter1000
multi_classauto
n_jobsNone
penaltyl2
random_state5221
solverlbfgs
tol0.0001
verbose0
warm_startFalse
\n
", "text/plain": " Parameters\nC 1.0\nclass_weight None\ndual False\nfit_intercept True\nintercept_scaling 1\nl1_ratio None\nmax_iter 1000\nmulti_class auto\nn_jobs None\npenalty l2\nrandom_state 5221\nsolver lbfgs\ntol 0.0001\nverbose 0\nwarm_start False" } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_cb21cc1e1e9a415da8bca9e7ddd1afd4", "_model_module": "@jupyter-widgets/output" } }, "940b0b4b95b547e8847918ae1d4c1ee6": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "fdbb8e58e39a4ee3a4b53252a2a17dd6": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, 
"margin": null, "display": null, "left": null } }, "cb21cc1e1e9a415da8bca9e7ddd1afd4": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "fb4b36fcd06149798f6bd0ac5b92f623": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_c28813b57f4149a290aa7fcdad2213cc", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 4, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 4, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_370d6ac451114cbd9d38f3082e51cfbe" } }, "c28813b57f4149a290aa7fcdad2213cc": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", 
"description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "370d6ac451114cbd9d38f3082e51cfbe": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "666ea6b6c5e1477088874e17dc9c33b7": { "model_module": "@jupyter-widgets/controls", "model_name": "IntProgressModel", "state": { "_view_name": "ProgressView", "style": "IPY_MODEL_7175066c42e54289a5038da594728ee0", "_dom_classes": [], "description": "Processing: ", "_model_name": "IntProgressModel", "bar_style": "", "max": 7, "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "value": 7, "_view_count": null, "_view_module_version": "1.5.0", "orientation": "horizontal", "min": 0, "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_3d3e94b00fe743eb9499e640ae18a553" } }, 
"7175066c42e54289a5038da594728ee0": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "state": { "_view_name": "StyleView", "_model_name": "ProgressStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.2.0", "bar_color": null, "_model_module": "@jupyter-widgets/controls" } }, "3d3e94b00fe743eb9499e640ae18a553": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "f298fe3f4539460f892778917dca8e35": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "state": { "_view_name": "VBoxView", "_dom_classes": [ "widget-interact" ], "_model_name": "VBoxModel", "_view_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_view_count": null, "_view_module_version": "1.5.0", "box_style": "", "layout": "IPY_MODEL_3ae88fa2ea8642d88a4b44091352d1ae", "_model_module": "@jupyter-widgets/controls", 
"children": [ "IPY_MODEL_268e0463c4b44a1a9811775756d77c41", "IPY_MODEL_d434264ed45c4de8af5e31ac2901b8c4" ] } }, "3ae88fa2ea8642d88a4b44091352d1ae": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "268e0463c4b44a1a9811775756d77c41": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsModel", "state": { "_options_labels": [ "Hyperparameters", "AUC", "Confusion Matrix", "Threshold", "Precision Recall", "Prediction Error", "Class Report", "Feature Selection", "Learning Curve", "Manifold Learning", "Calibration Curve", "Validation Curve", "Dimensions", "Feature Importance", "Feature Importance (All)", "Decision Boundary", "Lift Chart", "Gain Chart", "Decision Tree" ], "_view_name": "ToggleButtonsView", "style": "IPY_MODEL_497321ff3b6849b19b7ab938133316ad", "_dom_classes": [], "description": "Plot Type:", "_model_name": "ToggleButtonsModel", "tooltips": [], "index": 0, "button_style": "", "_view_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_view_count": null, "disabled": false, "_view_module_version": "1.5.0", "icons": [ "" ], "description_tooltip": null, "_model_module": "@jupyter-widgets/controls", "layout": "IPY_MODEL_cc0fbcf2f77846f4bd1266103d07a1f7" } }, "d434264ed45c4de8af5e31ac2901b8c4": { "model_module": "@jupyter-widgets/output", "model_name": "OutputModel", "state": { "_view_name": "OutputView", "msg_id": "", "_dom_classes": [], "_model_name": "OutputModel", "outputs": [ { "output_type": "display_data", "metadata": { "tags": [] }, "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
Parameters
nan_modeMin
eval_metricLogloss
iterations1000
sampling_frequencyPerTree
leaf_estimation_methodNewton
grow_policySymmetricTree
penalties_coefficient1
boosting_typePlain
model_shrink_modeConstant
feature_border_typeGreedyLogSum
bayesian_matrix_reg0.10000000149011612
l2_leaf_reg3
random_strength1
rsm1
boost_from_averageFalse
model_size_reg0.5
subsample0.800000011920929
use_best_modelFalse
class_names[0, 1]
random_seed5221
depth6
posterior_samplingFalse
border_count254
classes_count0
auto_class_weightsNone
sparse_features_conflict_fraction0
leaf_estimation_backtrackingAnyImprovement
best_model_min_trees1
model_shrink_rate0
min_data_in_leaf1
loss_functionLogloss
learning_rate0.015974000096321106
score_functionCosine
task_typeCPU
leaf_estimation_iterations10
bootstrap_typeMVS
max_leaves64
\n
", "text/plain": " Parameters\nnan_mode Min\neval_metric Logloss\niterations 1000\nsampling_frequency PerTree\nleaf_estimation_method Newton\ngrow_policy SymmetricTree\npenalties_coefficient 1\nboosting_type Plain\nmodel_shrink_mode Constant\nfeature_border_type GreedyLogSum\nbayesian_matrix_reg 0.10000000149011612\nl2_leaf_reg 3\nrandom_strength 1\nrsm 1\nboost_from_average False\nmodel_size_reg 0.5\nsubsample 0.800000011920929\nuse_best_model False\nclass_names [0, 1]\nrandom_seed 5221\ndepth 6\nposterior_sampling False\nborder_count 254\nclasses_count 0\nauto_class_weights None\nsparse_features_conflict_fraction 0\nleaf_estimation_backtracking AnyImprovement\nbest_model_min_trees 1\nmodel_shrink_rate 0\nmin_data_in_leaf 1\nloss_function Logloss\nlearning_rate 0.015974000096321106\nscore_function Cosine\ntask_type CPU\nleaf_estimation_iterations 10\nbootstrap_type MVS\nmax_leaves 64" } ], "_view_module": "@jupyter-widgets/output", "_model_module_version": "1.0.0", "_view_count": null, "_view_module_version": "1.0.0", "layout": "IPY_MODEL_b995a9f6bf614675ac2153fc65daa3de", "_model_module": "@jupyter-widgets/output" } }, "497321ff3b6849b19b7ab938133316ad": { "model_module": "@jupyter-widgets/controls", "model_name": "ToggleButtonsStyleModel", "state": { "_view_name": "StyleView", "button_width": "", "_model_name": "ToggleButtonsStyleModel", "description_width": "", "_view_module": "@jupyter-widgets/base", "_model_module_version": "1.5.0", "_view_count": null, "font_weight": "", "_view_module_version": "1.2.0", "_model_module": "@jupyter-widgets/controls" } }, "cc0fbcf2f77846f4bd1266103d07a1f7": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": 
null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } }, "b995a9f6bf614675ac2153fc65daa3de": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "state": { "_view_name": "LayoutView", "grid_template_rows": null, "right": null, "justify_content": null, "_view_module": "@jupyter-widgets/base", "overflow": null, "_model_module_version": "1.2.0", "_view_count": null, "flex_flow": null, "width": null, "min_width": null, "border": null, "align_items": null, "bottom": null, "_model_module": "@jupyter-widgets/base", "top": null, "grid_column": null, "overflow_y": null, "overflow_x": null, "grid_auto_flow": null, "grid_area": null, "grid_template_columns": null, "flex": null, "_model_name": "LayoutModel", "justify_items": null, "grid_row": null, "max_height": null, "align_content": null, "visibility": null, "align_self": null, "height": null, "min_height": null, "padding": null, "grid_auto_rows": null, "grid_gap": null, "max_width": null, "order": null, "_view_module_version": "1.2.0", "grid_template_areas": null, "object_position": null, "object_fit": null, "grid_auto_columns": null, "margin": null, "display": null, "left": null } } } } }, "cells": [ { "cell_type": "markdown", "metadata": { "id": "TRQ197E7_GeW" }, "source": [ "**A Study on the Correlation of Weather Station Data and the Occurrence of Wet Avalanches**" ] }, { 
"cell_type": "markdown", "metadata": { "id": "iWjUyErHoy1p" }, "source": [ "# Contribution" ] }, { "cell_type": "markdown", "metadata": { "id": "BGCyS_6gpIDA" }, "source": [ "\n", "\n", "Mahad:\n", "\n", "\n", "> Mahad handled all of the practical analysis done on the data. Mahad also performed most of the data organization and machine learning done on the data.\n", "\n", "\n", "Grace: \n", "\n", "\n", "> Grace handled all of the linear and logistic regression performed on the data. Grace did assist in organizing and cleaning up the data for her own practice; however, the code used for these tasks in this notebook is Mahad's. Grace organized and prepared the notebooks for submission. Grace wrote the abstract, introduction, and other pieces of information throughout the notebook. Lastly, she helped to research details about wet avalanches as well as different methods for analyzing the data.\n", "\n", "\n", "\n", "Daniela:\n", "\n", "\n", "> Daniela communicated with the sponsors, the professor, and teammates. She set up a meeting with the sponsors and kept track of all emails and data. Daniela also recorded all information and next steps during presentations. She helped with researching PyCaret and its defaults, along with researching the methods that showed the most accuracy. She also worked on the testing and training portion, checking whether the results changed between 60:40, 70:30, and 80:20 splits.\n", "\n", "Required Files:\n", "\n", "The following xlsx files contain the data needed to run the notebook and are available in the CAIC drive folder. 
They are read in under 'Data Import and Pre-Processing'\n", "* All Wet Avalanches 2014-Present.xlsx\n", "* OriginalWeatherData.xlsx\n", "\n", "**It is important to note that all of the Machine Learning Code underneath the sub section 'Prediction Model' takes at least a minute, likely more, to run for each box of code**\n", "\n" ] }, { "cell_type": "markdown", "metadata": { "id": "O2TdhRU4qydE" }, "source": [ "# Abstract" ] }, { "cell_type": "markdown", "metadata": { "id": "mrBEngaah-RG" }, "source": [ "This report organizes and provides analysis for data provided by the Colorado Avalanche Information Center, regarding wet avalanches. Our goal was to clean and subsequently analyze the wet avalanche data recorded by CAIC as well as the corresponding weather station data in order to find any correlation between the various data points. Overall, this notebook provides a template for organizing, analyzing and predicting wet avalanches; however, the predictions could be more precise with more locations. In the future, we hope that this information can be used to study the causes of wet avalanches in order to predict when they occur. " ] }, { "cell_type": "markdown", "metadata": { "id": "yul-lpNSg75v" }, "source": [ "# Introduction" ] }, { "cell_type": "markdown", "metadata": { "id": "8inJZ_uC_T6O" }, "source": [ "\n", "The Colorado Avalanche Information Center is a program within the Colorado Department of Natural Resources that is committed to educating the public on avalanche safety as well as forecasting avalanche conditions. Currently, the CAIC employs a system that is titled '[The Avalanche Problem](https://www.avalanche.state.co.us/forecasts/help/avalanche-problems/)', which uses four characteristics (avalanche character or type, location, likelihood, and size) to determine the avalanche hazard rating throughout the mountains each day. 
\n", "\n", "Our research focuses on two of these avalanche characters, Wet Slab and Wet Loose, which we have combined into the single term 'wet avalanches' for the sake of the study. There is little research surrounding wet avalanches and their causes, so our goal was to take the weather station data and wet avalanche data recorded by the CAIC and study their correlation. We hope that the research that we have done can be used as a first step in identifying where and why wet avalanches form. \n", "\n", "At the start of our research, we relied primarily on graphics in order to visualize the status of various weather variables alongside the occurrence of wet avalanches. Time series and distribution plots were used for this portion of the research. Linear regression was used to help identify how each weather variable directly correlates to avalanche occurrence, and machine learning tools were implemented to start generating predictive modeling options for future use. " ] }, { "cell_type": "markdown", "metadata": { "id": "H5o-hqqWAB1o" }, "source": [ "# Methods" ] }, { "cell_type": "markdown", "metadata": { "id": "W6HBR_IhAmd6" }, "source": [ "There are two key pieces of data that we are using in this project, wet avalanche data and weather station data. The wet avalanche data was given to us by the CAIC team in the form of a 664 KB .csv file. We then turned it into a .xlsx file (All Wet Avalanches 2014-Present.xlsx); however, the .csv form of the file is still available in the CAIC drive folder. The SNOTEL weather station data was downloaded from the [Natural Resources Conservation Service](https://www.wcc.nrcs.usda.gov/snow/snotel-data.html) website. There are 13 SNOTEL stations that were used in this project, so the data from each station were combined into one 6 MB .xlsx file (OriginalWeatherData.xlsx). The wet avalanche data is both categorical and numerical. 
A description of each column and its units is listed below:" ] }, { "cell_type": "markdown", "metadata": { "id": "EX9nC9iuPfw8" }, "source": [ "Columns and units for 'All Wet Avalanches 2014-Present.xlsx':\n", "\n", "1. id = id \n", "2. obs_id = Observation id \n", "3. avi_hw_op_bc = Was the avalanche on a highway, within an operation (ski area) or backcountry\n", "4. avi_hw_zone_id = If highway what is the pass id (-1 = not highway)\n", "5. avi_path = Avalanche path name if known. These are mostly highway avalanche paths where the name is known.\n", "6. avi_op_name = name of operation if within an operating boundary\n", "7. avi_loc = general area of avalanche from a drop-down list\n", "8. avi_bc_zone_id = if avalanche is a backcountry avalanche which CAIC zone is it in\n", "9. avi_mark = Location within a backcountry zone if known\n", "10. avi_number = number of avalanches reported at that place and time\n", "11. avi_type = type of avalanche (WL = wet loose, WS = wet slab)\n", "12. avi_aspect = Compass aspect if known\n", "13. 
avi_elev = elevation compared to treeline can be (>TL = above treeline, TL = at treeline, \n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
idobs_idavi_hw_op_bcavi_hw_zone_idavi_pathavi_op_nameavi_locavi_bc_zone_idavi_markavi_numberavi_typeavi_aspectavi_elevavi_rsizeavi_dsizeavi_prim_trigavi_sec_trigavi_commentsavi_dateavi_date_knownavi_time_knownavi_areaavi_angle_avgavi_angle_maxavi_elevationavi_elevation_unitsavi_surfaceavi_weak_layeravi_grain_typeavi_crown_avgavi_crown_maxavi_crown_unitsavi_width_avgavi_width_maxavi_width_unitsavi_vertical_avgavi_vertical_maxavi_vertical_unitsavi_terminusavi_road_statusavi_road_depthavi_road_lengthavi_road_unitsavi_latavi_lonid.1obs_id.1avi_descrid.2zone_idlatlonutm_zoneutm_eutm_nnametitleanchorzone_orderUnnamed: 59Unnamed: 60Unnamed: 61
015118260877bc-1NaN-2NaN0-11WSNE<TLR1D1NNaNNaN3/15/2020 00:00EstimatedUnknownThe west end of Byers Canyon.38407900ftGLayerDepth Hoar68.0in3540.0ft7075.0ftNaNNaNNaNNaNft00.03925360877.0A small Wet Slab avalanche was seen in Byers C...1040.45217-106.6690113358475.000004.479283e+06Steamboat & Flat TopsSteamboat Area & Flat Topssteamboat0NaNNaNNaN
15378623807bc-1NaN-2NaN1-11WSE>TLR3D1.5ASuNaN3/9/2014 10:25KnownKnownEast-facing rollover directly below Andrew's T...353811245ftOUnknownUnknown1835.0in100110.0ft125200.0ftNaNNaNNaNNaNft00.0264223807.0My partner and I, both on backcountry skis, de...2140.14328-105.8407513428384.000004.443999e+06Front RangeFront Rangefrontrange1NaNNaNNaN
26632135489bc-1NaN-2NaN1-11WLETLR1D1ASNaNNaN4/3/2015 00:00EstimatedUnknownNaNNaNNaNNaNftNaNNaNNaNNaNNaNinNaNNaNftNaNNaNftNaNNaNNaNNaNft00.01424535489.0NaN2140.14328-105.8407513428384.000004.443999e+06Front RangeFront Rangefrontrange1NaNNaNNaN
36649336044bc-1NaN-2NaN1-11WSS>TLR2D2ASNaNNaN6/7/2015 00:00EstimatedUnknownKelso PkNaNNaNNaNftNaNNaNNaNNaNNaNin25NaNft1000NaNftNaNNaNNaNNaNft00.01478136044.0Skier triggered wet slab.2140.14328-105.8407513428384.000004.443999e+06Front RangeFront Rangefrontrange1NaNNaNNaN
47584340808bc-1NaN-2NaN1-11WLNE<TLR1D1ASNaNMt Trelease3/11/2016 00:00EstimatedUnknownNaNNaNNaNNaNftNaNNaNNaNNaNNaNinNaNNaNftNaNNaNftNaNNaNNaNNaNft00.01943640808.0Mt. trelease, N, NE aspect near the bottom of ...ran 30 ft40° slope angle. Reporting since there were n...or water being able to be sqeezed from the sn...2140.14328-1.058407e+02134283844443999Front RangeFront Rangefrontrange1.0
.............................................................................................................................................................................................
149413246756615hw15Stephen-2NaN8NaN1WLETLR3D2NNaNNaN5/11/2019 00:00KnownUnknownNaNNaNNaNNaNftNaNNaNNaNNaNNaNinNaNNaNftNaNNaNftMPOpenNaNNaNft00.03499156615.0NaN9837.53723-106.8044913340573.000004.156002e+06Southern San JuanSouthern San Juan Mountainssouthsanjuan8NaNNaNNaN
149514999060613hw16-1-2NaN8NaN1WLSE<TLR2D1AScNaN3/5/2020 00:00KnownUnknownWest of Cumbres Pass. Not a highway path.NaNNaNNaNftNaNNaNNaNNaNNaNinNaN20.0ftNaN200.0ftBPNaNNaNNaNft00.03898960613.0No recent natural avalanche activity observed ...9837.53723-106.8044913340573.000004.156002e+06Southern San JuanSouthern San Juan Mountainssouthsanjuan8NaNNaNNaN
149615522361425hw16-1-2NaN8NaN1WLNW<TLR2D1.5NNaNAvalanche date is a total guess. An drop down ...4/2/2020 00:00EstimatedUnknownCamp SlideNaNNaNNaNftGNaNNaNNaNNaNinNaNNaNftNaNNaNftMPOpenNaNNaNft00.03980161425.0NaN9837.53723-106.8044913340573.000004.156002e+06Southern San JuanSouthern San Juan Mountainssouthsanjuan8NaNNaNNaN
149715544461449hw15Andrew-2NaN8NaN1WLETLR1D1.5NNaNSlid to the ground and plunged over the cliff,...4/9/2020 00:00EstimatedUnknownIn steep rocky terrain above shot 9.NaNNaNNaNftGNaNNaNNaNNaNinNaNNaNftNaNNaNftTPOpenNaNNaNft00.03982561449.0NaN9837.53723-106.8044913340573.000004.156002e+06Southern San JuanSouthern San Juan Mountainssouthsanjuan8NaNNaNNaN
149815544561449hw15Stephen-2NaN8NaN1WLSE<TLR2D1.5NNaNNaN4/5/2020 00:00EstimatedUnknownReleased from the cliffs below the starting zone.NaNNaNNaNftINaNNaNNaNNaNinNaNNaNftNaNNaNftMPOpenNaNNaNft00.03982561449.0NaN9837.53723-106.8044913340573.000004.156002e+06Southern San JuanSouthern San Juan Mountainssouthsanjuan8NaNNaNNaN
\n", "

1499 rows × 62 columns

\n", "" ], "text/plain": [ " id obs_id avi_hw_op_bc avi_hw_zone_id avi_path avi_op_name \\\n", "0 151182 60877 bc -1 NaN -2 \n", "1 53786 23807 bc -1 NaN -2 \n", "2 66321 35489 bc -1 NaN -2 \n", "3 66493 36044 bc -1 NaN -2 \n", "4 75843 40808 bc -1 NaN -2 \n", "... ... ... ... ... ... ... \n", "1494 132467 56615 hw 15 Stephen -2 \n", "1495 149990 60613 hw 16 -1 -2 \n", "1496 155223 61425 hw 16 -1 -2 \n", "1497 155444 61449 hw 15 Andrew -2 \n", "1498 155445 61449 hw 15 Stephen -2 \n", "\n", " avi_loc avi_bc_zone_id avi_mark avi_number avi_type avi_aspect \\\n", "0 NaN 0 -1 1 WS NE \n", "1 NaN 1 -1 1 WS E \n", "2 NaN 1 -1 1 WL E \n", "3 NaN 1 -1 1 WS S \n", "4 NaN 1 -1 1 WL NE \n", "... ... ... ... ... ... ... \n", "1494 NaN 8 NaN 1 WL E \n", "1495 NaN 8 NaN 1 WL SE \n", "1496 NaN 8 NaN 1 WL NW \n", "1497 NaN 8 NaN 1 WL E \n", "1498 NaN 8 NaN 1 WL SE \n", "\n", " avi_elev avi_rsize avi_dsize avi_prim_trig avi_sec_trig \\\n", "0 TL R3 D1.5 AS u \n", "2 TL R1 D1 AS NaN \n", "3 >TL R2 D2 AS NaN \n", "4 \n", "RangeIndex: 1499 entries, 0 to 1498\n", "Data columns (total 62 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 id 1499 non-null int64 \n", " 1 obs_id 1499 non-null int64 \n", " 2 avi_hw_op_bc 1499 non-null object \n", " 3 avi_hw_zone_id 1499 non-null int64 \n", " 4 avi_path 335 non-null object \n", " 5 avi_op_name 1499 non-null object \n", " 6 avi_loc 1 non-null object \n", " 7 avi_bc_zone_id 1499 non-null int64 \n", " 8 avi_mark 847 non-null object \n", " 9 avi_number 1499 non-null int64 \n", " 10 avi_type 1499 non-null object \n", " 11 avi_aspect 1461 non-null object \n", " 12 avi_elev 1468 non-null object \n", " 13 avi_rsize 1334 non-null object \n", " 14 avi_dsize 1460 non-null object \n", " 15 avi_prim_trig 1452 non-null object \n", " 16 avi_sec_trig 216 non-null object \n", " 17 avi_comments 584 non-null object \n", " 18 avi_date 1499 non-null object \n", " 19 avi_date_known 1499 non-null object \n", " 20 
avi_time_known 1499 non-null object \n", " 21 avi_area 1021 non-null object \n", " 22 avi_angle_avg 163 non-null object \n", " 23 avi_angle_max 139 non-null object \n", " 24 avi_elevation 431 non-null object \n", " 25 avi_elevation_units 1496 non-null object \n", " 26 avi_surface 455 non-null object \n", " 27 avi_weak_layer 170 non-null object \n", " 28 avi_grain_type 165 non-null object \n", " 29 avi_crown_avg 156 non-null object \n", " 30 avi_crown_max 106 non-null float64\n", " 31 avi_crown_units 1495 non-null object \n", " 32 avi_width_avg 247 non-null object \n", " 33 avi_width_max 225 non-null float64\n", " 34 avi_width_units 1496 non-null object \n", " 35 avi_vertical_avg 326 non-null object \n", " 36 avi_vertical_max 257 non-null float64\n", " 37 avi_vertical_units 1497 non-null object \n", " 38 avi_terminus 195 non-null object \n", " 39 avi_road_status 273 non-null object \n", " 40 avi_road_depth 150 non-null object \n", " 41 avi_road_length 148 non-null float64\n", " 42 avi_road_units 1495 non-null object \n", " 43 avi_lat 1496 non-null object \n", " 44 avi_lon 1496 non-null float64\n", " 45 id.1 1497 non-null object \n", " 46 obs_id.1 1497 non-null float64\n", " 47 avi_descr 835 non-null object \n", " 48 id.2 1493 non-null object \n", " 49 zone_id 1495 non-null object \n", " 50 lat 1493 non-null object \n", " 51 lon 1494 non-null object \n", " 52 utm_zone 1494 non-null object \n", " 53 utm_e 1493 non-null float64\n", " 54 utm_n 1493 non-null float64\n", " 55 name 1493 non-null object \n", " 56 title 1493 non-null object \n", " 57 anchor 1493 non-null object \n", " 58 zone_order 1493 non-null object \n", " 59 Unnamed: 59 13 non-null object \n", " 60 Unnamed: 60 8 non-null object \n", " 61 Unnamed: 61 2 non-null float64\n", "dtypes: float64(9), int64(5), object(48)\n", "memory usage: 726.2+ KB\n" ], "name": "stdout" } ] }, { "cell_type": "code", "metadata": { "id": "VNpI6i5pDnFa" }, "source": [ "# Adjust variables types \n", "\n", 
"# Parse the dates (unparseable values become NaT) and drop the time-of-day part.\n", "# .dt.normalize() keeps the datetime64[ns] dtype; the earlier\n", "# .dt.date.astype('datetime64') cast to a unit-less dtype, which pandas >= 2.0 rejects.\n", "DataAvalanches['avi_date'] = pd.to_datetime(DataAvalanches['avi_date'], errors='coerce').dt.normalize()\n", "\n", "# Create categorical variable to sign avalanche: every record in this dataset is an avalanche\n", "\n", "DataAvalanches['Avalanche'] = 'Yes'" ], "execution_count": null, "outputs": [] }, { "cell_type": "code", "metadata": { "id": "dZgaCPN2ZaF4", "colab": { "base_uri": "https://localhost:8080/", "height": 564 }, "outputId": "a494caaa-b08d-483f-e355-ca815deb5a90" }, "source": [ "# Check result\n", "\n", "DataAvalanches.head()" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
idobs_idavi_hw_op_bcavi_hw_zone_idavi_pathavi_op_nameavi_locavi_bc_zone_idavi_markavi_numberavi_typeavi_aspectavi_elevavi_rsizeavi_dsizeavi_prim_trigavi_sec_trigavi_commentsavi_dateavi_date_knownavi_time_knownavi_areaavi_angle_avgavi_angle_maxavi_elevationavi_elevation_unitsavi_surfaceavi_weak_layeravi_grain_typeavi_crown_avgavi_crown_maxavi_crown_unitsavi_width_avgavi_width_maxavi_width_unitsavi_vertical_avgavi_vertical_maxavi_vertical_unitsavi_terminusavi_road_statusavi_road_depthavi_road_lengthavi_road_unitsavi_latavi_lonid.1obs_id.1avi_descrid.2zone_idlatlonutm_zoneutm_eutm_nnametitleanchorzone_orderUnnamed: 59Unnamed: 60Unnamed: 61Avalanche
015118260877bc-1NaN-2NaN0-11WSNE<TLR1D1NNaNNaN2020-03-15EstimatedUnknownThe west end of Byers Canyon.38407900ftGLayerDepth Hoar68.0in3540.0ft7075.0ftNaNNaNNaNNaNft00.03925360877.0A small Wet Slab avalanche was seen in Byers C...1040.45217-106.6690113358475.000004.479283e+06Steamboat & Flat TopsSteamboat Area & Flat Topssteamboat0NaNNaNNaNYes
15378623807bc-1NaN-2NaN1-11WSE>TLR3D1.5ASuNaN2014-03-09KnownKnownEast-facing rollover directly below Andrew's T...353811245ftOUnknownUnknown1835.0in100110.0ft125200.0ftNaNNaNNaNNaNft00.0264223807.0My partner and I, both on backcountry skis, de...2140.14328-105.8407513428384.000004.443999e+06Front RangeFront Rangefrontrange1NaNNaNNaNYes
26632135489bc-1NaN-2NaN1-11WLETLR1D1ASNaNNaN2015-04-03EstimatedUnknownNaNNaNNaNNaNftNaNNaNNaNNaNNaNinNaNNaNftNaNNaNftNaNNaNNaNNaNft00.01424535489.0NaN2140.14328-105.8407513428384.000004.443999e+06Front RangeFront Rangefrontrange1NaNNaNNaNYes
36649336044bc-1NaN-2NaN1-11WSS>TLR2D2ASNaNNaN2015-06-07EstimatedUnknownKelso PkNaNNaNNaNftNaNNaNNaNNaNNaNin25NaNft1000NaNftNaNNaNNaNNaNft00.01478136044.0Skier triggered wet slab.2140.14328-105.8407513428384.000004.443999e+06Front RangeFront Rangefrontrange1NaNNaNNaNYes
47584340808bc-1NaN-2NaN1-11WLNE<TLR1D1ASNaNMt Trelease2016-03-11EstimatedUnknownNaNNaNNaNNaNftNaNNaNNaNNaNNaNinNaNNaNftNaNNaNftNaNNaNNaNNaNft00.01943640808.0Mt. trelease, N, NE aspect near the bottom of ...ran 30 ft40° slope angle. Reporting since there were n...or water being able to be sqeezed from the sn...2140.14328-1.058407e+02134283844443999Front RangeFront Rangefrontrange1.0Yes
\n", "
" ], "text/plain": [ " id obs_id avi_hw_op_bc avi_hw_zone_id avi_path avi_op_name avi_loc \\\n", "0 151182 60877 bc -1 NaN -2 NaN \n", "1 53786 23807 bc -1 NaN -2 NaN \n", "2 66321 35489 bc -1 NaN -2 NaN \n", "3 66493 36044 bc -1 NaN -2 NaN \n", "4 75843 40808 bc -1 NaN -2 NaN \n", "\n", " avi_bc_zone_id avi_mark avi_number avi_type avi_aspect avi_elev avi_rsize \\\n", "0 0 -1 1 WS NE TL R3 \n", "2 1 -1 1 WL E TL R1 \n", "3 1 -1 1 WS S >TL R2 \n", "4 1 -1 1 WL NE \n", "RangeIndex: 1499 entries, 0 to 1498\n", "Data columns (total 63 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 id 1499 non-null int64 \n", " 1 obs_id 1499 non-null int64 \n", " 2 avi_hw_op_bc 1499 non-null object \n", " 3 avi_hw_zone_id 1499 non-null int64 \n", " 4 avi_path 335 non-null object \n", " 5 avi_op_name 1499 non-null object \n", " 6 avi_loc 1 non-null object \n", " 7 avi_bc_zone_id 1499 non-null int64 \n", " 8 avi_mark 847 non-null object \n", " 9 avi_number 1499 non-null int64 \n", " 10 avi_type 1499 non-null object \n", " 11 avi_aspect 1461 non-null object \n", " 12 avi_elev 1468 non-null object \n", " 13 avi_rsize 1334 non-null object \n", " 14 avi_dsize 1460 non-null object \n", " 15 avi_prim_trig 1452 non-null object \n", " 16 avi_sec_trig 216 non-null object \n", " 17 avi_comments 584 non-null object \n", " 18 avi_date 1498 non-null datetime64[ns]\n", " 19 avi_date_known 1499 non-null object \n", " 20 avi_time_known 1499 non-null object \n", " 21 avi_area 1021 non-null object \n", " 22 avi_angle_avg 163 non-null object \n", " 23 avi_angle_max 139 non-null object \n", " 24 avi_elevation 431 non-null object \n", " 25 avi_elevation_units 1496 non-null object \n", " 26 avi_surface 455 non-null object \n", " 27 avi_weak_layer 170 non-null object \n", " 28 avi_grain_type 165 non-null object \n", " 29 avi_crown_avg 156 non-null object \n", " 30 avi_crown_max 106 non-null float64 \n", " 31 avi_crown_units 1495 non-null object \n", " 32 
avi_width_avg 247 non-null object \n", " 33 avi_width_max 225 non-null float64 \n", " 34 avi_width_units 1496 non-null object \n", " 35 avi_vertical_avg 326 non-null object \n", " 36 avi_vertical_max 257 non-null float64 \n", " 37 avi_vertical_units 1497 non-null object \n", " 38 avi_terminus 195 non-null object \n", " 39 avi_road_status 273 non-null object \n", " 40 avi_road_depth 150 non-null object \n", " 41 avi_road_length 148 non-null float64 \n", " 42 avi_road_units 1495 non-null object \n", " 43 avi_lat 1496 non-null object \n", " 44 avi_lon 1496 non-null float64 \n", " 45 id.1 1497 non-null object \n", " 46 obs_id.1 1497 non-null float64 \n", " 47 avi_descr 835 non-null object \n", " 48 id.2 1493 non-null object \n", " 49 zone_id 1495 non-null object \n", " 50 lat 1493 non-null object \n", " 51 lon 1494 non-null object \n", " 52 utm_zone 1494 non-null object \n", " 53 utm_e 1493 non-null float64 \n", " 54 utm_n 1493 non-null float64 \n", " 55 name 1493 non-null object \n", " 56 title 1493 non-null object \n", " 57 anchor 1493 non-null object \n", " 58 zone_order 1493 non-null object \n", " 59 Unnamed: 59 13 non-null object \n", " 60 Unnamed: 60 8 non-null object \n", " 61 Unnamed: 61 2 non-null float64 \n", " 62 Avalanche 1499 non-null object \n", "dtypes: datetime64[ns](1), float64(9), int64(5), object(48)\n", "memory usage: 737.9+ KB\n" ], "name": "stdout" } ] }, { "cell_type": "markdown", "metadata": { "id": "CEPLFb46r7gI" }, "source": [ "With that part done, it is time to move for the pre-processing of the weather dataset. The first step is to combine the data from all the different tabs into a single dataset." 
] }, { "cell_type": "code", "metadata": { "id": "2hujg5pk_f9L", "colab": { "base_uri": "https://localhost:8080/", "height": 793 }, "outputId": "bf137b5e-b5d8-41c8-e166-ab8a4bb8b2b8" }, "source": [ "# Combine weather data from different stations into a single dataframe.\n", "# The concat keys land in index level 0, which is surfaced as the 'Location' column;\n", "# the per-frame row index (level 1) is discarded.\n", "\n", "CombinedDataWeather = (\n", "    pd.concat(DataWeather, keys=DataWeather.keys())\n", "    .reset_index()\n", "    .drop(columns='level_1')\n", "    .rename(columns={'level_0': 'Location'})\n", ")\n", "\n", "CombinedDataWeather" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
LocationDateSnow Water Equivalent (in) Start of Day ValuesPrecipitation Accumulation (in) Start of Day ValuesAir Temperature Maximum (degF)Air Temperature Minimum (degF)Air Temperature Average (degF)Precipitation Increment (in)
0Berthoud Pass1978-10-010.00.0NaNNaNNaN0.0
1Berthoud Pass1978-10-020.00.0NaNNaNNaN0.0
2Berthoud Pass1978-10-030.00.0NaNNaNNaN0.0
3Berthoud Pass1978-10-040.00.0NaNNaNNaN0.2
4Berthoud Pass1978-10-050.00.2NaNNaNNaN0.0
...........................
174871Wolf Creek pass Snotel2020-10-030.0NaN60.041.049.0NaN
174872Wolf Creek pass Snotel2020-10-040.00.059.038.048.00.0
174873Wolf Creek pass Snotel2020-10-050.00.062.042.051.00.0
174874Wolf Creek pass Snotel2020-10-060.00.062.044.052.00.0
174875Wolf Creek pass Snotel2020-10-070.00.0NaNNaNNaNNaN
\n", "

174876 rows × 8 columns

\n", "
" ], "text/plain": [ " Location Date \\\n", "0 Berthoud Pass 1978-10-01 \n", "1 Berthoud Pass 1978-10-02 \n", "2 Berthoud Pass 1978-10-03 \n", "3 Berthoud Pass 1978-10-04 \n", "4 Berthoud Pass 1978-10-05 \n", "... ... ... \n", "174871 Wolf Creek pass Snotel 2020-10-03 \n", "174872 Wolf Creek pass Snotel 2020-10-04 \n", "174873 Wolf Creek pass Snotel 2020-10-05 \n", "174874 Wolf Creek pass Snotel 2020-10-06 \n", "174875 Wolf Creek pass Snotel 2020-10-07 \n", "\n", " Snow Water Equivalent (in) Start of Day Values \\\n", "0 0.0 \n", "1 0.0 \n", "2 0.0 \n", "3 0.0 \n", "4 0.0 \n", "... ... \n", "174871 0.0 \n", "174872 0.0 \n", "174873 0.0 \n", "174874 0.0 \n", "174875 0.0 \n", "\n", " Precipitation Accumulation (in) Start of Day Values \\\n", "0 0.0 \n", "1 0.0 \n", "2 0.0 \n", "3 0.0 \n", "4 0.2 \n", "... ... \n", "174871 NaN \n", "174872 0.0 \n", "174873 0.0 \n", "174874 0.0 \n", "174875 0.0 \n", "\n", " Air Temperature Maximum (degF) Air Temperature Minimum (degF) \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "... ... ... \n", "174871 60.0 41.0 \n", "174872 59.0 38.0 \n", "174873 62.0 42.0 \n", "174874 62.0 44.0 \n", "174875 NaN NaN \n", "\n", " Air Temperature Average (degF) Precipitation Increment (in) \n", "0 NaN 0.0 \n", "1 NaN 0.0 \n", "2 NaN 0.0 \n", "3 NaN 0.2 \n", "4 NaN 0.0 \n", "... ... ... \n", "174871 49.0 NaN \n", "174872 48.0 0.0 \n", "174873 51.0 0.0 \n", "174874 52.0 0.0 \n", "174875 NaN NaN \n", "\n", "[174876 rows x 8 columns]" ] }, "metadata": { "tags": [] }, "execution_count": 12 } ] }, { "cell_type": "markdown", "metadata": { "id": "On8sB-1TsGa_" }, "source": [ "We can see now that all the stations have their data properly labeled into a unique dataset." 
] }, { "cell_type": "code", "metadata": { "id": "MtsrLrSgFPK_", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "0e288c6f-a257-4a13-9062-02b6e6ff50ed" }, "source": [ "# Get information about the dataframe\n", "\n", "CombinedDataWeather.info()" ], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "\n", "RangeIndex: 174876 entries, 0 to 174875\n", "Data columns (total 8 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 Location 174876 non-null object \n", " 1 Date 174876 non-null object \n", " 2 Snow Water Equivalent (in) Start of Day Values 173843 non-null float64\n", " 3 Precipitation Accumulation (in) Start of Day Values 173798 non-null float64\n", " 4 Air Temperature Maximum (degF) 159835 non-null float64\n", " 5 Air Temperature Minimum (degF) 159788 non-null float64\n", " 6 Air Temperature Average (degF) 160247 non-null float64\n", " 7 Precipitation Increment (in) 173777 non-null float64\n", "dtypes: float64(6), object(2)\n", "memory usage: 10.7+ MB\n" ], "name": "stdout" } ] }, { "cell_type": "markdown", "metadata": { "id": "ZeW9LMN0sODl" }, "source": [ "As it was done with the avalanches data, we also need to change the date variable to datetime format." 
] }, { "cell_type": "code", "metadata": { "id": "KrkAz30GFeBg", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "94378459-df51-456f-cbe6-da25ed9c1f9d" }, "source": [ "# Adjust variables types: cast the Date column to datetime64\n", "\n", "CombinedDataWeather = CombinedDataWeather.assign(\n", "    Date=lambda frame: pd.to_datetime(frame['Date'])\n", ")\n", "\n", "CombinedDataWeather.info()" ], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "\n", "RangeIndex: 174876 entries, 0 to 174875\n", "Data columns (total 8 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 Location 174876 non-null object \n", " 1 Date 174876 non-null datetime64[ns]\n", " 2 Snow Water Equivalent (in) Start of Day Values 173843 non-null float64 \n", " 3 Precipitation Accumulation (in) Start of Day Values 173798 non-null float64 \n", " 4 Air Temperature Maximum (degF) 159835 non-null float64 \n", " 5 Air Temperature Minimum (degF) 159788 non-null float64 \n", " 6 Air Temperature Average (degF) 160247 non-null float64 \n", " 7 Precipitation Increment (in) 173777 non-null float64 \n", "dtypes: datetime64[ns](1), float64(6), object(1)\n", "memory usage: 10.7+ MB\n" ], "name": "stdout" } ] }, { "cell_type": "code", "metadata": { "id": "K3JXXea5OGNl", "colab": { "base_uri": "https://localhost:8080/", "height": 793 }, "outputId": "0082981b-8353-4aab-cc49-c602a765eb2a" }, "source": [ "CombinedDataWeather" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
LocationDateSnow Water Equivalent (in) Start of Day ValuesPrecipitation Accumulation (in) Start of Day ValuesAir Temperature Maximum (degF)Air Temperature Minimum (degF)Air Temperature Average (degF)Precipitation Increment (in)
0Berthoud Pass1978-10-010.00.0NaNNaNNaN0.0
1Berthoud Pass1978-10-020.00.0NaNNaNNaN0.0
2Berthoud Pass1978-10-030.00.0NaNNaNNaN0.0
3Berthoud Pass1978-10-040.00.0NaNNaNNaN0.2
4Berthoud Pass1978-10-050.00.2NaNNaNNaN0.0
...........................
174871Wolf Creek pass Snotel2020-10-030.0NaN60.041.049.0NaN
174872Wolf Creek pass Snotel2020-10-040.00.059.038.048.00.0
174873Wolf Creek pass Snotel2020-10-050.00.062.042.051.00.0
174874Wolf Creek pass Snotel2020-10-060.00.062.044.052.00.0
174875Wolf Creek pass Snotel2020-10-070.00.0NaNNaNNaNNaN
\n", "

174876 rows × 8 columns

\n", "
" ], "text/plain": [ " Location Date \\\n", "0 Berthoud Pass 1978-10-01 \n", "1 Berthoud Pass 1978-10-02 \n", "2 Berthoud Pass 1978-10-03 \n", "3 Berthoud Pass 1978-10-04 \n", "4 Berthoud Pass 1978-10-05 \n", "... ... ... \n", "174871 Wolf Creek pass Snotel 2020-10-03 \n", "174872 Wolf Creek pass Snotel 2020-10-04 \n", "174873 Wolf Creek pass Snotel 2020-10-05 \n", "174874 Wolf Creek pass Snotel 2020-10-06 \n", "174875 Wolf Creek pass Snotel 2020-10-07 \n", "\n", " Snow Water Equivalent (in) Start of Day Values \\\n", "0 0.0 \n", "1 0.0 \n", "2 0.0 \n", "3 0.0 \n", "4 0.0 \n", "... ... \n", "174871 0.0 \n", "174872 0.0 \n", "174873 0.0 \n", "174874 0.0 \n", "174875 0.0 \n", "\n", " Precipitation Accumulation (in) Start of Day Values \\\n", "0 0.0 \n", "1 0.0 \n", "2 0.0 \n", "3 0.0 \n", "4 0.2 \n", "... ... \n", "174871 NaN \n", "174872 0.0 \n", "174873 0.0 \n", "174874 0.0 \n", "174875 0.0 \n", "\n", " Air Temperature Maximum (degF) Air Temperature Minimum (degF) \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "... ... ... \n", "174871 60.0 41.0 \n", "174872 59.0 38.0 \n", "174873 62.0 42.0 \n", "174874 62.0 44.0 \n", "174875 NaN NaN \n", "\n", " Air Temperature Average (degF) Precipitation Increment (in) \n", "0 NaN 0.0 \n", "1 NaN 0.0 \n", "2 NaN 0.0 \n", "3 NaN 0.2 \n", "4 NaN 0.0 \n", "... ... ... \n", "174871 49.0 NaN \n", "174872 48.0 0.0 \n", "174873 51.0 0.0 \n", "174874 52.0 0.0 \n", "174875 NaN NaN \n", "\n", "[174876 rows x 8 columns]" ] }, "metadata": { "tags": [] }, "execution_count": 15 } ] }, { "cell_type": "markdown", "metadata": { "id": "CytvevGSt8aH" }, "source": [ "In this notebook we will average the weather data by date." 
] }, { "cell_type": "code", "metadata": { "id": "sNHBcIGKJ5-V", "colab": { "base_uri": "https://localhost:8080/", "height": 606 }, "outputId": "39a3b9a2-a0bd-44af-dec6-972d28577db1" }, "source": [ "# Average every numeric measurement over all stations for each date.\n", "# numeric_only=True leaves the text 'Location' column out explicitly; pandas >= 2.0\n", "# raises a TypeError when asked to average a non-numeric column.\n", "AveragedDataWeather = (\n", "    CombinedDataWeather\n", "    .groupby('Date')\n", "    .mean(numeric_only=True)\n", "    .reset_index()\n", ")\n", "\n", "AveragedDataWeather" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
DateSnow Water Equivalent (in) Start of Day ValuesPrecipitation Accumulation (in) Start of Day ValuesAir Temperature Maximum (degF)Air Temperature Minimum (degF)Air Temperature Average (degF)Precipitation Increment (in)
01978-10-010.0000000.000000NaNNaNNaN0.000000
11978-10-020.0000000.000000NaNNaNNaN0.000000
21978-10-030.0000000.000000NaNNaNNaN0.000000
31978-10-040.0000000.000000NaNNaNNaN0.100000
41978-10-050.0000000.100000NaNNaNNaN0.000000
........................
153432020-10-030.0230770.00833358.00000033.69230843.8461540.000000
153442020-10-040.0307690.00769261.00000034.00000045.8461540.008333
153452020-10-050.0307690.01666760.92307735.76923146.3076920.000000
153462020-10-060.1076920.00833364.61538535.84615447.9230770.009091
153472020-10-070.0923080.018182NaNNaNNaNNaN
\n", "

15348 rows × 7 columns

\n", "
" ], "text/plain": [ " Date Snow Water Equivalent (in) Start of Day Values \\\n", "0 1978-10-01 0.000000 \n", "1 1978-10-02 0.000000 \n", "2 1978-10-03 0.000000 \n", "3 1978-10-04 0.000000 \n", "4 1978-10-05 0.000000 \n", "... ... ... \n", "15343 2020-10-03 0.023077 \n", "15344 2020-10-04 0.030769 \n", "15345 2020-10-05 0.030769 \n", "15346 2020-10-06 0.107692 \n", "15347 2020-10-07 0.092308 \n", "\n", " Precipitation Accumulation (in) Start of Day Values \\\n", "0 0.000000 \n", "1 0.000000 \n", "2 0.000000 \n", "3 0.000000 \n", "4 0.100000 \n", "... ... \n", "15343 0.008333 \n", "15344 0.007692 \n", "15345 0.016667 \n", "15346 0.008333 \n", "15347 0.018182 \n", "\n", " Air Temperature Maximum (degF) Air Temperature Minimum (degF) \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "... ... ... \n", "15343 58.000000 33.692308 \n", "15344 61.000000 34.000000 \n", "15345 60.923077 35.769231 \n", "15346 64.615385 35.846154 \n", "15347 NaN NaN \n", "\n", " Air Temperature Average (degF) Precipitation Increment (in) \n", "0 NaN 0.000000 \n", "1 NaN 0.000000 \n", "2 NaN 0.000000 \n", "3 NaN 0.100000 \n", "4 NaN 0.000000 \n", "... ... ... \n", "15343 43.846154 0.000000 \n", "15344 45.846154 0.008333 \n", "15345 46.307692 0.000000 \n", "15346 47.923077 0.009091 \n", "15347 NaN NaN \n", "\n", "[15348 rows x 7 columns]" ] }, "metadata": { "tags": [] }, "execution_count": 16 } ] }, { "cell_type": "markdown", "metadata": { "id": "ta1onB3qKZ8v" }, "source": [ "The grouping was successfully made so now we will merge that information in the avalanches dataset by using Date as the primary key to connect the datasets." 
] }, { "cell_type": "code", "metadata": { "id": "I4OzjxAiOVIs", "colab": { "base_uri": "https://localhost:8080/", "height": 677 }, "outputId": "d52209a6-3242-412a-f304-5e37fafe5950" }, "source": [ "# Merge Avalanches DataFrame with Weather DataFrame\n", "#\n", "# Outer join on the date: weather days without an avalanche and avalanche records\n", "# without a weather day are both kept (the unmatched side is filled with NaN/NaT).\n", "# validate='many_to_one' asserts that every date occurs only once in the averaged\n", "# weather table, so the join cannot silently duplicate avalanche records.\n", "\n", "FullData = (\n", "    DataAvalanches[['avi_mark', 'avi_date', 'Avalanche', 'avi_number', 'avi_type']]\n", "    .merge(\n", "        AveragedDataWeather,\n", "        how='outer',\n", "        left_on='avi_date',\n", "        right_on='Date',\n", "        validate='many_to_one',\n", "    )\n", "    .sort_values(by='Date')  # rows without a weather Date (NaT) sort last\n", ")\n", "\n", "FullData" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
avi_markavi_dateAvalancheavi_numberavi_typeDateSnow Water Equivalent (in) Start of Day ValuesPrecipitation Accumulation (in) Start of Day ValuesAir Temperature Maximum (degF)Air Temperature Minimum (degF)Air Temperature Average (degF)Precipitation Increment (in)
1499NaNNaTNaNNaNNaN1978-10-010.0000000.000000NaNNaNNaN0.000000
1500NaNNaTNaNNaNNaN1978-10-020.0000000.000000NaNNaNNaN0.000000
1501NaNNaTNaNNaNNaN1978-10-030.0000000.000000NaNNaNNaN0.000000
1502NaNNaTNaNNaNNaN1978-10-040.0000000.000000NaNNaNNaN0.100000
1503NaNNaTNaNNaNNaN1978-10-050.0000000.100000NaNNaNNaN0.000000
.......................................
16369NaNNaTNaNNaNNaN2020-10-060.1076920.00833364.61538535.84615447.9230770.009091
16370NaNNaTNaNNaNNaN2020-10-070.0923080.018182NaNNaNNaNNaN
985Hoosier PassNaTYes1.0WSNaTNaNNaNNaNNaNNaNNaN
1001Independence Pass-East side1970-01-01Yes1.0WLNaTNaNNaNNaNNaNNaNNaN
1002NaN1970-01-01Yes1.0WSNaTNaNNaNNaNNaNNaNNaN
\n", "

16371 rows × 12 columns

\n", "
" ], "text/plain": [ " avi_mark avi_date Avalanche avi_number avi_type \\\n", "1499 NaN NaT NaN NaN NaN \n", "1500 NaN NaT NaN NaN NaN \n", "1501 NaN NaT NaN NaN NaN \n", "1502 NaN NaT NaN NaN NaN \n", "1503 NaN NaT NaN NaN NaN \n", "... ... ... ... ... ... \n", "16369 NaN NaT NaN NaN NaN \n", "16370 NaN NaT NaN NaN NaN \n", "985 Hoosier Pass NaT Yes 1.0 WS \n", "1001 Independence Pass-East side 1970-01-01 Yes 1.0 WL \n", "1002 NaN 1970-01-01 Yes 1.0 WS \n", "\n", " Date Snow Water Equivalent (in) Start of Day Values \\\n", "1499 1978-10-01 0.000000 \n", "1500 1978-10-02 0.000000 \n", "1501 1978-10-03 0.000000 \n", "1502 1978-10-04 0.000000 \n", "1503 1978-10-05 0.000000 \n", "... ... ... \n", "16369 2020-10-06 0.107692 \n", "16370 2020-10-07 0.092308 \n", "985 NaT NaN \n", "1001 NaT NaN \n", "1002 NaT NaN \n", "\n", " Precipitation Accumulation (in) Start of Day Values \\\n", "1499 0.000000 \n", "1500 0.000000 \n", "1501 0.000000 \n", "1502 0.000000 \n", "1503 0.100000 \n", "... ... \n", "16369 0.008333 \n", "16370 0.018182 \n", "985 NaN \n", "1001 NaN \n", "1002 NaN \n", "\n", " Air Temperature Maximum (degF) Air Temperature Minimum (degF) \\\n", "1499 NaN NaN \n", "1500 NaN NaN \n", "1501 NaN NaN \n", "1502 NaN NaN \n", "1503 NaN NaN \n", "... ... ... \n", "16369 64.615385 35.846154 \n", "16370 NaN NaN \n", "985 NaN NaN \n", "1001 NaN NaN \n", "1002 NaN NaN \n", "\n", " Air Temperature Average (degF) Precipitation Increment (in) \n", "1499 NaN 0.000000 \n", "1500 NaN 0.000000 \n", "1501 NaN 0.000000 \n", "1502 NaN 0.100000 \n", "1503 NaN 0.000000 \n", "... ... ... 
\n", "16369 47.923077 0.009091 \n", "16370 NaN NaN \n", "985 NaN NaN \n", "1001 NaN NaN \n", "1002 NaN NaN \n", "\n", "[16371 rows x 12 columns]" ] }, "metadata": { "tags": [] }, "execution_count": 17 } ] }, { "cell_type": "markdown", "metadata": { "id": "hLwYFKBmuFlk" }, "source": [ "We can see that the new dataset appended the avalanches columns that we selected into the dataset of weather measurements. Since all occurrences of avalanches are identified with an `Yes` in the column `Avalanche` we can fill the rows with missing data with a `No`, to identify that there was not an avalanche in that date/location. Also we fill missing values with zero in the column of avalanche numbers, for the same reason." ] }, { "cell_type": "code", "metadata": { "id": "Zsg6LYohZQuF", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "ee978618-a9eb-427b-8f49-206992425921" }, "source": [ "# Fill null values of avalanche numbers and categorical\n", "#\n", "# The filled frame is assigned back instead of calling fillna(..., inplace=True) on\n", "# FullData['col']: that form acts on an intermediate Series (chained assignment),\n", "# which pandas warns about and which does not update FullData under copy-on-write.\n", "\n", "FullData = FullData.fillna({'Avalanche': 'No', 'avi_number': 0})\n", "\n", "# Check information about merged dataset\n", "\n", "FullData.info()" ], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "\n", "Int64Index: 16371 entries, 1499 to 1002\n", "Data columns (total 12 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 avi_mark 847 non-null object \n", " 1 avi_date 1498 non-null datetime64[ns]\n", " 2 Avalanche 16371 non-null object \n", " 3 avi_number 16371 non-null float64 \n", " 4 avi_type 1499 non-null object \n", " 5 Date 16368 non-null datetime64[ns]\n", " 6 Snow Water Equivalent (in) Start of Day Values 16368 non-null float64 \n", " 7 Precipitation Accumulation (in) Start of Day Values 16368 non-null float64 \n", " 8 Air Temperature Maximum (degF) 15652 non-null float64 \n", " 9 Air Temperature Minimum (degF) 15649 non-null float64 \n", " 10 Air Temperature Average (degF) 15652 non-null float64 \n", " 11 
Precipitation Increment (in) 16367 non-null float64 \n", "dtypes: datetime64[ns](2), float64(7), object(3)\n", "memory usage: 1.6+ MB\n" ], "name": "stdout" } ] }, { "cell_type": "markdown", "metadata": { "id": "iawByAnFukch" }, "source": [ "In the table above we can see that all 1499 avalanche records are present in the merged dataset, but only 16368 of its 16371 rows have a weather `Date`.\n", "\n", "Three avalanche entries could not be matched to a weather record (one has no date assigned and two are dated 1970-01-01, before the weather records begin), so we will delete those entries to avoid issues in analyzing the data." ] }, { "cell_type": "code", "metadata": { "id": "cD2Up8WjMn2B", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "727b8579-3d3e-4a36-e818-1ec8c82b57ac" }, "source": [ "FullData.dropna(subset=['Date'], inplace=True)\n", "\n", "FullData.info()" ], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "\n", "Int64Index: 16368 entries, 1499 to 16370\n", "Data columns (total 12 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 avi_mark 845 non-null object \n", " 1 avi_date 1496 non-null datetime64[ns]\n", " 2 Avalanche 16368 non-null object \n", " 3 avi_number 16368 non-null float64 \n", " 4 avi_type 1496 non-null object \n", " 5 Date 16368 non-null datetime64[ns]\n", " 6 Snow Water Equivalent (in) Start of Day Values 16368 non-null float64 \n", " 7 Precipitation Accumulation (in) Start of Day Values 16368 non-null float64 \n", " 8 Air Temperature Maximum (degF) 15652 non-null float64 \n", " 9 Air Temperature Minimum (degF) 15649 non-null float64 \n", " 10 Air Temperature Average (degF) 15652 non-null float64 \n", " 11 Precipitation Increment (in) 16367 non-null float64 \n", "dtypes: datetime64[ns](2), float64(7), object(3)\n", "memory usage: 1.6+ MB\n" ], "name": "stdout" } ] }, { "cell_type": "markdown", "metadata": { "id": "6TQe7zbQdFd_" }, "source": [ "Since the dataset is very unbalanced we can remove all data before 2014, since we don't have information about 
avalanches prior to that.\n", "\n" ] }, { "cell_type": "code", "metadata": { "id": "rWHAs8fYfPb2", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "6c0cab7d-365a-4cfa-a49a-cf10d4c9a94b" }, "source": [ "FullData = FullData[FullData['Date'].dt.year >= 2014]\n", "\n", "FullData.info()" ], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "\n", "Int64Index: 3492 entries, 14375 to 16370\n", "Data columns (total 12 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 avi_mark 845 non-null object \n", " 1 avi_date 1496 non-null datetime64[ns]\n", " 2 Avalanche 3492 non-null object \n", " 3 avi_number 3492 non-null float64 \n", " 4 avi_type 1496 non-null object \n", " 5 Date 3492 non-null datetime64[ns]\n", " 6 Snow Water Equivalent (in) Start of Day Values 3492 non-null float64 \n", " 7 Precipitation Accumulation (in) Start of Day Values 3492 non-null float64 \n", " 8 Air Temperature Maximum (degF) 3491 non-null float64 \n", " 9 Air Temperature Minimum (degF) 3491 non-null float64 \n", " 10 Air Temperature Average (degF) 3491 non-null float64 \n", " 11 Precipitation Increment (in) 3491 non-null float64 \n", "dtypes: datetime64[ns](2), float64(7), object(3)\n", "memory usage: 354.7+ KB\n" ], "name": "stdout" } ] }, { "cell_type": "markdown", "metadata": { "id": "3TGRt_WmvTUU" }, "source": [ "With that the pre-processing section is finished and there is a unique dataframe which we can analyze to check if the existing weather data shows correlation with avalanche occurrences." ] }, { "cell_type": "code", "metadata": { "id": "RZYlZgEuffju", "colab": { "base_uri": "https://localhost:8080/", "height": 377 }, "outputId": "d8c0ae1e-c34d-4283-9ada-8a65225608ff" }, "source": [ "FullData.head()" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
avi_markavi_dateAvalancheavi_numberavi_typeDateSnow Water Equivalent (in) Start of Day ValuesPrecipitation Accumulation (in) Start of Day ValuesAir Temperature Maximum (degF)Air Temperature Minimum (degF)Air Temperature Average (degF)Precipitation Increment (in)
14375NaNNaTNo0.0NaN2014-01-018.9230779.61538527.38461511.00000019.4615380.207692
14376NaNNaTNo0.0NaN2014-01-029.1461549.82307736.07692311.23076921.6153850.046154
14377NaNNaTNo0.0NaN2014-01-039.1769239.86923137.30769216.07692325.6923080.023077
14378NaNNaTNo0.0NaN2014-01-049.2384629.89230826.153846-2.23076912.3076920.161538
14379NaNNaTNo0.0NaN2014-01-059.50000010.0538467.153846-5.0769230.3846150.069231
\n", "
" ], "text/plain": [ " avi_mark avi_date Avalanche avi_number avi_type Date \\\n", "14375 NaN NaT No 0.0 NaN 2014-01-01 \n", "14376 NaN NaT No 0.0 NaN 2014-01-02 \n", "14377 NaN NaT No 0.0 NaN 2014-01-03 \n", "14378 NaN NaT No 0.0 NaN 2014-01-04 \n", "14379 NaN NaT No 0.0 NaN 2014-01-05 \n", "\n", " Snow Water Equivalent (in) Start of Day Values \\\n", "14375 8.923077 \n", "14376 9.146154 \n", "14377 9.176923 \n", "14378 9.238462 \n", "14379 9.500000 \n", "\n", " Precipitation Accumulation (in) Start of Day Values \\\n", "14375 9.615385 \n", "14376 9.823077 \n", "14377 9.869231 \n", "14378 9.892308 \n", "14379 10.053846 \n", "\n", " Air Temperature Maximum (degF) Air Temperature Minimum (degF) \\\n", "14375 27.384615 11.000000 \n", "14376 36.076923 11.230769 \n", "14377 37.307692 16.076923 \n", "14378 26.153846 -2.230769 \n", "14379 7.153846 -5.076923 \n", "\n", " Air Temperature Average (degF) Precipitation Increment (in) \n", "14375 19.461538 0.207692 \n", "14376 21.615385 0.046154 \n", "14377 25.692308 0.023077 \n", "14378 12.307692 0.161538 \n", "14379 0.384615 0.069231 " ] }, "metadata": { "tags": [] }, "execution_count": 21 } ] }, { "cell_type": "markdown", "metadata": { "id": "_60H9-nT2bxZ" }, "source": [ "## Methods for Analyzing Data" ] }, { "cell_type": "markdown", "metadata": { "id": "htwpYkVr3DHd" }, "source": [ "### Practical Analysis" ] }, { "cell_type": "markdown", "metadata": { "id": "bVVopWUN3J_X" }, "source": [ "For Practical Analysis, we look into Time Series Plots, Distribution Plots, and Distribution Plots by Avalanche Type to identify a relationship between avalanche occurrences and the weather. We look at descriptive statistics information about the data, compared time with different weather variables, and weather variables with the avalanche count. Then we did something similar, but with types of avalanches." 
] }, { "cell_type": "markdown", "metadata": { "id": "FgkGe1kU3RjH" }, "source": [ "### Linear Regression" ] }, { "cell_type": "markdown", "metadata": { "id": "xpvKS9E-3XHB" }, "source": [ "Linear regression was something that we attempted to use in order to determine if there was a direct correlation between each weather variable and the occurrence of avalanches. Linear regression requires a set of independent variables, x, and a dependent variable, y, to determine if there is a linear relationship between them. If there is a linear relationship, it can be used to predict the future occurrence of the dependent variable. In this scenario, the variable 'avi_number' is the dependent variable that we are attempting to predict, and the weather variables, 'Snow Water Equivalent (in) Start of Day Values', 'Precipitation Accumulation (in) Start of Day Values',\t'Air Temperature Average (degF)',\t'Air Temperature Maximum (degF)',\t'Air Temperature Minimum (degF)',\tand 'Precipitation Increment' were each used as the various independent variables. \n", "\n", "We used the [NumPy](https://numpy.org) and [scikit-learn](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LinearRegression.html) packages in order to implement linear regression. We manipulated the 'avi_number' data in multiple ways to search for an R2 score that would be significant enough for us to pursue linear regression, and based off our findings, decided it was not an appropriate method for calculating correlation. \n" ] }, { "cell_type": "markdown", "metadata": { "id": "TQ_7vtHyJ7il" }, "source": [ "### Logistic Regression" ] }, { "cell_type": "markdown", "metadata": { "id": "Hp9QxcQCKQFO" }, "source": [ "Logistic regression was a model that we wanted to look into further because it utilizes avalanche count as a binary variable (0 for no avalanche/1 for an avalanche occurrence). This is ideal because we are trying to predict the occurrence of an avalanche under different weather variables. 
\n", "\n", "We used the [scikit-learn](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) package to implement logistic regression. The variable 'AvCount' was created as our binary dependent variable because we are trying to predict it. The highest accuracy model was generated when we used all of the available weather variables, 'Snow Water Equivalent (in) Start of Day Values', 'Precipitation Accumulation (in) Start of Day Values',\t'Air Temperature Average (degF)',\t'Air Temperature Maximum (degF)',\t'Air Temperature Minimum (degF)',\tand 'Precipitation Increment'. More information about the logistic regression model that we implemented is available [here](https://www.datacamp.com/community/tutorials/understanding-logistic-regression-python).\n", "\n", "This method of logistic regression differs from the logistic regression model in the machine learning portion of our results. That model is generated using PyCaret, which is a machine learning library that doesn't require as much code to run and identifies the most important predictors without intervention from the coder." ] }, { "cell_type": "markdown", "metadata": { "id": "_TnoMwNF27DO" }, "source": [ "### Machine Learning" ] }, { "cell_type": "markdown", "metadata": { "id": "Up35Eaxz2Xw9" }, "source": [ "We used PyCaret, which is an open-source, low-code machine learning library in Python. It allows us to check the accuracy of multiple methods at once. The methods included cover both classification (categorical) and regression. From there we took the columns Avalanche, Snow Water Equivalent, Precipitation Accumulation, Air Temperature Maximum, Air Temperature Minimum, Air Temperature Average, and Precipitation Increment. Then we set up our target to be Avalanche where No became 0 and Yes became 1. 
It then shows you defaults like the [fold number](https://www.openml.org/a/estimation-procedus/7), which is the number of equal-size subsamples (k) into which the original sample is randomly partitioned for training and testing. The default split between training and testing is 70:30. Once that step is done, you compare models and it shows you the accuracy from highest to lowest. We then took three models with different, but still high, accuracies: CatBoost, Extreme Gradient Boosting, and Logistic Regression. We then tuned each model, evaluated it using a [Confusion Matrix](https://pycaret.org/plot-model/), and included a portion where it plots a Feature Importance Plot and a heat map." ] }, { "cell_type": "markdown", "metadata": { "id": "DUy3OgBc0iEX" }, "source": [ "# Results and Discussion" ] }, { "cell_type": "markdown", "metadata": { "id": "XlEmNMGMCq4R" }, "source": [ "## Practical Analysis\n", "\n", "In the practical analysis we will use statistical and graphical techniques to see if we can identify a relationship between avalanche occurrences and the weather.\n", "\n", "First we start by checking descriptive statistics about the data, to see if there is anything strange and get a sense of the distribution of the data." ] }, { "cell_type": "code", "metadata": { "id": "NkcKvVbMCgwI", "colab": { "base_uri": "https://localhost:8080/", "height": 266 }, "outputId": "d2a54573-c1c9-4111-bf01-c3c5e650bf73" }, "source": [ "# Descriptive Statistics of numerical variables\n", "\n", "FullData.describe().transpose()" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
countmeanstdmin25%50%75%max
avi_number3492.00.9951322.8369680.0000000.0000000.0000001.000000100.000000
Snow Water Equivalent (in) Start of Day Values3492.010.6476528.8902740.0000000.22307711.04230818.06346228.484615
Precipitation Accumulation (in) Start of Day Values3492.019.5117239.6307220.00000013.29230819.67692326.45000039.138462
Air Temperature Maximum (degF)3491.048.18943312.8887597.15384639.61538548.23076957.76923175.153846
Air Temperature Minimum (degF)3491.026.27673412.210477-13.84615418.30769226.91666735.53846248.923077
Air Temperature Average (degF)3491.036.07847112.131301-1.84615427.88461536.23076945.61538560.230769
Precipitation Increment (in)3491.00.0926660.1482130.0000000.0076920.0384620.1076921.523077
\n", "
" ], "text/plain": [ " count mean \\\n", "avi_number 3492.0 0.995132 \n", "Snow Water Equivalent (in) Start of Day Values 3492.0 10.647652 \n", "Precipitation Accumulation (in) Start of Day Va... 3492.0 19.511723 \n", "Air Temperature Maximum (degF) 3491.0 48.189433 \n", "Air Temperature Minimum (degF) 3491.0 26.276734 \n", "Air Temperature Average (degF) 3491.0 36.078471 \n", "Precipitation Increment (in) 3491.0 0.092666 \n", "\n", " std min \\\n", "avi_number 2.836968 0.000000 \n", "Snow Water Equivalent (in) Start of Day Values 8.890274 0.000000 \n", "Precipitation Accumulation (in) Start of Day Va... 9.630722 0.000000 \n", "Air Temperature Maximum (degF) 12.888759 7.153846 \n", "Air Temperature Minimum (degF) 12.210477 -13.846154 \n", "Air Temperature Average (degF) 12.131301 -1.846154 \n", "Precipitation Increment (in) 0.148213 0.000000 \n", "\n", " 25% 50% \\\n", "avi_number 0.000000 0.000000 \n", "Snow Water Equivalent (in) Start of Day Values 0.223077 11.042308 \n", "Precipitation Accumulation (in) Start of Day Va... 13.292308 19.676923 \n", "Air Temperature Maximum (degF) 39.615385 48.230769 \n", "Air Temperature Minimum (degF) 18.307692 26.916667 \n", "Air Temperature Average (degF) 27.884615 36.230769 \n", "Precipitation Increment (in) 0.007692 0.038462 \n", "\n", " 75% max \n", "avi_number 1.000000 100.000000 \n", "Snow Water Equivalent (in) Start of Day Values 18.063462 28.484615 \n", "Precipitation Accumulation (in) Start of Day Va... 
26.450000 39.138462 \n", "Air Temperature Maximum (degF) 57.769231 75.153846 \n", "Air Temperature Minimum (degF) 35.538462 48.923077 \n", "Air Temperature Average (degF) 45.615385 60.230769 \n", "Precipitation Increment (in) 0.107692 1.523077 " ] }, "metadata": { "tags": [] }, "execution_count": 22 } ] }, { "cell_type": "markdown", "metadata": { "id": "91UBVOGPv385" }, "source": [ "Despite the wide temperature distribution existing in the data, there are no signs of anomalies in the measurement that should be removed from the dataset. Let's also check some information about the categorical variables below." ] }, { "cell_type": "code", "metadata": { "id": "jOHObO95C0km", "colab": { "base_uri": "https://localhost:8080/", "height": 142 }, "outputId": "a033d4ed-f21c-459a-e8ac-b5b17b5eddd2" }, "source": [ "# Descriptive Statistics of categorical variables\n", "\n", "FullData.describe(include='O').transpose()" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
countuniquetopfreq
avi_mark84594-1124
Avalanche34922No1996
avi_type14962WL1009
\n", "
" ], "text/plain": [ " count unique top freq\n", "avi_mark 845 94 -1 124\n", "Avalanche 3492 2 No 1996\n", "avi_type 1496 2 WL 1009" ] }, "metadata": { "tags": [] }, "execution_count": 23 } ] }, { "cell_type": "markdown", "metadata": { "id": "hIG0WGkNwPsE" }, "source": [ "We can see that the Wet Loose avalanches represent more than two thirds of all avalanches between 2014 and today. Also the dataset seems well balanced between occurences of avalanches.\n", "\n", "Let's check some time series plots about the weather and avalanches." ] }, { "cell_type": "markdown", "metadata": { "id": "IpOpzDYcFFol" }, "source": [ "### Time Series Plots" ] }, { "cell_type": "code", "metadata": { "id": "ep2bDTEmnABr", "colab": { "base_uri": "https://localhost:8080/", "height": 323 }, "outputId": "6bf9c4f3-8f59-4197-f133-157fa37952bf" }, "source": [ "# Group data by date to improve plot quality\n", "\n", "GroupedData = FullData.groupby('Date').agg({'Snow Water Equivalent (in) Start of Day Values':'mean',\n", " 'Precipitation Accumulation (in) Start of Day Values':'mean',\n", " 'Air Temperature Average (degF)':'mean', \n", " 'Air Temperature Maximum (degF)':'mean', \n", " 'Air Temperature Minimum (degF)':'mean',\n", " 'Precipitation Increment (in)':'mean',\n", " 'avi_number':'sum'}).reset_index()\n", "\n", "GroupedData.head()" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
DateSnow Water Equivalent (in) Start of Day ValuesPrecipitation Accumulation (in) Start of Day ValuesAir Temperature Average (degF)Air Temperature Maximum (degF)Air Temperature Minimum (degF)Precipitation Increment (in)avi_number
02014-01-018.9230779.61538519.46153827.38461511.0000000.2076920.0
12014-01-029.1461549.82307721.61538536.07692311.2307690.0461540.0
22014-01-039.1769239.86923125.69230837.30769216.0769230.0230770.0
32014-01-049.2384629.89230812.30769226.153846-2.2307690.1615380.0
42014-01-059.50000010.0538460.3846157.153846-5.0769230.0692310.0
\n", "
" ], "text/plain": [ " Date Snow Water Equivalent (in) Start of Day Values \\\n", "0 2014-01-01 8.923077 \n", "1 2014-01-02 9.146154 \n", "2 2014-01-03 9.176923 \n", "3 2014-01-04 9.238462 \n", "4 2014-01-05 9.500000 \n", "\n", " Precipitation Accumulation (in) Start of Day Values \\\n", "0 9.615385 \n", "1 9.823077 \n", "2 9.869231 \n", "3 9.892308 \n", "4 10.053846 \n", "\n", " Air Temperature Average (degF) Air Temperature Maximum (degF) \\\n", "0 19.461538 27.384615 \n", "1 21.615385 36.076923 \n", "2 25.692308 37.307692 \n", "3 12.307692 26.153846 \n", "4 0.384615 7.153846 \n", "\n", " Air Temperature Minimum (degF) Precipitation Increment (in) avi_number \n", "0 11.000000 0.207692 0.0 \n", "1 11.230769 0.046154 0.0 \n", "2 16.076923 0.023077 0.0 \n", "3 -2.230769 0.161538 0.0 \n", "4 -5.076923 0.069231 0.0 " ] }, "metadata": { "tags": [] }, "execution_count": 24 } ] }, { "cell_type": "code", "metadata": { "id": "D61qH2wA5ZMG", "colab": { "base_uri": "https://localhost:8080/", "height": 340 }, "outputId": "e6f86842-83dd-4705-e190-7b7094218946" }, "source": [ "d=GroupedData['Date']\n", "GroupedData.insert(1,'Year',d.dt.year)\n", "GroupedData.insert(2,'Day of Year',d.dt.dayofyear)\n", "del d\n", "GroupedData.head()" ], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
DateYearDay of YearSnow Water Equivalent (in) Start of Day ValuesPrecipitation Accumulation (in) Start of Day ValuesAir Temperature Average (degF)Air Temperature Maximum (degF)Air Temperature Minimum (degF)Precipitation Increment (in)avi_number
02014-01-01201418.9230779.61538519.46153827.38461511.0000000.2076920.0
12014-01-02201429.1461549.82307721.61538536.07692311.2307690.0461540.0
22014-01-03201439.1769239.86923125.69230837.30769216.0769230.0230770.0
32014-01-04201449.2384629.89230812.30769226.153846-2.2307690.1615380.0
42014-01-05201459.50000010.0538460.3846157.153846-5.0769230.0692310.0
\n", "
" ], "text/plain": [ " Date Year Day of Year \\\n", "0 2014-01-01 2014 1 \n", "1 2014-01-02 2014 2 \n", "2 2014-01-03 2014 3 \n", "3 2014-01-04 2014 4 \n", "4 2014-01-05 2014 5 \n", "\n", " Snow Water Equivalent (in) Start of Day Values \\\n", "0 8.923077 \n", "1 9.146154 \n", "2 9.176923 \n", "3 9.238462 \n", "4 9.500000 \n", "\n", " Precipitation Accumulation (in) Start of Day Values \\\n", "0 9.615385 \n", "1 9.823077 \n", "2 9.869231 \n", "3 9.892308 \n", "4 10.053846 \n", "\n", " Air Temperature Average (degF) Air Temperature Maximum (degF) \\\n", "0 19.461538 27.384615 \n", "1 21.615385 36.076923 \n", "2 25.692308 37.307692 \n", "3 12.307692 26.153846 \n", "4 0.384615 7.153846 \n", "\n", " Air Temperature Minimum (degF) Precipitation Increment (in) avi_number \n", "0 11.000000 0.207692 0.0 \n", "1 11.230769 0.046154 0.0 \n", "2 16.076923 0.023077 0.0 \n", "3 -2.230769 0.161538 0.0 \n", "4 -5.076923 0.069231 0.0 " ] }, "metadata": { "tags": [] }, "execution_count": 25 } ] }, { "cell_type": "code", "metadata": { "id": "1SBlsk8T5awK", "colab": { "base_uri": "https://localhost:8080/", "height": 1000 }, "outputId": "17c9a1da-8ce5-4c32-a3fe-c245bdc6fdc7" }, "source": [ "# Create time series subplots\n", "xKey='Date' # for all years end-to-end along axis (not tested)\n", "xKey='Day of Year' # for all years superposed\n", "yKeys=('Snow Water Equivalent (in) Start of Day Values',\n", " 'Precipitation Accumulation (in) Start of Day Values',\n", " 'Air Temperature Average (degF)',\n", " 'Air Temperature Minimum (degF)',\n", " 'Air Temperature Maximum (degF)',\n", " 'Precipitation Increment (in)')\n", "fig = make_subplots(rows=6, \n", " cols=1,\n", " subplot_titles=yKeys)\n", "for row in range(1,len(yKeys)+1) :\n", " fig.add_trace(\n", " go.Scatter(x=GroupedData[xKey],\n", " y=GroupedData[yKeys[row - 1]],\n", " marker=dict(color=GroupedData['Year'],\n", " showscale=True,\n", " size=4),\n", " mode='markers'),\n", " row=row,\n", " col=1)\n", "fig.update_layout(height=1800, 
\n", " width=800, \n", " showlegend=False,\n", " title_text=\"Weather Data by \" + xKey)\n", "fig.show()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "CjCgK0GMR6WY", "colab": { "base_uri": "https://localhost:8080/", "height": 1000 }, "outputId": "fe9d674a-8b2f-4173-a227-a7cf97de7170" }, "source": [ "# Create time series subplots\n", "\n", "fig = make_subplots(rows=6, \n", " cols=1,\n", " subplot_titles=('Snow Water Equivalent (in) Start of Day Values',\n", " 'Precipitation Accumulation (in) Start of Day Values',\n", " 'Air Temperature Average (degF)',\n", " 'Air Temperature Minimum (degF)',\n", " 'Air Temperature Maximum (degF)',\n", " 'Precipitation Increment (in)'))\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'],\n", " y=GroupedData['Snow Water Equivalent (in) Start of Day Values']),\n", " row=1,\n", " col=1)\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'],\n", " y=GroupedData['Precipitation Accumulation (in) Start of Day Values']),\n", " row=2,\n", " col=1)\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'],\n", " y=GroupedData['Air Temperature Average (degF)']),\n", " row=3,\n", " col=1)\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'],\n", " y=GroupedData['Air Temperature Minimum (degF)']),\n", " row=4,\n", " col=1)\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'],\n", " y=GroupedData['Air Temperature Maximum (degF)']),\n", " row=5,\n", " col=1)\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'],\n", " y=GroupedData['Precipitation Increment (in)']),\n", " row=6,\n", " col=1)\n", "\n", "fig.update_layout(height=1800, \n", " width=800, \n", " showlegend=False,\n", " title_text=\"Weather Data by Date\")\n", "fig.show()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "L8YVkZ3OkhrA", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "ba98234e-ea6e-477f-a5b2-fae36b8e5109" }, "source": [ "# Create figure with secondary y-axis\n", "fig = make_subplots(specs=[[{\"secondary_y\": True}]])\n", "\n", "# Add traces\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'], y=GroupedData['Air Temperature Average (degF)'], name=\"Average Temperature\"),\n", " secondary_y=False,\n", ")\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'], y=GroupedData['avi_number'], mode='markers', name=\"Number of Avalanches\"),\n", " secondary_y=True,\n", ")\n", "\n", "# Add figure title\n", "fig.update_layout(\n", " title_text=\"2-Axis Plot (Air Temperature Average)\"\n", ")\n", "\n", "# Set x-axis title\n", "fig.update_xaxes(title_text=\"Date\")\n", "\n", "# Set y-axes titles\n", "fig.update_yaxes(title_text=\"Air Temperature Average (degF)\", secondary_y=False)\n", "fig.update_yaxes(title_text=\"Number of Avalanches\", secondary_y=True)\n", "\n", "fig.show()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "BB4ynOxtiIBq" }, "source": [ "By looking at the time series data we can identify a pattern. It seems that most avalanches happen when temperatures are rising. This makes a lot of sense because that is when there is the most snow in the mountains, and with the increase in temperature this snow starts to melt. Once it is all melted there is not enough snow to generate an avalanche.\n", "\n", "With those initial insights we can look in more detail at each of the measured weather variables, and see if it is correlated with avalanche occurrences. To do that we can create a distribution plot and split the data from the days when there was an avalanche and when there wasn't, to compare the distributions." ] }, { "cell_type": "code", "metadata": { "id": "g9hyQ6k-xL4Z", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "06b92ff1-c693-420b-a0f6-3c21f6030223" }, "source": [ "# Create figure with secondary y-axis\n", "fig = make_subplots(specs=[[{\"secondary_y\": True}]])\n", "\n", "# Add traces\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'], y=GroupedData['Precipitation Accumulation (in) Start of Day Values'], name=\"Precipitation Accumulation\"),\n", " secondary_y=False, \n", ")\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'], y=GroupedData['avi_number'],mode= 'markers', name=\"Number of Avalanches\"),\n", " secondary_y=True,\n", ")\n", "\n", "# Add figure title\n", "fig.update_layout(\n", " title_text=\"2-Axis Plot (Precipitation Accumulation)\"\n", ")\n", "\n", "# Set x-axis title\n", "fig.update_xaxes(title_text=\"Date\")\n", "\n", "# Set y-axes titles\n", "fig.update_yaxes(title_text=\"Precipitation Accumulation\", secondary_y=False)\n", "fig.update_yaxes(title_text=\"Number of Avalanches\", secondary_y=True)\n", "\n", "fig.show()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", 
"data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "oKniRvV820Jr", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "40c02599-a17f-4e89-9e76-36395df57bb8" }, "source": [ "# Create figure with secondary y-axis\n", "fig = make_subplots(specs=[[{\"secondary_y\": True}]])\n", "\n", "# Add traces\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'], y=GroupedData['Snow Water Equivalent (in) Start of Day Values'], name=\"Snow Water Equivalent\"),\n", " secondary_y=False, \n", ")\n", "\n", "fig.add_trace(\n", " go.Scatter(x=GroupedData['Date'], y=GroupedData['avi_number'],mode= 'markers', name=\"Number of Avalanches\"),\n", " secondary_y=True,\n", ")\n", "\n", "# Add figure title\n", "fig.update_layout(\n", " title_text=\"2-Axis Plot (Snow Water Equivalent (in))\"\n", ")\n", "\n", "# Set x-axis title\n", "fig.update_xaxes(title_text=\"Date\")\n", "\n", "# Set y-axes titles\n", "fig.update_yaxes(title_text=\"Snow Water Equivalent (in)\", secondary_y=False)\n", "fig.update_yaxes(title_text=\"Number of Avalanches\", secondary_y=True)\n", "\n", "fig.show()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "rkjYLbzEPk0v", "colab": { "base_uri": "https://localhost:8080/", "height": 1000 }, "outputId": "95afc75b-ab25-4b7a-e0c5-a54d684c34e0" }, "source": [
"# Dual-axis subplots: one weather variable per row, avalanche count on the secondary y-axis\n",
"\n",
"# (GroupedData column, trace name) for each subplot row, top to bottom.\n",
"# The column name is also used as the primary y-axis title of its row.\n",
"weather_panels = [\n",
"    ('Air Temperature Average (degF)', 'Average Temperature'),\n",
"    ('Air Temperature Minimum (degF)', 'Minimum Temperature'),\n",
"    ('Air Temperature Maximum (degF)', 'Maximum Temperature'),\n",
"    ('Precipitation Increment (in)', 'Precipitation Increment (in)'),\n",
"    ('Precipitation Accumulation (in) Start of Day Values',\n",
"     'Precipitation Accumulation (in) Start of Day Values'),\n",
"    ('Snow Water Equivalent (in) Start of Day Values',\n",
"     'Snow Water Equivalent (in) Start of Day Values'),\n",
"]\n",
"\n",
"# One row per panel; every row gets its own spec dict enabling a secondary y-axis\n",
"fig = make_subplots(rows=len(weather_panels),\n",
"                    cols=1,\n",
"                    specs=[[{'secondary_y': True}] for panel in weather_panels])\n",
"\n",
"# Add the two traces of each row: weather variable first, avalanche count second\n",
"for row, (column, trace_name) in enumerate(weather_panels, start=1):\n",
"    fig.add_trace(\n",
"        go.Scatter(x=GroupedData['Date'], y=GroupedData[column], name=trace_name),\n",
"        secondary_y=False,\n",
"        row=row,\n",
"        col=1\n",
"    )\n",
"    fig.add_trace(\n",
"        go.Scatter(x=GroupedData['Date'], y=GroupedData['avi_number'], name='Number of Avalanches'),\n",
"        secondary_y=True,\n",
"        row=row,\n",
"        col=1\n",
"    )\n",
"\n",
"# Figure size and title (the legend is hidden; the axis titles identify the traces)\n",
"fig.update_layout(height=2500,\n",
"                  width=800,\n",
"                  showlegend=False,\n",
"                  title_text='Weather and Number of Avalanches by Date')\n",
"\n",
"# Set x-axis title\n",
"fig.update_xaxes(title_text='Date')\n",
"\n",
"# Set y-axes titles: weather variable on the primary axis, avalanche count on the secondary\n",
"for row, (column, trace_name) in enumerate(weather_panels, start=1):\n",
"    fig.update_yaxes(title_text=column, secondary_y=False, row=row, col=1)\n",
"    fig.update_yaxes(title_text='Number of Avalanches', secondary_y=True, row=row, col=1)\n",
"\n",
"fig.show()"
], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "mTB6FnJmFLih" }, "source": [ "### Distribution Plots" ] }, { "cell_type": "code", "metadata": { "id": "rdZwGlCJaEwt", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "81be61dc-8451-470d-efb8-e8df8467dfd1" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(FullData,\n", " x='Avalanche',\n", " color='Avalanche',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "8u8d27gNDSNj", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "18b1a126-8308-465a-a85b-c768820baa72" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(FullData,\n", " x='Snow Water Equivalent (in) Start of Day Values',\n", " color='Avalanche',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "Aq9q3YcSf_Xq" }, "source": [ "We can clearly see that there is a significant difference between the results of days when there was an avalanche and of days when there was none, and that this difference should be detectable by a prediction model.\n", "\n", "Now adding some critical thinking on those results, it is important to remember that the data that is being used is an average of all locations, and not the measurement in the specific location where the avalanche happened. So it is better to read the results as the relationship between weather data and any incidence of avalanche.\n", "\n", "Also we saw that spring months are definitely the ones with the most avalanches (probably because the snow is melting). If there is a relation between the season and the snow water equivalent results, it is possible that the variables we are looking at are not directly related, but are both correlated with a third variable (the season). But in this specific case there is a natural theoretical explanation: when there is more snow, there is a higher instability in the mountains that can lead to avalanches.\n", "\n", "More details on Snow Water Equivalent:\n", "[Link](https://www.nrcs.usda.gov/wps/portal/nrcs/detail/null/?cid=nrcseprd1314833)" ] }, { "cell_type": "code", "metadata": { "id": "radcs6OkDTW5", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "77d125ff-6deb-4223-b457-e7a39e1309e0" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(FullData,\n", " x='Precipitation Accumulation (in) Start of Day Values',\n", " color='Avalanche',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "gzhhmD5iDULl", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "7738d232-dd98-4949-a97f-84ce9f0f337f" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(FullData,\n", " x='Air Temperature Maximum (degF)',\n", " color='Avalanche',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "Oid-oBpyDU1j", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "ed8168f5-fb49-4580-b65f-99f132c71d9c" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(FullData,\n", " x='Air Temperature Minimum (degF)',\n", " color='Avalanche',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "KNlTAK64DViE", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "61a0ceff-bc96-4f4d-8660-c3d71764eff1" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(FullData,\n", " x='Air Temperature Average (degF)',\n", " color='Avalanche',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "nUDs__nKEWvr", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "7e707041-0ba7-4e1f-ec75-4aa29e952e47" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(FullData,\n", " x='Precipitation Increment (in)',\n", " color='Avalanche',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "Pz0Tht-XDZJk" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "\n", "#variable = 'Air Temperature Average (degF)' #@param ['Location', 'Date', 'Snow Water Equivalent (in) Start of Day Values','Precipitation Accumulation (in) Start of Day Values','Air Temperature Maximum (degF)', 'Air Temperature Minimum (degF)','Air Temperature Average (degF)', 'Precipitation Increment (in)','avi_mark', 'avi_date', 'Avalanche', 'avi_number']\n", "\n", "#px.histogram(FullData,\n", " # color='Avalanche',\n", " # marginal='box')" ], "execution_count": null, "outputs": [] }, { "cell_type": "markdown", "metadata": { "id": "_knMW2QcxBo5" }, "source": [ "We can also look for patterns related to the different types of avalanches, Wet Slab and Wet Loose, using the same method." ] }, { "cell_type": "markdown", "metadata": { "id": "nb69Rs2lHuLr" }, "source": [ "### Distribution Plots by Avalanche Type" ] }, { "cell_type": "code", "metadata": { "id": "K0w15aIDFZw5" }, "source": [ "# Filter Data to check results in which there was an avalanche\n", "\n", "AvalanchesOnly = FullData[FullData['Avalanche'] == 'Yes']\n" ], "execution_count": null, "outputs": [] }, { "cell_type": "code", "metadata": { "id": "mL9yofXFHd9N", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "1aa31e1d-bdd0-4a6a-d31c-dfdbe38193ee" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(AvalanchesOnly,\n", " x='avi_type',\n", " color='avi_type',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "S3wtz0EwFtYN", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "89abccc9-1db6-4ff6-e4da-4a779e80869c" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(AvalanchesOnly,\n", " x='Snow Water Equivalent (in) Start of Day Values',\n", " color='avi_type',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "i_di62CvFucE", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "0c472554-4312-49d5-cfa3-5750ed5c8694" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(AvalanchesOnly,\n", " x='Precipitation Accumulation (in) Start of Day Values',\n", " color='avi_type',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "WyugyM0oFvmr", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "c8591098-ebee-4464-94f4-31bca60edfd1" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(AvalanchesOnly,\n", " x='Air Temperature Maximum (degF)',\n", " color='avi_type',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "afunb8D_FwMx", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "5ce444d0-3903-4ba0-b6d3-00748cf14faf" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(AvalanchesOnly,\n", " x='Air Temperature Minimum (degF)',\n", " color='avi_type',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "9bcKMTo5Fu--", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "c9863a9f-0228-4e9c-edbe-a8c63ef4ca40" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(AvalanchesOnly,\n", " x='Air Temperature Average (degF)',\n", " color='avi_type',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "1GUjbvffFt_x", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "e6303e85-f379-4129-cc6a-80a0a792e5cc" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "px.histogram(AvalanchesOnly,\n", " x='Precipitation Increment (in)',\n", " color='avi_type',\n", " marginal='box')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "88-PF426iF4Q", "colab": { "base_uri": "https://localhost:8080/", "height": 542 }, "outputId": "fab497e6-adce-4acd-9768-797c431b4c6b" }, "source": [ "# Create histogram / distribution visualization for the different variables\n", "\n", "variable = 'Air Temperature Average (degF)' #@param ['Location', 'Date', 'Snow Water Equivalent (in) Start of Day Values','Precipitation Accumulation (in) Start of Day Values','Air Temperature Maximum (degF)', 'Air Temperature Minimum (degF)','Air Temperature Average (degF)', 'Precipitation Increment (in)','avi_mark', 'avi_date', 'Avalanche', 'avi_number']\n", "\n", "fig = px.histogram(AvalanchesOnly,\n", " x=variable,\n", " color='avi_type',\n", " marginal='box')\n", "\n", "fig.show()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "\n", "\n", "\n", "
\n", " \n", " \n", " \n", "
\n", " \n", "
\n", "\n", "" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "WN461FtJz_EY" }, "source": [ "Here there weren't many big differences in the distributions of the measured variables. The one specific observation is that Wet Slab avalanches seem to have a slightly higher median for the Minimum, Maximum and Average temperatures than the Wet Loose ones. It is possible to test that difference in the medians or means to understand whether it is statistically significant.\n", "\n" ] },
{ "cell_type": "markdown", "metadata": { "id": "fHmyv-a_IaDb" }, "source": [ "## Linear Regression" ] },
{ "cell_type": "markdown", "metadata": { "id": "LwJ2u9-tMufH" }, "source": [ "The following code shows our implementation of linear regression and why it did not work. The 'avi_number' data was our biggest obstacle because of how sparse the data was. Multiple attempts were made in order to account for this sparseness; however, none of them generated an R^2 score that we felt was satisfactory enough to continue working on linear regression." ] },
{ "cell_type": "code", "metadata": { "id": "qQw4-UBtPaF1" }, "source": [ "#Creating a copy of the data without null values\n", "NoNullGroupedData = GroupedData.dropna()" ], "execution_count": null, "outputs": [] },
{ "cell_type": "markdown", "metadata": { "id": "IRpndxuw8OZY" }, "source": [ "This is the first attempt to test for a correlation between the weather variable, Snow Water Equivalent, and avalanche count. This attempt uses the data as is, with no adjustments made to avalanche count. 
" ] }, { "cell_type": "code", "metadata": { "id": "LCopvMBTMC3P", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "04c80476-90a9-4932-c654-57fc19501db9" }, "source": [
"# Feature (x1) and target (y1) as (n_rows, 1) arrays.\n",
"# Columns are selected by name rather than by position, so the regression cannot\n",
"# silently pick up a different column if the layout of the frame changes.\n",
"x1 = NoNullGroupedData[['Snow Water Equivalent (in) Start of Day Values']].values\n",
"y1 = NoNullGroupedData[['avi_number']].values\n",
"\n",
"# Model initialization\n",
"regression_model_one = LinearRegression()\n",
"# Fit the data (train the model)\n",
"regression_model_one.fit(x1, y1)\n",
"# R2 is scored on the same rows the model was fitted on (there is no hold-out split here)\n",
"r_sq_one = regression_model_one.score(x1, y1)\n",
"print('R2 score: ', r_sq_one)"
], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "R2 score: 0.07665051806996348\n" ], "name": "stdout" } ] },
{ "cell_type": "markdown", "metadata": { "id": "FTS9kudU9hBT" }, "source": [ "Ideally, the R2 score should be as close to 1 as possible. The low R2 score shows that the data, in this form, does not capture the relationship between Snow Water Equivalent and the occurrence of avalanches.\n" ] },
{ "cell_type": "markdown", "metadata": { "id": "poAdVJ0Y9t1y" }, "source": [ "This is the second attempt to test for a correlation between the weather variable, Snow Water Equivalent, and avalanche count. 
In this attempt, we made avalanche count a binary variable (0 for no/1 for yes).\n", "\n" ] },
{ "cell_type": "code", "metadata": { "id": "B70zHsTz99B6" }, "source": [
"# Binary avalanche indicator: 1.0 when at least one avalanche was recorded, otherwise 0.0.\n",
"# The column is built in a single assign() so the cell is safe to re-run and never writes\n",
"# through .loc into a frame returned by dropna() (which can raise SettingWithCopyWarning).\n",
"# NOTE(review): assumes avi_number holds non-negative whole-number counts - confirm.\n",
"NoNullGroupedData = NoNullGroupedData.assign(\n",
"    AvCount=(NoNullGroupedData['avi_number'] >= 1).astype(float)\n",
")"
], "execution_count": null, "outputs": [] },
{ "cell_type": "code", "metadata": { "id": "qVxAiSEP-EL4", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "dafeaa28-31f9-47b5-cee7-27691a529a98" }, "source": [
"# Feature (x2) and binary target (y2) as (n_rows, 1) arrays, selected by column name\n",
"x2 = NoNullGroupedData[['Snow Water Equivalent (in) Start of Day Values']].values\n",
"y2 = NoNullGroupedData[['AvCount']].values\n",
"\n",
"# Model initialization\n",
"regression_model_two = LinearRegression()\n",
"# Fit the data (train the model)\n",
"regression_model_two.fit(x2, y2)\n",
"# R2 is scored on the same rows the model was fitted on\n",
"r_sq_two = regression_model_two.score(x2, y2)\n",
"print('R2 score: ', r_sq_two)"
], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "R2 score: 0.2755908525407361\n" ], "name": "stdout" } ] },
{ "cell_type": "markdown", "metadata": { "id": "KDMVno-t-8kG" }, "source": [ "The R2 score generated is helpful in understanding that there is a relationship between 'Snow Water Equivalent' and the occurrence of an avalanche. However, it is not strong enough for us to pursue it further. " ] },
{ "cell_type": "markdown", "metadata": { "id": "ptrRGkS4HRtD" }, "source": [ "This is the third attempt to test for a correlation between the weather variable, Snow Water Equivalent, and avalanche count. In this attempt, we kept only the months January through May, because the majority of avalanches occur in those months. We also could have included the months November and December; however, the smaller sample worked just as well."
] }, { "cell_type": "code", "metadata": { "id": "y9vLT4FqAc7a" }, "source": [
"# Keep January through May only.\n",
"# NOTE: this reassigns NoNullGroupedData, so the cells below that read it\n",
"# (the third linear regression and the logistic regression) see this subset only.\n",
"NoNullGroupedData = NoNullGroupedData[NoNullGroupedData['Date'].dt.month <= 5]"
], "execution_count": null, "outputs": [] },
{ "cell_type": "code", "metadata": { "id": "gspRoMiLAeaX", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "db5c7569-9491-45de-c48c-811ceca37c9a" }, "source": [
"# Feature (x3) and target (y3) as (n_rows, 1) arrays, selected by column name\n",
"x3 = NoNullGroupedData[['Snow Water Equivalent (in) Start of Day Values']].values\n",
"y3 = NoNullGroupedData[['avi_number']].values\n",
"\n",
"# Model initialization\n",
"regression_model_three = LinearRegression()\n",
"# Fit the data (train the model)\n",
"regression_model_three.fit(x3, y3)\n",
"# R2 is scored on the same rows the model was fitted on\n",
"r_sq_three = regression_model_three.score(x3, y3)\n",
"print('R2 score: ', r_sq_three)"
], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "R2 score: 0.020505479899889267\n" ], "name": "stdout" } ] },
{ "cell_type": "markdown", "metadata": { "id": "ipg2zqGsAtbp" }, "source": [ "The low R2 score shows that the data, in this form, does not capture the relationship between Snow Water Equivalent and the occurrence of avalanches." ] },
{ "cell_type": "markdown", "metadata": { "id": "dpR53Y7UFXpv" }, "source": [ "## Logistic Regression" ] },
{ "cell_type": "code", "metadata": { "id": "tJjQRl7TZC-m", "colab": { "base_uri": "https://localhost:8080/", "height": 296 }, "outputId": "9ba78ab4-ae39-44f8-bbfc-38d9659e2cc8" }, "source": [
"# Features and target.\n",
"# At this point NoNullGroupedData is the January-May subset, and 'AvCount' is the\n",
"# binary avalanche indicator created in the linear regression section above.\n",
"X = NoNullGroupedData[['Day of Year',\n",
"                       'Snow Water Equivalent (in) Start of Day Values',\n",
"                       'Precipitation Accumulation (in) Start of Day Values',\n",
"                       'Precipitation Increment (in)',\n",
"                       'Air Temperature Average (degF)',\n",
"                       'Air Temperature Maximum (degF)',\n",
"                       'Air Temperature Minimum (degF)']]\n",
"y = NoNullGroupedData['AvCount']\n",
"\n",
"# Hold out 25% of the rows for testing; random_state fixes the split\n",
"X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.25, random_state=0)\n",
"\n",
"# Fit a logistic regression with default settings and predict the held-out rows\n",
"logistic_regression = LogisticRegression()\n",
"logistic_regression.fit(X_train, y_train)\n",
"y_pred = logistic_regression.predict(X_test)\n",
"\n",
"# Confusion matrix (actual vs. predicted) drawn as an annotated heatmap\n",
"confusion_matrix = pd.crosstab(y_test, y_pred, rownames=['Actual'], colnames=['Predicted'])\n",
"sn.heatmap(confusion_matrix, annot=True, fmt='g')\n",
"\n",
"# Report accuracy on the test set and render the heatmap\n",
"print('Accuracy: ', metrics.accuracy_score(y_test, y_pred))\n",
"plt.show()"
], "execution_count": null, "outputs": [ { "output_type": "stream", "text": [ "Accuracy: 0.7283018867924528\n" ], "name": "stdout" }, { "output_type": "display_data", "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "tags": [], "needs_background": "light" } } ] },
{ "cell_type": "markdown", "metadata": { "id": "Buf4iNsL6ugH" }, "source": [ "In this confusion matrix, 119 and 74 are the counts of correct predictions, and 40 and 32 are the counts of incorrect predictions. The model has an accuracy of approximately 0.73 (193 correct out of 265)." ] },
{ "cell_type": "markdown", "metadata": { "id": "KEU1OfPB0-xG" }, "source": [ "## Prediction Model" ] },
{ "cell_type": "markdown", "metadata": { "id": "zuooMMfYX5So" }, "source": [ "We were unable to get this code to run." ] },
{ "cell_type": "code", "metadata": { "id": "muoTRjx7S8OT", "colab": { "base_uri": "https://localhost:8080/", "height": 292 }, "outputId": "8063f542-30ad-4044-9c81-daa14866bb16" }, "source": [
"# Calendar features are derived from the observation date\n",
"dates = FullData['Date']\n",
"\n",
"# ModelDataset: 'Year' and 'Day of Year' replace the raw date, and the avalanche\n",
"# bookkeeping columns are dropped ('Avalanche' itself is kept).\n",
"# drop() returns a new frame, so nothing is mutated in place.\n",
"ModelDataset = FullData.copy()\n",
"ModelDataset.insert(1, 'Year', dates.dt.year)\n",
"ModelDataset.insert(2, 'Day of Year', dates.dt.dayofyear)\n",
"ModelDataset = ModelDataset.drop(['Date', 'avi_mark', 'avi_date', 'avi_number', 'avi_type'], axis=1)\n",
"\n",
"# ModelDataset2: same calendar features, but 'Date' and 'avi_number' are kept\n",
"ModelDataset2 = FullData.drop(['avi_mark', 'avi_date', 'avi_type'], axis=1)\n",
"ModelDataset2.insert(1, 'Year', dates.dt.year)\n",
"ModelDataset2.insert(2, 'Day of Year', dates.dt.dayofyear)\n",
"del dates\n",
"\n",
"ModelDataset.head()"
], "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
YearDay of YearAvalancheSnow Water Equivalent (in) Start of Day ValuesPrecipitation Accumulation (in) Start of Day ValuesAir Temperature Maximum (degF)Air Temperature Minimum (degF)Air Temperature Average (degF)Precipitation Increment (in)
1437520141No8.9230779.61538527.38461511.00000019.4615380.207692
1437620142No9.1461549.82307736.07692311.23076921.6153850.046154
1437720143No9.1769239.86923137.30769216.07692325.6923080.023077
1437820144No9.2384629.89230826.153846-2.23076912.3076920.161538
1437920145No9.50000010.0538467.153846-5.0769230.3846150.069231
\n", "
" ], "text/plain": [ " Year ... Precipitation Increment (in)\n", "14375 2014 ... 0.207692\n", "14376 2014 ... 0.046154\n", "14377 2014 ... 0.023077\n", "14378 2014 ... 0.161538\n", "14379 2014 ... 0.069231\n", "\n", "[5 rows x 9 columns]" ] }, "metadata": { "tags": [] }, "execution_count": 76 } ] },
{ "cell_type": "markdown", "metadata": { "id": "vlhsXyR3TXvE" }, "source": [ "Once our dataset is ready, we can define our target variable below. In the Confusion Matrix charts, 0 means no avalanche and 1 means an avalanche occurred.\n" ] },
{ "cell_type": "code", "metadata": { "id": "LTx3VNDmTdQJ", "colab": { "base_uri": "https://localhost:8080/", "height": 1000, "referenced_widgets": [ "499d8582265046e2970e453489ba6031", "fbf81571f4cb4c059a3e5a66b7ef2221", "4347d82e97784a83a087906c398d0e1f", "a6c8551cb31645318ee511bd4a1e3859", "7630cddea594473e9538bef58294d8c2", "169d6da9acf647d6bd4f509a5fdd50ba" ] }, "outputId": "f5fe5c38-5a02-48c5-af6b-7fba81584db2" }, "source": [
"# session_id fixes the random seed of the experiment so the results can be reproduced.\n",
"# 1506 is the session id shown in the setup summary recorded below.\n",
"Model = setup(ModelDataset, target='Avalanche', numeric_features=['Year'], session_id=1506)\n"
], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
DescriptionValue
0session_id1506
1TargetAvalanche
2Target TypeBinary
3Label EncodedNo: 0, Yes: 1
4Original Data(3492, 9)
5Missing ValuesTrue
6Numeric Features8
7Categorical Features0
8Ordinal FeaturesFalse
9High Cardinality FeaturesFalse
10High Cardinality MethodNone
11Transformed Train Set(2444, 8)
12Transformed Test Set(1048, 8)
13Shuffle Train-TestTrue
14Stratify Train-TestFalse
15Fold GeneratorStratifiedKFold
16Fold Number10
17CPU Jobs-1
18Use GPUFalse
19Log ExperimentFalse
20Experiment Nameclf-default-name
21USIa3ee
22Imputation Typesimple
23Iterative Imputation IterationNone
24Numeric Imputermean
25Iterative Imputation Numeric ModelNone
26Categorical Imputerconstant
27Iterative Imputation Categorical ModelNone
28Unknown Categoricals Handlingleast_frequent
29NormalizeFalse
30Normalize MethodNone
31TransformationFalse
32Transformation MethodNone
33PCAFalse
34PCA MethodNone
35PCA ComponentsNone
36Ignore Low VarianceFalse
37Combine Rare LevelsFalse
38Rare Level ThresholdNone
39Numeric BinningFalse
40Remove OutliersFalse
41Outliers ThresholdNone
42Remove MulticollinearityFalse
43Multicollinearity ThresholdNone
44ClusteringFalse
45Clustering IterationNone
46Polynomial FeaturesFalse
47Polynomial DegreeNone
48Trignometry FeaturesFalse
49Polynomial ThresholdNone
50Group FeaturesFalse
51Feature SelectionFalse
52Features Selection ThresholdNone
53Feature InteractionFalse
54Feature RatioFalse
55Interaction ThresholdNone
56Fix ImbalanceFalse
57Fix Imbalance MethodSMOTE
\n", "
" ], "text/plain": [ " Description Value\n", "0 session_id 1506\n", "1 Target Avalanche\n", "2 Target Type Binary\n", "3 Label Encoded No: 0, Yes: 1\n", "4 Original Data (3492, 9)\n", "5 Missing Values True\n", "6 Numeric Features 8\n", "7 Categorical Features 0\n", "8 Ordinal Features False\n", "9 High Cardinality Features False\n", "10 High Cardinality Method None\n", "11 Transformed Train Set (2444, 8)\n", "12 Transformed Test Set (1048, 8)\n", "13 Shuffle Train-Test True\n", "14 Stratify Train-Test False\n", "15 Fold Generator StratifiedKFold\n", "16 Fold Number 10\n", "17 CPU Jobs -1\n", "18 Use GPU False\n", "19 Log Experiment False\n", "20 Experiment Name clf-default-name\n", "21 USI a3ee\n", "22 Imputation Type simple\n", "23 Iterative Imputation Iteration None\n", "24 Numeric Imputer mean\n", "25 Iterative Imputation Numeric Model None\n", "26 Categorical Imputer constant\n", "27 Iterative Imputation Categorical Model None\n", "28 Unknown Categoricals Handling least_frequent\n", "29 Normalize False\n", "30 Normalize Method None\n", "31 Transformation False\n", "32 Transformation Method None\n", "33 PCA False\n", "34 PCA Method None\n", "35 PCA Components None\n", "36 Ignore Low Variance False\n", "37 Combine Rare Levels False\n", "38 Rare Level Threshold None\n", "39 Numeric Binning False\n", "40 Remove Outliers False\n", "41 Outliers Threshold None\n", "42 Remove Multicollinearity False\n", "43 Multicollinearity Threshold None\n", "44 Clustering False\n", "45 Clustering Iteration None\n", "46 Polynomial Features False\n", "47 Polynomial Degree None\n", "48 Trignometry Features False\n", "49 Polynomial Threshold None\n", "50 Group Features False\n", "51 Feature Selection False\n", "52 Features Selection Threshold None\n", "53 Feature Interaction False\n", "54 Feature Ratio False\n", "55 Interaction Threshold None\n", "56 Fix Imbalance False\n", "57 Fix Imbalance Method SMOTE" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": 
"DT_agGYPVJ_C", "colab": { "base_uri": "https://localhost:8080/", "height": 650, "referenced_widgets": [ "0e9ab74349ab43df8d009f7bd46b034f", "935ed9dc79c34b8ebd029281bfdcc6f8", "c7560dbc634b435a8b54faaa681f63c9" ] }, "outputId": "abdd5a3e-b28f-4633-bebb-2a284a26c0bb" }, "source": [ "compare_models()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
rfRandom Forest Classifier0.90550.97190.90780.87960.89320.80850.80930.617
lightgbmLight Gradient Boosting Machine0.90550.96840.90500.88210.89290.80840.80930.118
etExtra Trees Classifier0.90430.97360.89560.88640.89040.80540.80630.506
xgboostExtreme Gradient Boosting0.90060.96620.90120.87560.88760.79850.79960.891
catboostCatBoost Classifier0.89850.96710.90970.86520.88650.79490.79633.203
gbcGradient Boosting Classifier0.88910.96140.90120.85340.87620.77600.77760.351
dtDecision Tree Classifier0.88460.88630.89940.84600.87150.76700.76880.026
knnK Neighbors Classifier0.88340.94150.88340.85560.86840.76380.76540.120
adaAda Boost Classifier0.87560.94870.88430.84010.86100.74870.75040.165
nbNaive Bayes0.86130.91200.91350.79860.85170.72270.72910.019
lrLogistic Regression0.85560.92770.84660.82670.83590.70700.70800.343
qdaQuadratic Discriminant Analysis0.84940.92030.90310.78490.83950.69910.70590.019
ldaLinear Discriminant Analysis0.84740.92380.84190.81470.82750.69080.69180.021
ridgeRidge Classifier0.84570.00000.83910.81360.82550.68740.68850.017
svmSVM - Linear Kernel0.69230.00000.42850.66630.47850.33170.38650.028
\n", "
" ], "text/plain": [ " Model Accuracy AUC Recall Prec. \\\n", "rf Random Forest Classifier 0.9055 0.9719 0.9078 0.8796 \n", "lightgbm Light Gradient Boosting Machine 0.9055 0.9684 0.9050 0.8821 \n", "et Extra Trees Classifier 0.9043 0.9736 0.8956 0.8864 \n", "xgboost Extreme Gradient Boosting 0.9006 0.9662 0.9012 0.8756 \n", "catboost CatBoost Classifier 0.8985 0.9671 0.9097 0.8652 \n", "gbc Gradient Boosting Classifier 0.8891 0.9614 0.9012 0.8534 \n", "dt Decision Tree Classifier 0.8846 0.8863 0.8994 0.8460 \n", "knn K Neighbors Classifier 0.8834 0.9415 0.8834 0.8556 \n", "ada Ada Boost Classifier 0.8756 0.9487 0.8843 0.8401 \n", "nb Naive Bayes 0.8613 0.9120 0.9135 0.7986 \n", "lr Logistic Regression 0.8556 0.9277 0.8466 0.8267 \n", "qda Quadratic Discriminant Analysis 0.8494 0.9203 0.9031 0.7849 \n", "lda Linear Discriminant Analysis 0.8474 0.9238 0.8419 0.8147 \n", "ridge Ridge Classifier 0.8457 0.0000 0.8391 0.8136 \n", "svm SVM - Linear Kernel 0.6923 0.0000 0.4285 0.6663 \n", "\n", " F1 Kappa MCC TT (Sec) \n", "rf 0.8932 0.8085 0.8093 0.617 \n", "lightgbm 0.8929 0.8084 0.8093 0.118 \n", "et 0.8904 0.8054 0.8063 0.506 \n", "xgboost 0.8876 0.7985 0.7996 0.891 \n", "catboost 0.8865 0.7949 0.7963 3.203 \n", "gbc 0.8762 0.7760 0.7776 0.351 \n", "dt 0.8715 0.7670 0.7688 0.026 \n", "knn 0.8684 0.7638 0.7654 0.120 \n", "ada 0.8610 0.7487 0.7504 0.165 \n", "nb 0.8517 0.7227 0.7291 0.019 \n", "lr 0.8359 0.7070 0.7080 0.343 \n", "qda 0.8395 0.6991 0.7059 0.019 \n", "lda 0.8275 0.6908 0.6918 0.021 \n", "ridge 0.8255 0.6874 0.6885 0.017 \n", "svm 0.4785 0.3317 0.3865 0.028 " ] }, "metadata": { "tags": [] } }, { "output_type": "execute_result", "data": { "text/plain": [ "RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,\n", " criterion='gini', max_depth=None, max_features='auto',\n", " max_leaf_nodes=None, max_samples=None,\n", " min_impurity_decrease=0.0, min_impurity_split=None,\n", " min_samples_leaf=1, min_samples_split=2,\n", " 
min_weight_fraction_leaf=0.0, n_estimators=100,\n", " n_jobs=-1, oob_score=False, random_state=1506, verbose=0,\n", " warm_start=False)" ] }, "metadata": { "tags": [] }, "execution_count": 79 } ] }, { "cell_type": "code", "metadata": { "id": "degrZMJoTySA", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "73622256dba84671bcab7e329b378818", "81f4ba27c56546f48f4c958c203d9ff0", "4a04ba961a454ceda4d285771d7567a2" ] }, "outputId": "6381174b-4251-4fa7-d2f1-c627b0d44a0d" }, "source": [ "XGB = create_model(estimator='xgboost')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.90200.96650.90650.87390.88990.80170.8022
10.92650.97780.91590.91590.91590.85070.8507
20.90200.96340.88790.88790.88790.80090.8009
30.88570.96200.88680.85450.87040.76820.7687
40.88110.96200.90570.83480.86880.76050.7626
50.87700.95300.91510.82200.86610.75300.7567
60.90980.96490.85850.92860.89220.81490.8167
70.90160.96450.91510.86610.88990.80110.8021
80.91390.96740.89620.90480.90050.82470.8247
90.90570.98060.92450.86730.89500.80960.8110
Mean0.90060.96620.90120.87560.88760.79850.7996
SD0.01460.00750.01850.03250.01470.02870.0280
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.9020 0.9665 0.9065 0.8739 0.8899 0.8017 0.8022\n", "1 0.9265 0.9778 0.9159 0.9159 0.9159 0.8507 0.8507\n", "2 0.9020 0.9634 0.8879 0.8879 0.8879 0.8009 0.8009\n", "3 0.8857 0.9620 0.8868 0.8545 0.8704 0.7682 0.7687\n", "4 0.8811 0.9620 0.9057 0.8348 0.8688 0.7605 0.7626\n", "5 0.8770 0.9530 0.9151 0.8220 0.8661 0.7530 0.7567\n", "6 0.9098 0.9649 0.8585 0.9286 0.8922 0.8149 0.8167\n", "7 0.9016 0.9645 0.9151 0.8661 0.8899 0.8011 0.8021\n", "8 0.9139 0.9674 0.8962 0.9048 0.9005 0.8247 0.8247\n", "9 0.9057 0.9806 0.9245 0.8673 0.8950 0.8096 0.8110\n", "Mean 0.9006 0.9662 0.9012 0.8756 0.8876 0.7985 0.7996\n", "SD 0.0146 0.0075 0.0185 0.0325 0.0147 0.0287 0.0280" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "aQJlQzbGfwwL" }, "source": [ "Extreme Gradient Boosting Model\n", "\n", " What is it and where does it come from?\n", " https://towardsdatascience.com/xgboost-theory-and-practice-fb8912930ad6\n" ] }, { "cell_type": "code", "metadata": { "id": "8AwY36JfU5Hk", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "f49794a0e9f54c26a7d7f84c0f3344e4", "8adc97a7aeff4c6da935b5f1b7855696", "d490a6b4780f436685e43fd6614510ed" ] }, "outputId": "fbadefca-0823-441e-91b3-7350c6c7a655" }, "source": [ "TunedModel = tune_model(XGB)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.90200.96140.93460.85470.89290.80300.8057
10.91430.97550.93460.87720.90500.82710.8284
20.87760.96330.90650.82910.86610.75370.7563
30.87350.95980.92450.80990.86340.74650.7522
40.88520.96450.94340.81970.87720.77050.7772
50.88110.95730.94340.81300.87340.76260.7700
60.91800.96280.89620.91350.90480.83280.8329
70.90160.97160.94340.84750.89290.80240.8064
80.90160.96730.91510.86610.88990.80110.8021
90.89340.98130.94340.83330.88500.78640.7917
Mean0.89480.96650.92850.84640.88500.78860.7923
SD0.01450.00710.01640.03090.01400.02830.0266
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.9020 0.9614 0.9346 0.8547 0.8929 0.8030 0.8057\n", "1 0.9143 0.9755 0.9346 0.8772 0.9050 0.8271 0.8284\n", "2 0.8776 0.9633 0.9065 0.8291 0.8661 0.7537 0.7563\n", "3 0.8735 0.9598 0.9245 0.8099 0.8634 0.7465 0.7522\n", "4 0.8852 0.9645 0.9434 0.8197 0.8772 0.7705 0.7772\n", "5 0.8811 0.9573 0.9434 0.8130 0.8734 0.7626 0.7700\n", "6 0.9180 0.9628 0.8962 0.9135 0.9048 0.8328 0.8329\n", "7 0.9016 0.9716 0.9434 0.8475 0.8929 0.8024 0.8064\n", "8 0.9016 0.9673 0.9151 0.8661 0.8899 0.8011 0.8021\n", "9 0.8934 0.9813 0.9434 0.8333 0.8850 0.7864 0.7917\n", "Mean 0.8948 0.9665 0.9285 0.8464 0.8850 0.7886 0.7923\n", "SD 0.0145 0.0071 0.0164 0.0309 0.0140 0.0283 0.0266" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "GWU4gkFRVYHr", "colab": { "base_uri": "https://localhost:8080/", "height": 1000, "referenced_widgets": [ "6a21aea1e810435582c37b3aace35901", "63588303eaf74b1b8351bce44c98dec8", "8eb369ace554446aa838a50afd0bf50e", "c762527fa7374891b97f5d50430d5dd8", "9e49a094eca748aa9286b42c7bf180ed", "2994bc88f7624637ab65cef6e500da32", "e75c29fbbf504123a6518d12d501f3ab" ] }, "outputId": "d28ebc3c-d5c3-4976-fcbf-d6454472767b" }, "source": [ "evaluate_model(XGB)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "6a21aea1e810435582c37b3aace35901", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "My2Ky4kvXL21", "colab": { "base_uri": "https://localhost:8080/", "height": 401 }, "outputId": "a0650931-3c2a-40d0-c82c-c25b316ebcf7" }, "source": [ "plot_model(XGB, 'confusion_matrix')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", 
"text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "zh6wrvNxZFF0" }, "source": [ "The confusion matrix shows all the data points that were tested to verify the quality of the model. Of the tested data points:\n", "\n", "\n", "* 545 days were correctly classified as days without avalanches (true negatives)\n", "* On 47 days an avalanche was predicted but none happened (false positives)\n", "* On 405 days an avalanche was predicted and one really happened (true positives)\n", "* On 51 days an avalanche happened that was not predicted (false negatives)\n", "\n", "\n", "\n" ] }, { "cell_type": "code", "metadata": { "id": "6G086_FrXTJ0", "colab": { "base_uri": "https://localhost:8080/", "height": 418 }, "outputId": "1f7dbbc8-d600-4eae-9ffe-2687e463da76" }, "source": [ "plot_model(XGB, 'feature')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "0a8UR6ecf9k5" }, "source": [ "Logistic Regression" ] }, { "cell_type": "code", "metadata": { "id": "XPg0Fm0tfbt3", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "03350dd1e5214f3aabc48b7565ae4b49" ] }, "outputId": "d05996fd-8044-4a63-e036-92fe94ac3f60" }, "source": [ "LR = create_model(estimator='lr')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.88160.94170.87850.85450.86640.76020.7604
10.88160.95680.83180.89000.85990.75760.7589
20.85710.92400.87850.81030.84300.71240.7143
30.82040.89810.82080.77680.79820.63660.6374
40.81150.91330.82080.76320.79090.61970.6210
50.84020.89560.82080.81310.81690.67510.6751
60.82790.93320.76420.82650.79410.64660.6481
70.86890.93090.84910.84910.84910.73310.7331
80.86890.92580.89620.81900.85590.73600.7385
90.89750.95780.90570.86490.88480.79260.7933
Mean0.85560.92770.84660.82670.83590.70700.7080
SD0.02770.02030.04120.03710.03170.05610.0561
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8816 0.9417 0.8785 0.8545 0.8664 0.7602 0.7604\n", "1 0.8816 0.9568 0.8318 0.8900 0.8599 0.7576 0.7589\n", "2 0.8571 0.9240 0.8785 0.8103 0.8430 0.7124 0.7143\n", "3 0.8204 0.8981 0.8208 0.7768 0.7982 0.6366 0.6374\n", "4 0.8115 0.9133 0.8208 0.7632 0.7909 0.6197 0.6210\n", "5 0.8402 0.8956 0.8208 0.8131 0.8169 0.6751 0.6751\n", "6 0.8279 0.9332 0.7642 0.8265 0.7941 0.6466 0.6481\n", "7 0.8689 0.9309 0.8491 0.8491 0.8491 0.7331 0.7331\n", "8 0.8689 0.9258 0.8962 0.8190 0.8559 0.7360 0.7385\n", "9 0.8975 0.9578 0.9057 0.8649 0.8848 0.7926 0.7933\n", "Mean 0.8556 0.9277 0.8466 0.8267 0.8359 0.7070 0.7080\n", "SD 0.0277 0.0203 0.0412 0.0371 0.0317 0.0561 0.0561" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "MS2k_hAXgP-h", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "a463af2b79b94ecd9365cc4ba0ee1641", "db9f6b4f028741f8bd5f4d93803b5e67", "43c55b638f584647aaefcf3b9cfcee29" ] }, "outputId": "7a15c813-ab9a-4bbb-a44f-9e888812a7da" }, "source": [ "TunedModel2 = tune_model(LR)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.89800.94120.89720.87270.88480.79320.7935
10.88160.95700.83180.89000.85990.75760.7589
20.84080.92120.85050.79820.82350.67880.6799
30.82860.90150.83020.78570.80730.65310.6539
40.81150.91340.82080.76320.79090.61970.6210
50.84020.89570.82080.81310.81690.67510.6751
60.82790.93450.76420.82650.79410.64660.6481
70.86890.92970.85850.84260.85050.73370.7338
80.87300.92460.89620.82610.85970.74400.7460
90.90160.95770.90570.87270.88890.80070.8011
Mean0.85720.92760.84760.82910.83770.71030.7112
SD0.02990.01990.04160.03890.03410.06060.0604
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8980 0.9412 0.8972 0.8727 0.8848 0.7932 0.7935\n", "1 0.8816 0.9570 0.8318 0.8900 0.8599 0.7576 0.7589\n", "2 0.8408 0.9212 0.8505 0.7982 0.8235 0.6788 0.6799\n", "3 0.8286 0.9015 0.8302 0.7857 0.8073 0.6531 0.6539\n", "4 0.8115 0.9134 0.8208 0.7632 0.7909 0.6197 0.6210\n", "5 0.8402 0.8957 0.8208 0.8131 0.8169 0.6751 0.6751\n", "6 0.8279 0.9345 0.7642 0.8265 0.7941 0.6466 0.6481\n", "7 0.8689 0.9297 0.8585 0.8426 0.8505 0.7337 0.7338\n", "8 0.8730 0.9246 0.8962 0.8261 0.8597 0.7440 0.7460\n", "9 0.9016 0.9577 0.9057 0.8727 0.8889 0.8007 0.8011\n", "Mean 0.8572 0.9276 0.8476 0.8291 0.8377 0.7103 0.7112\n", "SD 0.0299 0.0199 0.0416 0.0389 0.0341 0.0606 0.0604" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "SD7RQpaaiJpJ", "colab": { "base_uri": "https://localhost:8080/", "height": 634, "referenced_widgets": [ "bce1c8fe885d45608d740beaadec1033", "7034122a4ff1489e9d7d26af63ce6af4", "bf891634e154429f9e7a228e21d84a2d", "2e407875db904ec0ae0a9b9ede4cd9ca", "55475be2cb3343bdac82821b1e7dc07b", "3ab14392cd464feca63d9f5bc7c721cf", "25ff3ee0e3ba4ac59b4b968455e6ffd1" ] }, "outputId": "a3a8f4b1-9ad8-48ce-c419-ad371b6a1317" }, "source": [ "evaluate_model(LR)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "bce1c8fe885d45608d740beaadec1033", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "ouT997cx7VIa", "colab": { "base_uri": "https://localhost:8080/", "height": 401 }, "outputId": "0bb2e8fe-f20c-44ed-c50a-58ddec171319" }, "source": [ "plot_model(LR, 'confusion_matrix')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", 
"text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "DTGqqou5_rKg", "colab": { "base_uri": "https://localhost:8080/", "height": 418 }, "outputId": "2af48b79-40bf-4550-ce74-12b4aa489bf3" }, "source": [ "plot_model(LR, 'feature')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "AfpCozhKUJMM" }, "source": [ "CatBoost" ] }, { "cell_type": "code", "metadata": { "id": "BaNWLrxg_RwN", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "465c097926b74791b7ed2dfeb41366e8", "26fb1c534a0f4c32850a5704b197684f", "729905d4b2234c8d9895a1fa6713748f" ] }, "outputId": "95788680-e13d-4c33-8a3c-3e88f25aab1e" }, "source": [ "catboost = create_model(estimator='catboost')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.87760.96570.86920.85320.86110.75160.7517
10.93470.98280.94390.90990.92660.86780.8683
20.88570.96190.91590.83760.87500.77010.7727
30.87760.96110.90570.82760.86490.75330.7559
40.88930.95590.92450.83760.87890.77750.7807
50.88110.95260.90570.83480.86880.76050.7626
60.90980.97190.87740.91180.89420.81570.8162
70.90160.97000.91510.86610.88990.80110.8021
80.91800.96690.94340.87720.90910.83460.8365
90.90980.98270.89620.89620.89620.81650.8165
Mean0.89850.96710.90970.86520.88650.79490.7963
SD0.01840.00960.02340.03050.01980.03680.0363
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8776 0.9657 0.8692 0.8532 0.8611 0.7516 0.7517\n", "1 0.9347 0.9828 0.9439 0.9099 0.9266 0.8678 0.8683\n", "2 0.8857 0.9619 0.9159 0.8376 0.8750 0.7701 0.7727\n", "3 0.8776 0.9611 0.9057 0.8276 0.8649 0.7533 0.7559\n", "4 0.8893 0.9559 0.9245 0.8376 0.8789 0.7775 0.7807\n", "5 0.8811 0.9526 0.9057 0.8348 0.8688 0.7605 0.7626\n", "6 0.9098 0.9719 0.8774 0.9118 0.8942 0.8157 0.8162\n", "7 0.9016 0.9700 0.9151 0.8661 0.8899 0.8011 0.8021\n", "8 0.9180 0.9669 0.9434 0.8772 0.9091 0.8346 0.8365\n", "9 0.9098 0.9827 0.8962 0.8962 0.8962 0.8165 0.8165\n", "Mean 0.8985 0.9671 0.9097 0.8652 0.8865 0.7949 0.7963\n", "SD 0.0184 0.0096 0.0234 0.0305 0.0198 0.0368 0.0363" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "iGxkUcOn_pHn", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "cc14420b2b9241d3b51fcf513404de1e", "108169e47ebe4b9bac95b4a38214dd1e", "ca04ad074d944f4daf5860fdd0393732" ] }, "outputId": "78f868fd-0ee5-4726-ae2c-3eed45061a77" }, "source": [ "TunedModel3 = tune_model(catboost)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.88570.96160.87850.86240.87040.76820.7683
10.93060.98270.93460.90910.92170.85940.8597
20.88570.95980.90650.84350.87390.76960.7713
30.88570.96390.91510.83620.87390.76980.7724
40.86890.95080.88680.82460.85450.73540.7370
50.88110.94890.90570.83480.86880.76050.7626
60.90160.97150.84910.91840.88240.79810.7999
70.90980.96450.93400.86840.90000.81810.8199
80.89750.96120.92450.85220.88690.79350.7957
90.91390.98180.91510.88990.90230.82540.8257
Mean0.89610.96470.90500.86390.88350.78980.7913
SD0.01740.01070.02540.03070.01870.03480.0344
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8857 0.9616 0.8785 0.8624 0.8704 0.7682 0.7683\n", "1 0.9306 0.9827 0.9346 0.9091 0.9217 0.8594 0.8597\n", "2 0.8857 0.9598 0.9065 0.8435 0.8739 0.7696 0.7713\n", "3 0.8857 0.9639 0.9151 0.8362 0.8739 0.7698 0.7724\n", "4 0.8689 0.9508 0.8868 0.8246 0.8545 0.7354 0.7370\n", "5 0.8811 0.9489 0.9057 0.8348 0.8688 0.7605 0.7626\n", "6 0.9016 0.9715 0.8491 0.9184 0.8824 0.7981 0.7999\n", "7 0.9098 0.9645 0.9340 0.8684 0.9000 0.8181 0.8199\n", "8 0.8975 0.9612 0.9245 0.8522 0.8869 0.7935 0.7957\n", "9 0.9139 0.9818 0.9151 0.8899 0.9023 0.8254 0.8257\n", "Mean 0.8961 0.9647 0.9050 0.8639 0.8835 0.7898 0.7913\n", "SD 0.0174 0.0107 0.0254 0.0307 0.0187 0.0348 0.0344" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "ZWnKH2A2Ah_R", "colab": { "base_uri": "https://localhost:8080/", "height": 1000, "referenced_widgets": [ "392d9d1a9fa146ab90b0a9e5949d6b61", "65706dd29fe5457bb1f2201f38b98161", "6e27df66c8244d3f8506606169a712e3", "d3f96bd6691643239b6757383587be54", "9e08f8f4343a441ab290545c679533cf", "e14d0ac066224518ac2eaef551c70c10", "a7a1a6b7f72e4a12bd574eb45c801b39" ] }, "outputId": "ba8c25bc-72e6-4e6f-cdc5-816ebb81fc54" }, "source": [ "evaluate_model(catboost)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "392d9d1a9fa146ab90b0a9e5949d6b61", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "uneAQNBXTZC5", "colab": { "base_uri": "https://localhost:8080/", "height": 401 }, "outputId": "b79abc7e-080b-4943-ff36-48f3559d942b" }, "source": [ "plot_model(catboost, 'confusion_matrix')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": 
"\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "K2Mg9VwdThZK", "colab": { "base_uri": "https://localhost:8080/", "height": 418 }, "outputId": "2e03e5c0-2e95-4feb-b74c-2560c3f72980" }, "source": [ "plot_model(catboost, 'feature')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "2s96g7J9jUFW", "colab": { "base_uri": "https://localhost:8080/", "height": 563 }, "outputId": "f2f0e19d-e650-46fb-aaef-fd0922cb152b" }, "source": [ "import seaborn as sns\n", "\n", "import matplotlib.pyplot as plt\n", "correlation_mat = ModelDataset2.corr()\n", "\n", "sns.heatmap(correlation_mat, annot = True)\n", "\n", "plt.show()\n" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "mR96DWU_FEQB" }, "source": [ "### Testing and Training" ] }, { "cell_type": "markdown", "metadata": { "id": "4g_e_cfcG5G5" }, "source": [ "In this section, the models are trained and tested with 60:40 and 80:20 train/test splits. Previously, a 70:30 split was used. The reason for doing this is to see whether the accuracy of the models changes. We look at the same three models as earlier. Included is a link showing all of the charts together so that it is easier to look through them. It shows that the same models reach similar accuracies even when the train/test ratio changes. The three models are Logistic Regression, CatBoost, and Extreme Gradient Boosting. All models and all train/test splits have shown that Snow Water Equivalent is important. https://drive.google.com/file/d/1njKn81QJfTAFwHFyHKL_ljy8a6pCZoV4/view?usp=sharing" ] }, { "cell_type": "code", "metadata": { "id": "b-sK6pFrFqGJ", "colab": { "base_uri": "https://localhost:8080/", "height": 616, "referenced_widgets": [ "afd584fbc8a24f1baaf7ffd336839df5", "9e412e3be60c4a65a00a62cc0900524c", "650fd903437f42138427259ae89385c0", "adc3728c289f4410b594a4212f5e729c", "dd30b884e50b47caa2c7eb30d7d5b397", "eb3d75a11c1c4575a621c248ccfe0f52", "60bb4204212e4b65b4e7fdf846790952", "7ea62fdec17144158b7fb4cfe3c83b21", "cf5589d70daf40ed94c7ffd89dac990e" ] }, "outputId": "f6ff91f4-f2a0-4954-baf2-98251e690e23" }, "source": [ "Model = setup(ModelDataset, target='Avalanche',train_size = 0.6,numeric_features=['Year'])\n", "compare_models()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
lightgbmLight Gradient Boosting Machine0.91410.96960.90370.89460.89860.82410.82490.115
etExtra Trees Classifier0.91260.97500.89920.89440.89660.82100.82130.515
rfRandom Forest Classifier0.91220.97310.91170.88460.89750.82070.82170.576
xgboostExtreme Gradient Boosting0.90550.96700.90260.87760.88940.80690.80792.537
catboostCatBoost Classifier0.90500.96610.90490.87480.88910.80610.80722.721
gbcGradient Boosting Classifier0.89690.96090.89910.86310.88000.78970.79120.310
knnK Neighbors Classifier0.88500.93990.87990.85220.86550.76510.76590.127
dtDecision Tree Classifier0.88350.88570.89920.83730.86660.76350.76590.027
adaAda Boost Classifier0.88160.95010.87200.85170.86130.75810.75880.160
lrLogistic Regression0.85920.92210.83800.83050.83350.71150.71250.314
nbNaive Bayes0.85870.90920.91160.78760.84450.71630.72380.021
qdaQuadratic Discriminant Analysis0.84630.91680.89460.77630.83070.69130.69810.020
ridgeRidge Classifier0.84340.00000.82210.81000.81510.67940.68050.017
ldaLinear Discriminant Analysis0.84340.91830.82210.81000.81510.67940.68050.021
svmSVM - Linear Kernel0.69790.00000.60250.66020.56950.36770.42680.026
\n", "
" ], "text/plain": [ " Model Accuracy AUC Recall Prec. \\\n", "lightgbm Light Gradient Boosting Machine 0.9141 0.9696 0.9037 0.8946 \n", "et Extra Trees Classifier 0.9126 0.9750 0.8992 0.8944 \n", "rf Random Forest Classifier 0.9122 0.9731 0.9117 0.8846 \n", "xgboost Extreme Gradient Boosting 0.9055 0.9670 0.9026 0.8776 \n", "catboost CatBoost Classifier 0.9050 0.9661 0.9049 0.8748 \n", "gbc Gradient Boosting Classifier 0.8969 0.9609 0.8991 0.8631 \n", "knn K Neighbors Classifier 0.8850 0.9399 0.8799 0.8522 \n", "dt Decision Tree Classifier 0.8835 0.8857 0.8992 0.8373 \n", "ada Ada Boost Classifier 0.8816 0.9501 0.8720 0.8517 \n", "lr Logistic Regression 0.8592 0.9221 0.8380 0.8305 \n", "nb Naive Bayes 0.8587 0.9092 0.9116 0.7876 \n", "qda Quadratic Discriminant Analysis 0.8463 0.9168 0.8946 0.7763 \n", "ridge Ridge Classifier 0.8434 0.0000 0.8221 0.8100 \n", "lda Linear Discriminant Analysis 0.8434 0.9183 0.8221 0.8100 \n", "svm SVM - Linear Kernel 0.6979 0.0000 0.6025 0.6602 \n", "\n", " F1 Kappa MCC TT (Sec) \n", "lightgbm 0.8986 0.8241 0.8249 0.115 \n", "et 0.8966 0.8210 0.8213 0.515 \n", "rf 0.8975 0.8207 0.8217 0.576 \n", "xgboost 0.8894 0.8069 0.8079 2.537 \n", "catboost 0.8891 0.8061 0.8072 2.721 \n", "gbc 0.8800 0.7897 0.7912 0.310 \n", "knn 0.8655 0.7651 0.7659 0.127 \n", "dt 0.8666 0.7635 0.7659 0.027 \n", "ada 0.8613 0.7581 0.7588 0.160 \n", "lr 0.8335 0.7115 0.7125 0.314 \n", "nb 0.8445 0.7163 0.7238 0.021 \n", "qda 0.8307 0.6913 0.6981 0.020 \n", "ridge 0.8151 0.6794 0.6805 0.017 \n", "lda 0.8151 0.6794 0.6805 0.021 \n", "svm 0.5695 0.3677 0.4268 0.026 " ] }, "metadata": { "tags": [] } }, { "output_type": "execute_result", "data": { "text/plain": [ "LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\n", " importance_type='split', learning_rate=0.1, max_depth=-1,\n", " min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,\n", " n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,\n", " random_state=4581, 
reg_alpha=0.0, reg_lambda=0.0, silent=True,\n", " subsample=1.0, subsample_for_bin=200000, subsample_freq=0)" ] }, "metadata": { "tags": [] }, "execution_count": 97 } ] }, { "cell_type": "code", "metadata": { "id": "sqZa1fdWgHVv", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "5f54753abe0e4486b04eb8d273109b4c", "87522b28665f4055afc2762b6d60ebe0", "547856fc003e480eb9533f7541f11b61" ] }, "outputId": "f3860f81-8179-4af3-9fd6-2807ac4868e6" }, "source": [ "XGB = create_model(estimator='xgboost')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.90480.96470.92130.86320.89130.80670.8081
10.89520.95160.87640.87640.87640.78550.7855
20.89520.95640.92130.84540.88170.78800.7904
30.90950.98160.93180.86320.89620.81620.8181
40.93330.97280.93180.91110.92130.86350.8637
50.87080.95900.84090.85060.84570.73460.7346
60.90430.96820.93180.85420.89130.80610.8086
70.93300.98650.93180.91110.92130.86300.8632
80.90430.97500.85230.91460.88240.80190.8033
90.90430.95460.88640.88640.88640.80370.8037
Mean0.90550.96700.90260.87760.88940.80690.8079
SD0.01720.01120.03380.02540.02070.03540.0353
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.9048 0.9647 0.9213 0.8632 0.8913 0.8067 0.8081\n", "1 0.8952 0.9516 0.8764 0.8764 0.8764 0.7855 0.7855\n", "2 0.8952 0.9564 0.9213 0.8454 0.8817 0.7880 0.7904\n", "3 0.9095 0.9816 0.9318 0.8632 0.8962 0.8162 0.8181\n", "4 0.9333 0.9728 0.9318 0.9111 0.9213 0.8635 0.8637\n", "5 0.8708 0.9590 0.8409 0.8506 0.8457 0.7346 0.7346\n", "6 0.9043 0.9682 0.9318 0.8542 0.8913 0.8061 0.8086\n", "7 0.9330 0.9865 0.9318 0.9111 0.9213 0.8630 0.8632\n", "8 0.9043 0.9750 0.8523 0.9146 0.8824 0.8019 0.8033\n", "9 0.9043 0.9546 0.8864 0.8864 0.8864 0.8037 0.8037\n", "Mean 0.9055 0.9670 0.9026 0.8776 0.8894 0.8069 0.8079\n", "SD 0.0172 0.0112 0.0338 0.0254 0.0207 0.0354 0.0353" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "6J5JEncjioBy", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "5505c035740744dba23dce1750ea4c06", "f48ed8a89f0a463eabd3c02d11807c26", "e3346fce67b341a189e271ae4dbbf637" ] }, "outputId": "78835874-f97e-442f-c220-ecbdbfadf8aa" }, "source": [ "TunedModel = tune_model(XGB)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.89520.95360.89890.86020.87910.78680.7874
10.87140.94900.78650.89740.83830.73240.7368
20.90000.95800.88760.87780.88270.79550.7956
30.90000.97570.88640.87640.88140.79490.7950
40.92380.96900.92050.90000.91010.84400.8442
50.90430.96260.86360.90480.88370.80250.8031
60.89470.95710.89770.85870.87780.78540.7860
70.92340.97870.90910.90910.90910.84300.8430
80.91870.97300.84090.96100.89700.83030.8353
90.89000.95280.82950.90120.86390.77180.7737
Mean0.90220.96290.87210.89470.88230.79870.8000
SD0.01550.01000.03960.02810.02000.03240.0319
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8952 0.9536 0.8989 0.8602 0.8791 0.7868 0.7874\n", "1 0.8714 0.9490 0.7865 0.8974 0.8383 0.7324 0.7368\n", "2 0.9000 0.9580 0.8876 0.8778 0.8827 0.7955 0.7956\n", "3 0.9000 0.9757 0.8864 0.8764 0.8814 0.7949 0.7950\n", "4 0.9238 0.9690 0.9205 0.9000 0.9101 0.8440 0.8442\n", "5 0.9043 0.9626 0.8636 0.9048 0.8837 0.8025 0.8031\n", "6 0.8947 0.9571 0.8977 0.8587 0.8778 0.7854 0.7860\n", "7 0.9234 0.9787 0.9091 0.9091 0.9091 0.8430 0.8430\n", "8 0.9187 0.9730 0.8409 0.9610 0.8970 0.8303 0.8353\n", "9 0.8900 0.9528 0.8295 0.9012 0.8639 0.7718 0.7737\n", "Mean 0.9022 0.9629 0.8721 0.8947 0.8823 0.7987 0.8000\n", "SD 0.0155 0.0100 0.0396 0.0281 0.0200 0.0324 0.0319" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "D9VxYXSRjfGA", "colab": { "base_uri": "https://localhost:8080/", "height": 1000, "referenced_widgets": [ "289080f92a784987bf9803c808c86b2f", "c00d0d4f76cf4b3ba143096fcabd9160", "1278fb36784f41728b5aed0c522375eb", "a391a8969f7044ddbb8f996f2ae9d841", "5983e5d1fcca4214afeeb0b6e3e9f01b", "5654c6ccc5e94fe5b4b6015c80437afd", "be8e6cd719384b719d8e05c54eab3225" ] }, "outputId": "99bf960f-dfb5-4209-ae4c-381a0c4bd384" }, "source": [ "evaluate_model(XGB)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "289080f92a784987bf9803c808c86b2f", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "Wih-yxD7kxYS", "colab": { "base_uri": "https://localhost:8080/", "height": 401, "referenced_widgets": [ "3f094aa3d2e34e2b988d99c742f9d393", "aa757b9ea18c486cac397ec90631be22", "2800e9fa0fa84f899598d83083a9f37f" ] }, "outputId": "01d760ff-a5ab-4619-f2d8-f34286b26b16" }, "source": [ 
"plot_model(XGB, 'confusion_matrix')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "RoSxqF1xnMhq", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "19bfaa8c92624fc49d00fb576eb168a0", "209a2ebbe1af4fc498e7ba114ccc3878", "3eb1e382648f4b47b0b31c76152573bd" ] }, "outputId": "95c76993-c8a3-4157-b610-e97b56c33c89" }, "source": [ "LR = create_model(estimator='lr')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.84290.90090.85390.79170.82160.68160.6831
10.85240.91500.82020.82950.82490.69730.6973
20.86670.91680.88760.81440.84950.73020.7324
30.89520.95710.86360.88370.87360.78420.7843
40.87620.93040.85230.85230.85230.74570.7457
50.87560.92150.86360.84440.85390.74560.7458
60.85170.91490.86360.80000.83060.69900.7006
70.87080.94860.85230.84270.84750.73540.7355
80.82780.91930.78410.80230.79310.64560.6457
90.83250.89590.73860.84420.78790.65060.6545
Mean0.85920.92210.83800.83050.83350.71150.7125
SD0.02030.01810.04270.02710.02600.04220.0416
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8429 0.9009 0.8539 0.7917 0.8216 0.6816 0.6831\n", "1 0.8524 0.9150 0.8202 0.8295 0.8249 0.6973 0.6973\n", "2 0.8667 0.9168 0.8876 0.8144 0.8495 0.7302 0.7324\n", "3 0.8952 0.9571 0.8636 0.8837 0.8736 0.7842 0.7843\n", "4 0.8762 0.9304 0.8523 0.8523 0.8523 0.7457 0.7457\n", "5 0.8756 0.9215 0.8636 0.8444 0.8539 0.7456 0.7458\n", "6 0.8517 0.9149 0.8636 0.8000 0.8306 0.6990 0.7006\n", "7 0.8708 0.9486 0.8523 0.8427 0.8475 0.7354 0.7355\n", "8 0.8278 0.9193 0.7841 0.8023 0.7931 0.6456 0.6457\n", "9 0.8325 0.8959 0.7386 0.8442 0.7879 0.6506 0.6545\n", "Mean 0.8592 0.9221 0.8380 0.8305 0.8335 0.7115 0.7125\n", "SD 0.0203 0.0181 0.0427 0.0271 0.0260 0.0422 0.0416" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "VYXTx0PnnNZj", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "6e579c53f5154dcc9f288f98732dfda5", "4a8be249ec484581994f11a00c835fd7", "224cb2b4e86f479d91d9fca0a4cff63b" ] }, "outputId": "e340ecf4-769a-449c-96bb-f0b65fa9fdb8" }, "source": [ "TunedModel = tune_model(LR)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.84290.90080.85390.79170.82160.68160.6831
10.85240.91500.82020.82950.82490.69730.6973
20.86670.91730.88760.81440.84950.73020.7324
30.89520.95710.86360.88370.87360.78420.7843
40.87620.92970.85230.85230.85230.74570.7457
50.87560.92150.86360.84440.85390.74560.7458
60.85170.91500.86360.80000.83060.69900.7006
70.87080.94860.85230.84270.84750.73540.7355
80.82780.91930.78410.80230.79310.64560.6457
90.83250.89590.73860.84420.78790.65060.6545
Mean0.85920.92200.83800.83050.83350.71150.7125
SD0.02030.01800.04270.02710.02600.04220.0416
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8429 0.9008 0.8539 0.7917 0.8216 0.6816 0.6831\n", "1 0.8524 0.9150 0.8202 0.8295 0.8249 0.6973 0.6973\n", "2 0.8667 0.9173 0.8876 0.8144 0.8495 0.7302 0.7324\n", "3 0.8952 0.9571 0.8636 0.8837 0.8736 0.7842 0.7843\n", "4 0.8762 0.9297 0.8523 0.8523 0.8523 0.7457 0.7457\n", "5 0.8756 0.9215 0.8636 0.8444 0.8539 0.7456 0.7458\n", "6 0.8517 0.9150 0.8636 0.8000 0.8306 0.6990 0.7006\n", "7 0.8708 0.9486 0.8523 0.8427 0.8475 0.7354 0.7355\n", "8 0.8278 0.9193 0.7841 0.8023 0.7931 0.6456 0.6457\n", "9 0.8325 0.8959 0.7386 0.8442 0.7879 0.6506 0.6545\n", "Mean 0.8592 0.9220 0.8380 0.8305 0.8335 0.7115 0.7125\n", "SD 0.0203 0.0180 0.0427 0.0271 0.0260 0.0422 0.0416" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "ejO1H3OrnTUF", "colab": { "base_uri": "https://localhost:8080/", "height": 169, "referenced_widgets": [ "8f6833e896f24ce1b691f340f19acbf3", "4a39820fd6e34def9e7df8b60b827dd4", "3745871b9e9d4960b65954a97c83eff2", "4a103d29196a45ddb2be13242dc5948d", "d4177e6dc2a34c94850207968293f112", "e8ffa2e43da84377803186697fdf7bd6", "61900fd657354669ac47d7fc218f0e63", "e5653ef1f4ac4568af5ca682912df39c", "bc82ef6f0b8f49f6a44179bd6b853445", "e05532a49de54883a2776a4ce69ff02e", "70b3c58232134d9cac7db23f5b62bfda", "c4db2e658ea54e1f896d3695a75fb0f8", "0edb902376534a8fbd01c22af54b7c27" ] }, "outputId": "6fe535b6-b886-4556-8a65-5311c788b434" }, "source": [ "evaluate_model(LR)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "8f6833e896f24ce1b691f340f19acbf3", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "4NutmU9xnsI5", "colab": { "base_uri": "https://localhost:8080/", "height": 401 }, 
"outputId": "f4e36e8b-a1b4-4119-e08d-367284ad09b5" }, "source": [ "plot_model(LR, 'confusion_matrix')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "u7s3L2rfoL2T", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "3659c16a4759447f9c8b2e9e1bd7860f", "ea4bd0ed110e4818a61de5d741d65792", "ab3daf44e84e407f89d82424587c45d2" ] }, "outputId": "7fb30ea4-4983-4e61-de43-a25d1d22d11c" }, "source": [ "catboost = create_model(estimator='catboost')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.90480.96510.92130.86320.89130.80670.8081
10.88570.95520.85390.87360.86360.76530.7654
20.89520.95600.91010.85260.88040.78740.7887
30.91900.97560.93180.88170.90610.83500.8360
40.91430.97310.93180.87230.90110.82560.8270
50.91870.96790.92050.89010.90500.83390.8343
60.89000.96240.92050.83510.87570.77740.7803
70.92820.97870.94320.89250.91710.85390.8549
80.90430.97670.86360.90480.88370.80250.8031
90.89000.94990.85230.88240.86710.77320.7736
Mean0.90500.96610.90490.87480.88910.80610.8072
SD0.01390.00950.03280.01940.01700.02870.0286
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.9048 0.9651 0.9213 0.8632 0.8913 0.8067 0.8081\n", "1 0.8857 0.9552 0.8539 0.8736 0.8636 0.7653 0.7654\n", "2 0.8952 0.9560 0.9101 0.8526 0.8804 0.7874 0.7887\n", "3 0.9190 0.9756 0.9318 0.8817 0.9061 0.8350 0.8360\n", "4 0.9143 0.9731 0.9318 0.8723 0.9011 0.8256 0.8270\n", "5 0.9187 0.9679 0.9205 0.8901 0.9050 0.8339 0.8343\n", "6 0.8900 0.9624 0.9205 0.8351 0.8757 0.7774 0.7803\n", "7 0.9282 0.9787 0.9432 0.8925 0.9171 0.8539 0.8549\n", "8 0.9043 0.9767 0.8636 0.9048 0.8837 0.8025 0.8031\n", "9 0.8900 0.9499 0.8523 0.8824 0.8671 0.7732 0.7736\n", "Mean 0.9050 0.9661 0.9049 0.8748 0.8891 0.8061 0.8072\n", "SD 0.0139 0.0095 0.0328 0.0194 0.0170 0.0287 0.0286" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "F7f6R9Iwoa60", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "9c93b53066f449cabffe42495002ff2b", "84de493313c4416ba147b8514bdf5ccd", "e8696e757e9140d38d0dec51809b5a37" ] }, "outputId": "4f69623f-55df-4a46-cad3-7f80b844b1f2" }, "source": [ "TunedModel = tune_model(catboost)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.89050.96500.89890.85110.87430.77740.7783
10.89520.95890.87640.87640.87640.78550.7855
20.89050.95890.92130.83670.87700.77870.7816
30.91900.97620.92050.89010.90500.83450.8349
40.92380.97620.93180.89130.91110.84450.8451
50.91390.96870.88640.90700.89660.82280.8230
60.90430.96660.93180.85420.89130.80610.8086
70.91870.98500.94320.87370.90710.83500.8369
80.92820.97700.88640.93980.91230.85160.8527
90.89470.95240.86360.88370.87360.78340.7836
Mean0.90790.96850.90600.88040.89250.81200.8130
SD0.01380.00960.02580.02820.01520.02760.0275
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8905 0.9650 0.8989 0.8511 0.8743 0.7774 0.7783\n", "1 0.8952 0.9589 0.8764 0.8764 0.8764 0.7855 0.7855\n", "2 0.8905 0.9589 0.9213 0.8367 0.8770 0.7787 0.7816\n", "3 0.9190 0.9762 0.9205 0.8901 0.9050 0.8345 0.8349\n", "4 0.9238 0.9762 0.9318 0.8913 0.9111 0.8445 0.8451\n", "5 0.9139 0.9687 0.8864 0.9070 0.8966 0.8228 0.8230\n", "6 0.9043 0.9666 0.9318 0.8542 0.8913 0.8061 0.8086\n", "7 0.9187 0.9850 0.9432 0.8737 0.9071 0.8350 0.8369\n", "8 0.9282 0.9770 0.8864 0.9398 0.9123 0.8516 0.8527\n", "9 0.8947 0.9524 0.8636 0.8837 0.8736 0.7834 0.7836\n", "Mean 0.9079 0.9685 0.9060 0.8804 0.8925 0.8120 0.8130\n", "SD 0.0138 0.0096 0.0258 0.0282 0.0152 0.0276 0.0275" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "XVMyXIFJodSw", "colab": { "base_uri": "https://localhost:8080/", "height": 1000, "referenced_widgets": [ "679526b38f8c47ad9a8759d066aabb5c", "4bb43807c6ed4bbb8bc7a1de36170aad", "15bacfbd614c48e7ac46997961421489", "9d221ee267124302b6aac1bab99db046", "c0a39ef9ad4c46bca8299fb6a5fffec8", "29af3b998a664828a5afa4b9f7dda07c", "bc3075446d0348bcb00f9a672dcc8ad1" ] }, "outputId": "f3531890-87f9-482a-f21a-c3de8ec5cc88" }, "source": [ "evaluate_model(catboost)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "679526b38f8c47ad9a8759d066aabb5c", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "-A_sFs8OojtI", "colab": { "base_uri": "https://localhost:8080/", "height": 758, "referenced_widgets": [ "69bbea89321f407eae6f435e00728d9d", "5facd9a5cac94c8d87e51d5d79cc6aca", "75c2ebf71ba14b8da324d470fde6096b" ] }, "outputId": "3682454a-6d30-4982-8b5f-298512b2d99e" }, "source": [ 
"plot_model(catboost, 'confusion_matrix')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "69bbea89321f407eae6f435e00728d9d", "version_minor": 0, "version_major": 2 }, "text/plain": [ "IntProgress(value=0, description='Processing: ', max=5)" ] }, "metadata": { "tags": [] } }, { "output_type": "error", "ename": "TypeError", "evalue": "ignored", "traceback": [ "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", "\u001b[0;31mTypeError\u001b[0m Traceback (most recent call last)", "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mplot_model\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcatboost\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m'confusion_matrix'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pycaret/classification.py\u001b[0m in \u001b[0;36mplot_model\u001b[0;34m(estimator, plot, scale, save, fold, fit_kwargs, groups, use_train_data, verbose)\u001b[0m\n\u001b[1;32m 1539\u001b[0m \u001b[0mverbose\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mverbose\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1540\u001b[0m \u001b[0muse_train_data\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0muse_train_data\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1541\u001b[0;31m \u001b[0msystem\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1542\u001b[0m )\n\u001b[1;32m 1543\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pycaret/internal/tabular.py\u001b[0m in \u001b[0;36mplot_model\u001b[0;34m(estimator, plot, scale, save, fold, fit_kwargs, groups, feature_name, 
label, use_train_data, verbose, system, display)\u001b[0m\n\u001b[1;32m 7167\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7168\u001b[0m \u001b[0;31m# execute the plot method\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 7169\u001b[0;31m \u001b[0mret\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mlocals\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mplot\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 7170\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mret\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7171\u001b[0m \u001b[0mplot_filename\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mret\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pycaret/internal/tabular.py\u001b[0m in \u001b[0;36mconfusion_matrix\u001b[0;34m()\u001b[0m\n\u001b[1;32m 6451\u001b[0m \u001b[0mfit_kwargs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mfit_kwargs\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 6452\u001b[0m \u001b[0mgroups\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mgroups\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 6453\u001b[0;31m \u001b[0mdisplay\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mdisplay\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 6454\u001b[0m )\n\u001b[1;32m 6455\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pycaret/internal/plotting.py\u001b[0m in \u001b[0;36mshow_yellowbrick_plot\u001b[0;34m(visualizer, X_train, y_train, X_test, y_test, name, handle_train, handle_test, scale, save, fit_kwargs, groups, display, **kwargs)\u001b[0m\n\u001b[1;32m 59\u001b[0m \u001b[0;32melif\u001b[0m 
\u001b[0mhandle_test\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0;34m\"score\"\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 60\u001b[0m \u001b[0mlogger\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0minfo\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"Scoring test/hold-out set\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 61\u001b[0;31m \u001b[0mvisualizer\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mscore\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mX_test\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my_test\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 62\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 63\u001b[0m \u001b[0mdisplay\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmove_progress\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/yellowbrick/classifier/confusion_matrix.py\u001b[0m in \u001b[0;36mscore\u001b[0;34m(self, X, y)\u001b[0m\n\u001b[1;32m 206\u001b[0m \u001b[0;31m# Compute the confusion matrix and class counts\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 207\u001b[0m self.confusion_matrix_ = confusion_matrix_metric(\n\u001b[0;32m--> 208\u001b[0;31m \u001b[0my\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my_pred\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mlabels\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mlabels\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0msample_weight\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msample_weight\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 209\u001b[0m )\n\u001b[1;32m 210\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mclass_counts_\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0mdict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mzip\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0munique\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0my\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreturn_counts\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/sklearn/utils/validation.py\u001b[0m in \u001b[0;36minner_f\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 70\u001b[0m FutureWarning)\n\u001b[1;32m 71\u001b[0m \u001b[0mkwargs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mupdate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0marg\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0marg\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mzip\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msig\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mparameters\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 72\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mf\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 73\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0minner_f\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 74\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/sklearn/metrics/_classification.py\u001b[0m in \u001b[0;36mconfusion_matrix\u001b[0;34m(y_true, y_pred, labels, sample_weight, normalize)\u001b[0m\n\u001b[1;32m 274\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 275\u001b[0m \"\"\"\n\u001b[0;32m--> 276\u001b[0;31m 
\u001b[0my_type\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my_true\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my_pred\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0m_check_targets\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0my_true\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my_pred\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 277\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0my_type\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32min\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0;34m\"binary\"\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m\"multiclass\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 278\u001b[0m \u001b[0;32mraise\u001b[0m \u001b[0mValueError\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"%s is not supported\"\u001b[0m \u001b[0;34m%\u001b[0m \u001b[0my_type\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/sklearn/metrics/_classification.py\u001b[0m in \u001b[0;36m_check_targets\u001b[0;34m(y_true, y_pred)\u001b[0m\n\u001b[1;32m 102\u001b[0m \u001b[0my_pred\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcolumn_or_1d\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0my_pred\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 103\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0my_type\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0;34m\"binary\"\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 104\u001b[0;31m \u001b[0munique_values\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0munion1d\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0my_true\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my_pred\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 105\u001b[0m \u001b[0;32mif\u001b[0m 
\u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0munique_values\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0;36m2\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 106\u001b[0m \u001b[0my_type\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m\"multiclass\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m<__array_function__ internals>\u001b[0m in \u001b[0;36munion1d\u001b[0;34m(*args, **kwargs)\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/numpy/lib/arraysetops.py\u001b[0m in \u001b[0;36munion1d\u001b[0;34m(ar1, ar2)\u001b[0m\n\u001b[1;32m 736\u001b[0m \u001b[0marray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m2\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m3\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m4\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m6\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 737\u001b[0m \"\"\"\n\u001b[0;32m--> 738\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0munique\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mconcatenate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mar1\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mar2\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 739\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 740\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m<__array_function__ internals>\u001b[0m in \u001b[0;36munique\u001b[0;34m(*args, **kwargs)\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/numpy/lib/arraysetops.py\u001b[0m in \u001b[0;36munique\u001b[0;34m(ar, return_index, return_inverse, return_counts, 
axis)\u001b[0m\n\u001b[1;32m 261\u001b[0m \u001b[0mar\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0masanyarray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mar\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 262\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0maxis\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 263\u001b[0;31m \u001b[0mret\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0m_unique1d\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mar\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreturn_index\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreturn_inverse\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreturn_counts\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 264\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0m_unpack_tuple\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mret\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 265\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/numpy/lib/arraysetops.py\u001b[0m in \u001b[0;36m_unique1d\u001b[0;34m(ar, return_index, return_inverse, return_counts)\u001b[0m\n\u001b[1;32m 309\u001b[0m \u001b[0maux\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mar\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mperm\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 310\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 311\u001b[0;31m \u001b[0mar\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msort\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 312\u001b[0m \u001b[0maux\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0mar\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 313\u001b[0m \u001b[0mmask\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mempty\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0maux\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbool_\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;31mTypeError\u001b[0m: '<' not supported between instances of 'int' and 'str'" ] }, { "output_type": "display_data", "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAegAAAFOCAYAAABNFY7/AAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4yLjIsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy+WH4yJAAATm0lEQVR4nO3dX2jd9f3H8VfSpBk0pTTQrPaPsxRKWYJiWwVJsbOkww0vxaTMPzhRBN3QWYZ2w8hmYgXdxdQLkbGLKrUiYexC7GAojJquLmyVRKR/wFD/0CZWy1K11vX8LsRgf2pOWnuaT5vH4yrffr+e8+aN5en5nvZrXaVSqQQAKEr9dA8AAHydQANAgQQaAAok0ABQIIEGgAIJNAAUaEqB3rt3bzo7O/Pss89+7dxrr72W66+/Pl1dXXnqqafO+oAAMBNVDfTHH3+c3//+97nqqqu+8fzDDz+cJ554Itu2bcvOnTuzf//+sz4kAMw0VQM9e/bsPPPMM2ltbf3auYMHD2bevHm56KKLUl9fn3Xr1mVgYKAmgwLATNJQ9YKGhjQ0fPNlo6OjaWlpmThuaWnJwYMHv/W1Tp48mWPHjqWxsTF1dXVnMC4AnF8qlUpOnDiROXPmpL5+6n/0q2qgz6Zjx45l79695/ItAaAIK1asyNy5c6d8/XcKdGtra8bGxiaODx069I23wr/U2NiY5IshZ8+e/V3emkkMDQ2lvb19use44Nlz7dlx7dlx7X322WfZu3fvRAOn6jsFesmSJRkfH88777yThQsX5pVXXsljjz32rdd/eVt79uzZaWpq+i5vTRX2e27Yc+3Zce3Z8blxul/tVg300NBQHn300bz77rtpaGjIjh07sn79+ixZsiQbNmzIQw89lPvuuy9J8tOf/jTLli07s8kBgAlVA93e3p6tW7d+6/krrrgi27dvP6tDAcBM50liAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABSoYSoX9fX1Zc+ePamrq8vmzZtz6aWXTpx77rnn8te//jX19fVpb2/Pb37zm5oNCwAzRdVP0Lt3787I
yEi2b9+e3t7e9Pb2TpwbHx/Pn/70pzz33HPZtm1bDhw4kP/85z81HRgAZoKqgR4YGEhnZ2eSZPny5Tl69GjGx8eTJI2NjWlsbMzHH3+czz//PJ988knmzZtX24kBYAaoGuixsbHMnz9/4rilpSWjo6NJkqamptx1113p7OzMNddck8suuyzLli2r3bQAMENM6Tvor6pUKhM/j4+P5+mnn87LL7+c5ubm3HLLLXnrrbeycuXKSV9jaGjo9CfltAwODk73CDOCPdeeHdeeHZepaqBbW1szNjY2cXz48OEsWLAgSXLgwIEsXbo0LS0tSZI1a9ZkaGioaqDb29vT1NT0XeZmEoODg1m9evV0j3HBs+fas+Pas+PaO378+Bl9MK16i7ujoyM7duxIkgwPD6e1tTXNzc1JksWLF+fAgQP59NNPk3zxyfiSSy457SEAgFNV/QS9atWqtLW1pbu7O3V1denp6Ul/f3/mzp2bDRs25LbbbsvNN9+cWbNm5fLLL8+aNWvOxdwAcEGb0nfQmzZtOuX4q7ewu7u7093dfXanAoAZzpPEAKBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoAChQw1Qu6uvry549e1JXV5fNmzfn0ksvnTj3/vvv51e/+lVOnDiRH/7wh/nd735Xs2EBYKao+gl69+7dGRkZyfbt29Pb25ve3t5Tzm/ZsiU///nP8+KLL2bWrFl57733ajYsAMwUVQM9MDCQzs7OJMny5ctz9OjRjI+PJ0lOnjyZwcHBrF+/PknS09OTRYsW1XBcAJgZqt7iHhsbS1tb28RxS0tLRkdH09zcnCNHjmTOnDl55JFHMjw8nDVr1uS+++6r+qZDQ0PfbWqqGhwcnO4RZgR7rj07rj07LtOUvoP+qkqlcsrPhw4dys0335zFixfnjjvuyKuvvpof/ehHk75Ge3t7mpqaTntYpmZwcDCrV6+e7jEuePZce3Zce3Zce8ePHz+jD6ZVb3G3trZmbGxs4vjw4cNZsGBBkmT+/PlZtGhRLr744syaNStXXXVV9u3bd9pDAACnqhrojo6O7NixI0kyPDyc1tbWNDc3J0kaGhqydOnSvP322xPnly1bVrtpAWCGqHqLe9WqVWlra0t3d3fq6urS09OT/v7+zJ07Nxs2bMjmzZtz//33p1KpZMWKFRN/YAwAOHNT+g5606ZNpxyvXLly4ucf/OAH2bZt29mdCgBmOE8SA4ACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAUwp0X19furq60t3dnTfeeOMbr3n88cdz0003ndXhAGCmqhro3bt3Z2RkJNu3b09vb296e3u/ds3+/fvz+uuv12RAAJiJqgZ6YGAgnZ2dSZLly5fn6NGjGR8fP+WaLVu25N57763NhAAwAzVUu2BsbCxtbW0Txy0tLRkdHU1zc3OSpL+/P1deeWUWL1485TcdGho6g1E5HYODg9M9woxgz7Vnx7Vn
x2WqGuj/r1KpTPz80Ucfpb+/P3/+859z6NChKb9Ge3t7mpqaTvetmaLBwcGsXr16use44Nlz7dlx7dlx7R0/fvyMPphWvcXd2tqasbGxiePDhw9nwYIFSZJdu3blyJEj+dnPfpa77747w8PD6evrO+0hAIBTVQ10R0dHduzYkSQZHh5Oa2vrxO3ta6+9Ni+99FJeeOGFPPnkk2lra8vmzZtrOzEAzABVb3GvWrUqbW1t6e7uTl1dXXp6etLf35+5c+dmw4YN52JGAJhxpvQd9KZNm045Xrly5deuWbJkSbZu3Xp2pgKAGc6TxACgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAVqmMpFfX192bNnT+rq6rJ58+ZceumlE+d27dqVP/zhD6mvr8+yZcvS29ub+nrdB4DvompJd+/enZGRkWzfvj29vb3p7e095fyDDz6YP/7xj3n++edz7Nix/OMf/6jZsAAwU1QN9MDAQDo7O5Mky5cvz9GjRzM+Pj5xvr+/PwsXLkyStLS05MMPP6zRqAAwc1QN9NjYWObPnz9x3NLSktHR0Ynj5ubmJMnhw4ezc+fOrFu3rgZjAsDMMqXvoL+qUql87dc++OCD3Hnnnenp6Tkl5t9maGjodN+W0zQ4ODjdI8wI9lx7dlx7dlymqoFubW3N2NjYxPHhw4ezYMGCiePx8fHcfvvtueeee7J27dopvWl7e3uamprOYFymYnBwMKtXr57uMS549lx7dlx7dlx7x48fP6MPplVvcXd0dGTHjh1JkuHh4bS2tk7c1k6SLVu25JZbbsnVV1992m8OAHyzqp+gV61alba2tnR3d6euri49PT3p7+/P3Llzs3bt2vzlL3/JyMhIXnzxxSTJddddl66urpoPDgAXsil9B71p06ZTjleuXDnxs++TAeDs80QRACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAok0ABQIIEGgAIJNAAUSKABoEACDQAFEmgAKJBAA0CBBBoACiTQAFAggQaAAgk0ABRIoAGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFEigAaBAAg0ABRJoACiQQANAgQQaAAo0pUD39fWlq6sr3d3deeONN04599prr+X6669PV1dXnnrqqZoMCQAzTdVA7969OyMjI9m+fXt6e3vT29t7yvmHH344TzzxRLZt25adO3dm//79NRsWAGaKqoEeGBhIZ2dnkmT58uU5evRoxsfHkyQHDx7MvHnzctFFF6W+vj7r1q3LwMBAbScGgBmgodoFY2NjaWtrmzhuaWnJ6OhompubMzo6mpaWllPOHTx48Ftfq1KpJEk+++yz7zIzU3D8+PHpHmFGsOfas+Pas+Pa+rJ5XzZwqqoG+v873Tf4qhMnTiRJ9u7de8avwdQMDQ1N9wgzgj3Xnh3Xnh2fGydOnMj3vve9KV9fNdCtra0ZGxubOD58+HAWLFjwjecOHTqU1tbWb32tOXPmZMWKFWlsbExdXd2UhwSA81WlUsmJEycyZ86c0/rnqga6o6MjTzzxRLq7uzM8PJzW1tY0NzcnSZYsWZLx8fG88847WbhwYV555ZU89thj3/pa9fX1mTt37mkNCADnu9P55Pyl
usoU7lk/9thj+de//pW6urr09PTkzTffzNy5c7Nhw4a8/vrrE1H+8Y9/nNtuu+30JwcATjGlQAMA55YniQFAgQQaAApU00B7RGjtTbbjXbt25YYbbkh3d3ceeOCBnDx5cpqmPL9NtuMvPf7447npppvO8WQXjsl2/P7772fjxo25/vrr8+CDD07ThBeGyfb83HPPpaurKxs3bvzaEyOZur1796azszPPPvvs186ddvcqNfLPf/6zcscdd1QqlUpl//79lRtuuOGU8z/5yU8q7733XuV///tfZePGjZV9+/bVapQLVrUdb9iwofL+++9XKpVK5Re/+EXl1VdfPecznu+q7bhSqVT27dtX6erqqtx4443nerwLQrUd//KXv6z87W9/q1QqlcpDDz1Ueffdd8/5jBeCyfb83//+t3LNNddUTpw4UalUKpVbb7218u9//3ta5jyfHTt2rHLjjTdWfvvb31a2bt36tfOn272afYL2iNDam2zHSdLf35+FCxcm+eIpbx9++OG0zHk+q7bjJNmyZUvuvffe6RjvgjDZjk+ePJnBwcGsX78+SdLT05NFixZN26zns8n23NjYmMbGxnz88cf5/PPP88knn2TevHnTOe55afbs2XnmmWe+8XkgZ9K9mgV6bGws8+fPnzj+8hGhSb7xEaFfnmPqJttxkom/r3748OHs3Lkz69atO+cznu+q7bi/vz9XXnllFi9ePB3jXRAm2/GRI0cyZ86cPPLII9m4cWMef/zx6RrzvDfZnpuamnLXXXels7Mz11xzTS677LIsW7ZsukY9bzU0NHzr33c+k+6dsz8kVvG3uWrum3b8wQcf5M4770xPT88pvzk5M1/d8UcffZT+/v7ceuut0zjRheerO65UKjl06FBuvvnmPPvss3nzzTfz6quvTt9wF5Cv7nl8fDxPP/10Xn755fz973/Pnj178tZbb03jdCQ1DPTZfEQo32yyHSdf/Ka7/fbbc88992Tt2rXTMeJ5b7Id79q1K0eOHMnPfvaz3H333RkeHk5fX990jXremmzH8+fPz6JFi3LxxRdn1qxZueqqq7Jv377pGvW8NtmeDxw4kKVLl6alpSWzZ8/OmjVrPJ/7LDuT7tUs0B0dHdmxY0eSTPqI0M8//zyvvPJKOjo6ajXKBWuyHSdffDd6yy235Oqrr56uEc97k+342muvzUsvvZQXXnghTz75ZNra2rJ58+bpHPe8NNmOGxoasnTp0rz99tsT5916PTOT7Xnx4sU5cOBAPv300yRf/M8zLrnkkuka9YJ0Jt2r6ZPEPCK09r5tx2vXrs0VV1yRyy+/fOLa6667Ll1dXdM47flpsn+Pv/TOO+/kgQceyNatW6dx0vPXZDseGRnJ/fffn0qlkhUrVuShhx5Kfb1HOJyJyfb8/PPPp7+/P7Nmzcrll1+eX//619M97nlnaGgojz76aN599900NDTk+9//ftavX58lS5acUfc86hMACuQ/QwGgQAINAAUSaAAokEADQIEEGgAKJNAAUCCBBoACCTQAFOj/ALjguq4NbxIbAAAAAElFTkSuQmCC\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "IK5koP97dMM1", "colab": { "base_uri": "https://localhost:8080/", "height": 650, "referenced_widgets": [ "8707725331314861821ce500a3eeffac", "4be5360cabe647d5849b88f489b6cd20", "eb95926f6a4944c292da60aa0213e396", "8395d1cb9e454d068dd6a3db160fc9c6", "b8d139ba355646888a39dfaa52bb6c36", "6d74e458826c4bd1aed9dca2760c8ca0", "c24b28b804be4c248eba0b3eb3099673", "5737d68310e24f188f9a1c8844aa4831", "0df65d85f8fc4afd845d8a8346d0ac00" ] }, "outputId": "eae9f466-b458-4330-db8b-7275394be7ff" }, "source": [ "Model = setup(ModelDataset, target='Avalanche',train_size = 0.8,numeric_features=['Year'])\n", "compare_models()" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
etExtra Trees Classifier0.91660.97670.90190.90300.90230.82950.82980.518
rfRandom Forest Classifier0.91440.97410.91200.89100.90100.82570.82630.617
xgboostExtreme Gradient Boosting0.91410.97000.91540.88760.90090.82510.82590.787
lightgbmLight Gradient Boosting Machine0.91370.97020.91370.88800.90050.82430.82490.125
catboostCatBoost Classifier0.91230.96980.91290.88590.89880.82140.82233.152
gbcGradient Boosting Classifier0.89940.96510.90700.86440.88500.79570.79670.386
dtDecision Tree Classifier0.89190.89280.89940.85570.87660.78050.78190.028
knnK Neighbors Classifier0.88690.94430.88690.85430.86990.76990.77090.125
adaAda Boost Classifier0.88000.94730.88350.84360.86280.75640.75740.176
nbNaive Bayes0.85860.91400.90450.79370.84530.71610.72160.020
lrLogistic Regression0.85460.92520.83820.82490.83120.70360.70410.346
qdaQuadratic Discriminant Analysis0.84930.91980.90280.77950.83640.69800.70500.020
ldaLinear Discriminant Analysis0.84210.92120.82730.80800.81730.67830.67880.021
ridgeRidge Classifier0.84170.00000.82650.80790.81680.67750.67810.018
svmSVM - Linear Kernel0.72750.00000.64670.77940.63980.43560.50250.030
\n", "
" ], "text/plain": [ " Model Accuracy AUC Recall Prec. \\\n", "et Extra Trees Classifier 0.9166 0.9767 0.9019 0.9030 \n", "rf Random Forest Classifier 0.9144 0.9741 0.9120 0.8910 \n", "xgboost Extreme Gradient Boosting 0.9141 0.9700 0.9154 0.8876 \n", "lightgbm Light Gradient Boosting Machine 0.9137 0.9702 0.9137 0.8880 \n", "catboost CatBoost Classifier 0.9123 0.9698 0.9129 0.8859 \n", "gbc Gradient Boosting Classifier 0.8994 0.9651 0.9070 0.8644 \n", "dt Decision Tree Classifier 0.8919 0.8928 0.8994 0.8557 \n", "knn K Neighbors Classifier 0.8869 0.9443 0.8869 0.8543 \n", "ada Ada Boost Classifier 0.8800 0.9473 0.8835 0.8436 \n", "nb Naive Bayes 0.8586 0.9140 0.9045 0.7937 \n", "lr Logistic Regression 0.8546 0.9252 0.8382 0.8249 \n", "qda Quadratic Discriminant Analysis 0.8493 0.9198 0.9028 0.7795 \n", "lda Linear Discriminant Analysis 0.8421 0.9212 0.8273 0.8080 \n", "ridge Ridge Classifier 0.8417 0.0000 0.8265 0.8079 \n", "svm SVM - Linear Kernel 0.7275 0.0000 0.6467 0.7794 \n", "\n", " F1 Kappa MCC TT (Sec) \n", "et 0.9023 0.8295 0.8298 0.518 \n", "rf 0.9010 0.8257 0.8263 0.617 \n", "xgboost 0.9009 0.8251 0.8259 0.787 \n", "lightgbm 0.9005 0.8243 0.8249 0.125 \n", "catboost 0.8988 0.8214 0.8223 3.152 \n", "gbc 0.8850 0.7957 0.7967 0.386 \n", "dt 0.8766 0.7805 0.7819 0.028 \n", "knn 0.8699 0.7699 0.7709 0.125 \n", "ada 0.8628 0.7564 0.7574 0.176 \n", "nb 0.8453 0.7161 0.7216 0.020 \n", "lr 0.8312 0.7036 0.7041 0.346 \n", "qda 0.8364 0.6980 0.7050 0.020 \n", "lda 0.8173 0.6783 0.6788 0.021 \n", "ridge 0.8168 0.6775 0.6781 0.018 \n", "svm 0.6398 0.4356 0.5025 0.030 " ] }, "metadata": { "tags": [] } }, { "output_type": "execute_result", "data": { "text/plain": [ "ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,\n", " criterion='gini', max_depth=None, max_features='auto',\n", " max_leaf_nodes=None, max_samples=None,\n", " min_impurity_decrease=0.0, min_impurity_split=None,\n", " min_samples_leaf=1, min_samples_split=2,\n", " 
min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,\n", " oob_score=False, random_state=5221, verbose=0,\n", " warm_start=False)" ] }, "metadata": { "tags": [] }, "execution_count": 112 } ] }, { "cell_type": "code", "metadata": { "id": "zhEEYGIVg6KY", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "8dd10b0c4c8e4c2d899ca98ddf26f19f", "4cf7d8abf42d43239a03e760182abacd", "46c96d3cfe814a7fb86366bdf21700ea" ] }, "outputId": "f6acd055-43a6-41ff-faeb-1f521bcfe12d" }, "source": [ "# Baseline XGBoost classifier; the per-fold cross-validation scores are displayed below.\n", "XGB = create_model('xgboost')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.91430.97560.90830.89340.90080.82540.8255
10.91070.96330.86670.92040.89270.81640.8175
20.92140.97350.91670.90160.90910.83990.8400
30.91400.97400.92440.88000.90160.82530.8261
40.90320.94760.89920.87700.88800.80280.8030
50.91760.97490.94120.87500.90690.83310.8349
60.89960.96230.90760.86400.88520.79620.7969
70.92110.96740.90760.90760.90760.83880.8388
80.90680.97280.91600.87200.89340.81070.8115
90.93190.98860.96640.88460.92370.86240.8652
Mean0.91410.97000.91540.88760.90090.82510.8259
SD0.00910.01020.02480.01690.01100.01870.0191
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.9143 0.9756 0.9083 0.8934 0.9008 0.8254 0.8255\n", "1 0.9107 0.9633 0.8667 0.9204 0.8927 0.8164 0.8175\n", "2 0.9214 0.9735 0.9167 0.9016 0.9091 0.8399 0.8400\n", "3 0.9140 0.9740 0.9244 0.8800 0.9016 0.8253 0.8261\n", "4 0.9032 0.9476 0.8992 0.8770 0.8880 0.8028 0.8030\n", "5 0.9176 0.9749 0.9412 0.8750 0.9069 0.8331 0.8349\n", "6 0.8996 0.9623 0.9076 0.8640 0.8852 0.7962 0.7969\n", "7 0.9211 0.9674 0.9076 0.9076 0.9076 0.8388 0.8388\n", "8 0.9068 0.9728 0.9160 0.8720 0.8934 0.8107 0.8115\n", "9 0.9319 0.9886 0.9664 0.8846 0.9237 0.8624 0.8652\n", "Mean 0.9141 0.9700 0.9154 0.8876 0.9009 0.8251 0.8259\n", "SD 0.0091 0.0102 0.0248 0.0169 0.0110 0.0187 0.0191" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "kmNsROM5ilKd", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "3516024e5141494ba968244737483245", "4885cdb5a3d2483e924c0cc0d75f97e5", "dfb224af140240ecb4e4b055a3238bf8" ] }, "outputId": "ed61f6a5-1081-4823-e7fc-d26db7ad28de" }, "source": [ "# Hyperparameter-tune the XGBoost baseline and keep the result under its own name:\n", "# TunedModel is reassigned by the later LR and CatBoost tuning cells, which would\n", "# otherwise discard this estimator before it is ever used.\n", "TunedXGB = tune_model(XGB)\n", "TunedModel = TunedXGB  # original name kept as an alias for existing references" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.89640.97390.93330.84210.88540.79140.7949
10.91070.96620.90000.89260.89630.81790.8179
20.92140.97860.94170.88280.91130.84090.8423
30.89250.96830.93280.83460.88100.78350.7875
40.88890.94870.90760.84380.87450.77510.7767
50.91040.97150.94120.86150.89960.81900.8216
60.89610.96360.92440.84620.88350.79000.7925
70.88890.96730.91600.83850.87550.77550.7780
80.89250.97090.92440.83970.88000.78300.7860
90.91760.98770.98320.84780.91050.83490.8427
Mean0.90150.96970.93040.85290.88980.80110.8040
SD0.01160.00960.02180.01880.01300.02350.0239
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8964 0.9739 0.9333 0.8421 0.8854 0.7914 0.7949\n", "1 0.9107 0.9662 0.9000 0.8926 0.8963 0.8179 0.8179\n", "2 0.9214 0.9786 0.9417 0.8828 0.9113 0.8409 0.8423\n", "3 0.8925 0.9683 0.9328 0.8346 0.8810 0.7835 0.7875\n", "4 0.8889 0.9487 0.9076 0.8438 0.8745 0.7751 0.7767\n", "5 0.9104 0.9715 0.9412 0.8615 0.8996 0.8190 0.8216\n", "6 0.8961 0.9636 0.9244 0.8462 0.8835 0.7900 0.7925\n", "7 0.8889 0.9673 0.9160 0.8385 0.8755 0.7755 0.7780\n", "8 0.8925 0.9709 0.9244 0.8397 0.8800 0.7830 0.7860\n", "9 0.9176 0.9877 0.9832 0.8478 0.9105 0.8349 0.8427\n", "Mean 0.9015 0.9697 0.9304 0.8529 0.8898 0.8011 0.8040\n", "SD 0.0116 0.0096 0.0218 0.0188 0.0130 0.0235 0.0239" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "t8eCmI1YjgpM", "colab": { "base_uri": "https://localhost:8080/", "height": 1000, "referenced_widgets": [ "5238ac85157f48ebbef40b4332450a4d", "3e4c48f925694b4992df24d3db4cd08d", "90305a6b029b4002915d714b18d2dc6a", "36efa56b78d848e18fc9d8ff5248025b", "cbb0a03436964633b5fb8378022b6af0", "389e9955fa29468eb796fe3c1421b4cb", "3e279ee794e54f74b1af69f76a966a31", "da0fead6fe0547549f7d21c109295c78", "1d64432c0de54747a4373d2055e990ea", "20959362abf54f809bbc9279cfeda188" ] }, "outputId": "ae49d4f2-9afc-431b-d42f-8347d44d4274" }, "source": [ "# Interactive plot-type browser for the baseline (untuned) XGBoost model.\n", "evaluate_model(estimator=XGB)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "5238ac85157f48ebbef40b4332450a4d", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "b7ZesJMGkzcC", "colab": { "base_uri": "https://localhost:8080/", "height": 401 }, "outputId": "7753c792-a33c-48da-e1db-a81c516ff428" }, "source": [ "# Static confusion matrix for the same baseline XGBoost model.\n", "plot_model(XGB, plot='confusion_matrix')" 
], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "OSKkKyufo1NC", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "738bda43761e444481ea74b6c2da8022", "fe521331d9a64ddb94d82c0b68616d84", "63bc1fbd946143a28334f9a2237178fd" ] }, "outputId": "cc5e2393-17db-4207-caf5-34d075d7f941" }, "source": [ "# Baseline logistic regression; the per-fold cross-validation scores are displayed below.\n", "LR = create_model('lr')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.86790.93170.82500.86090.84260.72880.7293
10.86790.92380.83330.85470.84390.72940.7295
20.86070.94890.85000.82930.83950.71650.7167
30.86740.92230.86550.83060.84770.73040.7308
40.82440.89910.78990.79660.79320.64060.6406
50.87460.91990.84030.86210.85110.74270.7429
60.85300.94310.84030.81970.82990.70060.7007
70.86020.93670.87390.81250.84210.71700.7185
80.81000.90150.78990.77050.78010.61290.6131
90.86020.92540.87390.81250.84210.71700.7185
Mean0.85460.92520.83820.82490.83120.70360.7041
SD0.01980.01530.02880.02780.02310.04030.0405
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8679 0.9317 0.8250 0.8609 0.8426 0.7288 0.7293\n", "1 0.8679 0.9238 0.8333 0.8547 0.8439 0.7294 0.7295\n", "2 0.8607 0.9489 0.8500 0.8293 0.8395 0.7165 0.7167\n", "3 0.8674 0.9223 0.8655 0.8306 0.8477 0.7304 0.7308\n", "4 0.8244 0.8991 0.7899 0.7966 0.7932 0.6406 0.6406\n", "5 0.8746 0.9199 0.8403 0.8621 0.8511 0.7427 0.7429\n", "6 0.8530 0.9431 0.8403 0.8197 0.8299 0.7006 0.7007\n", "7 0.8602 0.9367 0.8739 0.8125 0.8421 0.7170 0.7185\n", "8 0.8100 0.9015 0.7899 0.7705 0.7801 0.6129 0.6131\n", "9 0.8602 0.9254 0.8739 0.8125 0.8421 0.7170 0.7185\n", "Mean 0.8546 0.9252 0.8382 0.8249 0.8312 0.7036 0.7041\n", "SD 0.0198 0.0153 0.0288 0.0278 0.0231 0.0403 0.0405" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "yABfbsENo3RS", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "2ed584d9e8da4f5da346b1e8d581efc2", "f46001a0e4914f3db48a84f7987d6b5b", "33bad682059a4e12839d36d0913169a9" ] }, "outputId": "9d7fa2fe-8b0e-4f92-e7ce-ec022eafdbf3" }, "source": [ "# Hyperparameter-tune the logistic regression baseline and keep the result under its\n", "# own name: TunedModel is reassigned by the later CatBoost tuning cell, which would\n", "# otherwise discard this estimator before it is ever used.\n", "TunedLR = tune_model(LR)\n", "TunedModel = TunedLR  # original name kept as an alias for existing references" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.86790.93170.82500.86090.84260.72880.7293
10.86430.92430.82500.85340.83900.72180.7221
20.86790.94970.85830.83740.84770.73100.7312
30.86740.92200.86550.83060.84770.73040.7308
40.82440.89900.78990.79660.79320.64060.6406
50.87460.92220.84030.86210.85110.74270.7429
60.85300.94320.84030.81970.82990.70060.7007
70.86020.93670.87390.81250.84210.71700.7185
80.81360.90180.79830.77240.78510.62060.6209
90.86380.92230.87390.81890.84550.72400.7252
Mean0.85570.92530.83910.82640.83240.70570.7062
SD0.01930.01540.02830.02730.02240.03920.0393
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.8679 0.9317 0.8250 0.8609 0.8426 0.7288 0.7293\n", "1 0.8643 0.9243 0.8250 0.8534 0.8390 0.7218 0.7221\n", "2 0.8679 0.9497 0.8583 0.8374 0.8477 0.7310 0.7312\n", "3 0.8674 0.9220 0.8655 0.8306 0.8477 0.7304 0.7308\n", "4 0.8244 0.8990 0.7899 0.7966 0.7932 0.6406 0.6406\n", "5 0.8746 0.9222 0.8403 0.8621 0.8511 0.7427 0.7429\n", "6 0.8530 0.9432 0.8403 0.8197 0.8299 0.7006 0.7007\n", "7 0.8602 0.9367 0.8739 0.8125 0.8421 0.7170 0.7185\n", "8 0.8136 0.9018 0.7983 0.7724 0.7851 0.6206 0.6209\n", "9 0.8638 0.9223 0.8739 0.8189 0.8455 0.7240 0.7252\n", "Mean 0.8557 0.9253 0.8391 0.8264 0.8324 0.7057 0.7062\n", "SD 0.0193 0.0154 0.0283 0.0273 0.0224 0.0392 0.0393" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "Ufq9DQtqo4P5", "colab": { "base_uri": "https://localhost:8080/", "height": 634, "referenced_widgets": [ "77c8ccd8bd8f425cb99be8e58ee3d931", "72ee822a95ed4232bdc1c1ce909333ee", "dde01c732630412ba04e143c691fef50", "802bef155bd8481cbdfe9220094b971e", "940b0b4b95b547e8847918ae1d4c1ee6", "fdbb8e58e39a4ee3a4b53252a2a17dd6", "cb21cc1e1e9a415da8bca9e7ddd1afd4" ] }, "outputId": "c6a0345a-ada7-4203-a6f3-f7bf0aa483d2" }, "source": [ "# Interactive plot-type browser for the baseline (untuned) logistic regression model.\n", "evaluate_model(estimator=LR)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "77c8ccd8bd8f425cb99be8e58ee3d931", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "7zjKIvxjo7e6", "colab": { "base_uri": "https://localhost:8080/", "height": 401 }, "outputId": "8930f5da-a1c4-42f0-e937-d36c41a45258" }, "source": [ "# Static confusion matrix for the same baseline logistic regression model.\n", "plot_model(LR, plot='confusion_matrix')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", 
"text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "wyWKtziNpCW8", "colab": { "base_uri": "https://localhost:8080/", "height": 421, "referenced_widgets": [ "fb4b36fcd06149798f6bd0ac5b92f623", "c28813b57f4149a290aa7fcdad2213cc", "370d6ac451114cbd9d38f3082e51cfbe" ] }, "outputId": "65f9929a-c44b-41a3-ebaa-f3469a535f98" }, "source": [ "catboost = create_model(estimator='catboost')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.90000.97130.87500.88980.88240.79540.7955
10.91430.96650.87500.92110.89740.82390.8247
20.93930.97940.93330.92560.92950.87620.8762
30.90680.96590.92440.86610.89430.81110.8125
40.88890.94690.89920.84920.87350.77460.7756
50.91040.97070.91600.87900.89710.81780.8184
60.88890.96830.89080.85480.87240.77410.7746
70.91760.96830.90760.90000.90380.83170.8317
80.92110.97230.94120.88190.91060.84020.8416
90.93550.98810.96640.89150.92740.86950.8718
Mean0.91230.96980.91290.88590.89880.82140.8223
SD0.01630.01000.02790.02410.01890.03320.0333
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.9000 0.9713 0.8750 0.8898 0.8824 0.7954 0.7955\n", "1 0.9143 0.9665 0.8750 0.9211 0.8974 0.8239 0.8247\n", "2 0.9393 0.9794 0.9333 0.9256 0.9295 0.8762 0.8762\n", "3 0.9068 0.9659 0.9244 0.8661 0.8943 0.8111 0.8125\n", "4 0.8889 0.9469 0.8992 0.8492 0.8735 0.7746 0.7756\n", "5 0.9104 0.9707 0.9160 0.8790 0.8971 0.8178 0.8184\n", "6 0.8889 0.9683 0.8908 0.8548 0.8724 0.7741 0.7746\n", "7 0.9176 0.9683 0.9076 0.9000 0.9038 0.8317 0.8317\n", "8 0.9211 0.9723 0.9412 0.8819 0.9106 0.8402 0.8416\n", "9 0.9355 0.9881 0.9664 0.8915 0.9274 0.8695 0.8718\n", "Mean 0.9123 0.9698 0.9129 0.8859 0.8988 0.8214 0.8223\n", "SD 0.0163 0.0100 0.0279 0.0241 0.0189 0.0332 0.0333" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "yvGrVHhMpEOK", "colab": { "base_uri": "https://localhost:8080/", "referenced_widgets": [ "666ea6b6c5e1477088874e17dc9c33b7", "7175066c42e54289a5038da594728ee0", "3d3e94b00fe743eb9499e640ae18a553" ] }, "outputId": "e63bbf68-559e-4d12-ef56-dfc05884c7e4" }, "source": [ "# Hyperparameter-tune the CatBoost baseline. From here on TunedModel refers to the\n", "# tuned CatBoost estimator (it replaces whatever TunedModel held before this cell).\n", "TunedModel = tune_model(estimator=catboost)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AccuracyAUCRecallPrec.F1KappaMCC
00.91430.97320.91670.88710.90160.82570.8261
10.91430.96980.89170.90680.89920.82460.8247
20.93930.97860.93330.92560.92950.87620.8762
30.91400.96960.92440.88000.90160.82530.8261
40.88170.95320.89080.84130.86530.76000.7610
50.92110.97450.91600.90080.90830.83920.8392
60.90320.96790.89920.87700.88800.80280.8030
70.90680.96930.90760.87800.89260.81030.8107
80.92110.97280.94120.88190.91060.84020.8416
90.94620.99050.97480.90620.93930.89120.8931
Mean0.91620.97190.91950.88850.90360.82950.8302
SD0.01720.00890.02430.02180.01970.03490.0350
\n", "
" ], "text/plain": [ " Accuracy AUC Recall Prec. F1 Kappa MCC\n", "0 0.9143 0.9732 0.9167 0.8871 0.9016 0.8257 0.8261\n", "1 0.9143 0.9698 0.8917 0.9068 0.8992 0.8246 0.8247\n", "2 0.9393 0.9786 0.9333 0.9256 0.9295 0.8762 0.8762\n", "3 0.9140 0.9696 0.9244 0.8800 0.9016 0.8253 0.8261\n", "4 0.8817 0.9532 0.8908 0.8413 0.8653 0.7600 0.7610\n", "5 0.9211 0.9745 0.9160 0.9008 0.9083 0.8392 0.8392\n", "6 0.9032 0.9679 0.8992 0.8770 0.8880 0.8028 0.8030\n", "7 0.9068 0.9693 0.9076 0.8780 0.8926 0.8103 0.8107\n", "8 0.9211 0.9728 0.9412 0.8819 0.9106 0.8402 0.8416\n", "9 0.9462 0.9905 0.9748 0.9062 0.9393 0.8912 0.8931\n", "Mean 0.9162 0.9719 0.9195 0.8885 0.9036 0.8295 0.8302\n", "SD 0.0172 0.0089 0.0243 0.0218 0.0197 0.0349 0.0350" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "_5346QYnpG3l", "colab": { "base_uri": "https://localhost:8080/", "height": 1000, "referenced_widgets": [ "f298fe3f4539460f892778917dca8e35", "3ae88fa2ea8642d88a4b44091352d1ae", "268e0463c4b44a1a9811775756d77c41", "d434264ed45c4de8af5e31ac2901b8c4", "497321ff3b6849b19b7ab938133316ad", "cc0fbcf2f77846f4bd1266103d07a1f7", "b995a9f6bf614675ac2153fc65daa3de" ] }, "outputId": "6d0aa99a-122a-4774-84f0-032d101b8171" }, "source": [ "evaluate_model(catboost)" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "f298fe3f4539460f892778917dca8e35", "version_minor": 0, "version_major": 2 }, "text/plain": [ "interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Hyperparameters', 'param…" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "ATpPxL1spLjy", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "742531e4-a803-4243-ca65-cf1b9025f991" }, "source": [ "plot_model(catboost, 'confusion_matrix')" ], "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "image/png": "\n", 
"text/plain": [ "
" ] }, "metadata": { "tags": [] } } ] }, { "cell_type": "markdown", "metadata": { "id": "X-7o23lc-bzA" }, "source": [ "# Conclusions" ] }, { "cell_type": "markdown", "metadata": { "id": "UQTuQkQJKomt" }, "source": [ "In our study we analyzed data from avalanches and measured weather variables for specific locations and dates to identify whether it was possible to predict an avalanche using the existing measured data.\n", "\n", "In this specific notebook the average of weather data from all locations was used in the analysis and prediction, so instead of focusing on particular data to understand avalanches in specific locations the study is more focused in a macro-weather environment that seems to be prone to avalanche incidence.\n", "\n", "By looking at the distributions of weather data from the days with and without avalanches we can see that Snow Water Equivalent is very important and this was confirmed when looking at feature importance in the final model. Also we were able to identify that the majority of avalanches happen in spring, probably because that is when snow is melting and mountains might be more unstable.\n", "\n", "The prediction model created is well capable to predict whether an avalanche might happen in one of the locations considering the overall weather data. However this model might not be good to predict the occurence of an avalanche in a specific location, as it uses that average of weather information. To get results for specific locations it would be recommended to collect weather data for as many locations as possible, and then cross those datasets to create the model." ] } ] }