diff --git a/scripts/Crop Prediction Model/Crop Prediction Model.ipynb b/scripts/Crop Prediction Model/Crop Prediction Model.ipynb new file mode 100644 index 0000000..5f3eb5e --- /dev/null +++ b/scripts/Crop Prediction Model/Crop Prediction Model.ipynb @@ -0,0 +1,7425 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [], + "collapsed_sections": [] + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + }, + "widgets": { + "application/vnd.jupyter.widget-state+json": { + "4d97448b0669441088bc1de94e9dc607": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_c91b2e4623f34177906f987bec76baf9", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 3, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 3, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_ac7d7c15b58e42feb475769f33a49f9d" + } + }, + "c91b2e4623f34177906f987bec76baf9": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "ac7d7c15b58e42feb475769f33a49f9d": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + 
"grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "4ec49eefe7b540309e3e519c7910f01b": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_5b2685d48b934e9cbbc7fab76fbe298c", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_29d19e3812564b86baa4871b47e78df9" + } + }, + "5b2685d48b934e9cbbc7fab76fbe298c": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": 
"ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "29d19e3812564b86baa4871b47e78df9": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "03a1c790ef41418291e4f80ba7828a47": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_da2198944b6045e2ac84185ccacbe869", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 3, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 3, + 
"_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_a025df127a9f49b482e5f95693de90c4" + } + }, + "da2198944b6045e2ac84185ccacbe869": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "a025df127a9f49b482e5f95693de90c4": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + 
"e803d5985cbf441ebb877da74cc47699": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_76bf50cb26144c4bbc0ebcb7fa71709e", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_c637685280d74a898eb266d991ccf636" + } + }, + "76bf50cb26144c4bbc0ebcb7fa71709e": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "c637685280d74a898eb266d991ccf636": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + 
"grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "5c642b3b0cf241b4b506c4aca79c361e": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_8cb9bb2280d34ab7949b4cb69f446ca4", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_2919f3677c134e74bf57badfe652fdfe" + } + }, + "8cb9bb2280d34ab7949b4cb69f446ca4": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "2919f3677c134e74bf57badfe652fdfe": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + 
"_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "f122f577289f4a93bfc6acd2bf23606b": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_70fa5ddb71044f61b83db783b5ab375e", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 3, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 3, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_08f8fdf2810e4c17855a725463b4f4a3" + } + }, + "70fa5ddb71044f61b83db783b5ab375e": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + 
"_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "08f8fdf2810e4c17855a725463b4f4a3": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "d299f7a26ebf45c188a3f24c9ba05974": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_6b18966bb05c4e418f177138db323181", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + 
"_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_fc462dcdd16d4084be2b9846ec39e172" + } + }, + "6b18966bb05c4e418f177138db323181": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "fc462dcdd16d4084be2b9846ec39e172": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "0c746ea40f204ab399fb8b1c9244da46": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + 
"state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_017e0f0f2fbe478f9a3b1045d92a72de", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 3, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 3, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_447d58fbe53745a79d8bfc43cba7a3e4" + } + }, + "017e0f0f2fbe478f9a3b1045d92a72de": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "447d58fbe53745a79d8bfc43cba7a3e4": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": 
null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "6569f12f7f1b43f6acd5eaeb1867205d": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_4af4d5e36f174f23b592040a83ea4392", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_80f1ef7f786640cfac147d9ec65a5ad8" + } + }, + "4af4d5e36f174f23b592040a83ea4392": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "80f1ef7f786640cfac147d9ec65a5ad8": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + 
"bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "db4e51edffaf466c8a1a412095446f57": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_51ccf98d9bb54a0cbf3df2fbd90c82b6", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 3, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 3, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_c8ae01a51cd44aca9c56fbae5d6a4a0c" + } + }, + "51ccf98d9bb54a0cbf3df2fbd90c82b6": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "c8ae01a51cd44aca9c56fbae5d6a4a0c": 
{ + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "c6af45d2d3244894ab43aa11587569fb": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_f569da0783864292890fb8bf352b1a0d", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_2b4cc526625e4736834375327176a117" + } + }, + "f569da0783864292890fb8bf352b1a0d": { + "model_module": 
"@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "2b4cc526625e4736834375327176a117": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "e353c2e9634a41cc9754b120750c37b2": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_396885cfdccc48bb8f1cfd0223c97aa5", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": 
"IntProgressModel", + "bar_style": "", + "max": 5, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 5, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_0568e477bbb745e68f7bd06a18056d9e" + } + }, + "396885cfdccc48bb8f1cfd0223c97aa5": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "0568e477bbb745e68f7bd06a18056d9e": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + 
"object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "0c7a96b7437d4f439ee58a7348112c07": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_3957ae44c0b64b01b4420040a5a107da", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 4, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 4, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_dac75abfd15a434bb8a399900709f4c6" + } + }, + "3957ae44c0b64b01b4420040a5a107da": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "dac75abfd15a434bb8a399900709f4c6": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": 
null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "d5fa15c649734224a62b0416f1589e4c": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_bd048ed3009f474a99c795838ae4e809", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 5, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 5, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_3adfd8382a004ba493cf96f2228d28ed" + } + }, + "bd048ed3009f474a99c795838ae4e809": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "3adfd8382a004ba493cf96f2228d28ed": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + 
"grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "ca525e1c57d541299c9b4862c1fea11d": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_1dcfa769f8254370a963327b6f74b159", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 4, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 4, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_723e82f233be473789f249ecf0703ee2" + } + }, + "1dcfa769f8254370a963327b6f74b159": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": 
"ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "723e82f233be473789f249ecf0703ee2": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "e31ab003321c43b49caec0a8a7dde1cd": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_4647c3143e1340ff84efd9f4b3851a2a", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 5, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 5, + 
"_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_db6f2f19b0e043cc8a0f71a3f9b49095" + } + }, + "4647c3143e1340ff84efd9f4b3851a2a": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "db6f2f19b0e043cc8a0f71a3f9b49095": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + 
"a5c08029facf463a9683e5f23797fbcc": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_8257770e8802452db5e40e16c40c80da", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 5, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 5, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_b4c98f4b9fc646ebbf1e1c0d0ee9d3fc" + } + }, + "8257770e8802452db5e40e16c40c80da": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "b4c98f4b9fc646ebbf1e1c0d0ee9d3fc": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + 
"grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "db14ff1586104c1bb34e607996c13318": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_50d16bc916de4be295898de3aca4a08d", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 5, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 5, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_315962e470d04c78a2afc0a866afc592" + } + }, + "50d16bc916de4be295898de3aca4a08d": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "315962e470d04c78a2afc0a866afc592": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + 
"_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "2ac9fd07fa8e412abe829854d8b5ab09": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_7d21d3653fbc4502960a11960c92f416", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 3, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 3, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_27006ecb01ed4cc18f7ac2561ad883ab" + } + }, + "7d21d3653fbc4502960a11960c92f416": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + 
"_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "27006ecb01ed4cc18f7ac2561ad883ab": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "d86784e47b8c4c629b8c41625515777a": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_7d56b83610594b35b1bcd8151c08be13", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + 
"_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_fa1016a6026348ad99cd29901cd0dab1" + } + }, + "7d56b83610594b35b1bcd8151c08be13": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "fa1016a6026348ad99cd29901cd0dab1": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "424154f0a3a147ef8168c882e2fa0828": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + 
"state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_82499bfe63f44bc0aae73f91bc6fb978", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 3, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 3, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_19e9ca6460034820b935b5e9ca8b26ac" + } + }, + "82499bfe63f44bc0aae73f91bc6fb978": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "19e9ca6460034820b935b5e9ca8b26ac": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": 
null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "a18cf2c481544c7da684a9fb97dbbe1b": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_4bdb923ebb8346e094c63efc2803c68a", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_fd7caca5c81a40ec83f6a8d941eac0d0" + } + }, + "4bdb923ebb8346e094c63efc2803c68a": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "fd7caca5c81a40ec83f6a8d941eac0d0": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + 
"bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "3326cab329d342979aca08e4ce37d5cb": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_62f0feb68ba4429ca76a68e9b6bac62d", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 3, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 3, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_942f83712fd84bc2b2020e89df1a44ce" + } + }, + "62f0feb68ba4429ca76a68e9b6bac62d": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "942f83712fd84bc2b2020e89df1a44ce": 
{ + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + }, + "3c7626fe583a4cfc9b958fb4ddd2e15c": { + "model_module": "@jupyter-widgets/controls", + "model_name": "IntProgressModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "ProgressView", + "style": "IPY_MODEL_9a97b2b50ca949bf96f9a52599a2333c", + "_dom_classes": [], + "description": "Processing: ", + "_model_name": "IntProgressModel", + "bar_style": "", + "max": 74, + "_view_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "value": 74, + "_view_count": null, + "_view_module_version": "1.5.0", + "orientation": "horizontal", + "min": 0, + "description_tooltip": null, + "_model_module": "@jupyter-widgets/controls", + "layout": "IPY_MODEL_524f9ac1f5b4436ca47a6e9be1686d04" + } + }, + "9a97b2b50ca949bf96f9a52599a2333c": { + "model_module": 
"@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_view_name": "StyleView", + "_model_name": "ProgressStyleModel", + "description_width": "", + "_view_module": "@jupyter-widgets/base", + "_model_module_version": "1.5.0", + "_view_count": null, + "_view_module_version": "1.2.0", + "bar_color": null, + "_model_module": "@jupyter-widgets/controls" + } + }, + "524f9ac1f5b4436ca47a6e9be1686d04": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_view_name": "LayoutView", + "grid_template_rows": null, + "right": null, + "justify_content": null, + "_view_module": "@jupyter-widgets/base", + "overflow": null, + "_model_module_version": "1.2.0", + "_view_count": null, + "flex_flow": null, + "width": null, + "min_width": null, + "border": null, + "align_items": null, + "bottom": null, + "_model_module": "@jupyter-widgets/base", + "top": null, + "grid_column": null, + "overflow_y": null, + "overflow_x": null, + "grid_auto_flow": null, + "grid_area": null, + "grid_template_columns": null, + "flex": null, + "_model_name": "LayoutModel", + "justify_items": null, + "grid_row": null, + "max_height": null, + "align_content": null, + "visibility": null, + "align_self": null, + "height": null, + "min_height": null, + "padding": null, + "grid_auto_rows": null, + "grid_gap": null, + "max_width": null, + "order": null, + "_view_module_version": "1.2.0", + "grid_template_areas": null, + "object_position": null, + "object_fit": null, + "grid_auto_columns": null, + "margin": null, + "display": null, + "left": null + } + } + } + } + }, + "cells": [ + { + "cell_type": "code", + "metadata": { + "id": "5CIgMSa8keZc", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 223 + }, + "outputId": "b336f85a-37ed-4514-bc6c-266536f5587e" + }, + "source": [ + "import pandas as pd\n", + "\n", + "cropDataSet = 
pd.read_csv('/content/Crop_recommendation.csv')\n", + "print(type(cropDataSet))\n", + "\n", + "cropDataSet.head()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\n" + ] + }, + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NPKtemperaturehumidityphrainfalllabel
090424320.87974482.0027446.502985202.935536rice
185584121.77046280.3196447.038096226.655537rice
260554423.00445982.3207637.840207263.964248rice
374354026.49109680.1583636.980401242.864034rice
478424220.13017581.6048737.628473262.717340rice
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " N P K temperature humidity ph rainfall label\n", + "0 90 42 43 20.879744 82.002744 6.502985 202.935536 rice\n", + "1 85 58 41 21.770462 80.319644 7.038096 226.655537 rice\n", + "2 60 55 44 23.004459 82.320763 7.840207 263.964248 rice\n", + "3 74 35 40 26.491096 80.158363 6.980401 242.864034 rice\n", + "4 78 42 42 20.130175 81.604873 7.628473 262.717340 rice" + ] + }, + "metadata": {}, + "execution_count": 1 + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "A30y-VtNim1h" + }, + "source": [ + "#### **(a) Install Pycaret**" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "cF_mSA9Xim1j", + "outputId": "94c66439-5011-4310-b903-22408449754b" + }, + "source": [ + "!pip install pycaret &> /dev/null\n", + "print (\"Pycaret installed sucessfully!!\")" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Pycaret installed sucessfully!!\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "B2r61OBMs1N6" + }, + "source": [ + "---\n", + "### **1.7 Three line of code for model comparison for \"Crop\" dataset**\n", + "---" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "2ac9fd07fa8e412abe829854d8b5ab09", + "7d21d3653fbc4502960a11960c92f416", + "27006ecb01ed4cc18f7ac2561ad883ab", + "d86784e47b8c4c629b8c41625515777a", + "7d56b83610594b35b1bcd8151c08be13", + "fa1016a6026348ad99cd29901cd0dab1" + ] + }, + "id": "OIoRFpzis1N8", + "outputId": "ffba049c-8ee7-4340-d915-89e807b564c4" + }, + "source": [ + "from pycaret.datasets import get_data\n", + "from pycaret.classification import *\n", + "\n", + "s = setup(data = cropDataSet, target='label', silent=True)\n", + "cm = compare_models()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + 
"text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
rfRandom Forest Classifier0.99551.00000.99550.99630.99540.99520.99530.611
nbNaive Bayes0.99481.00000.99490.99540.99480.99460.99460.034
etExtra Trees Classifier0.99481.00000.99480.99570.99480.99460.99460.534
qdaQuadratic Discriminant Analysis0.99221.00000.99220.99300.99220.99180.99190.035
lightgbmLight Gradient Boosting Machine0.98830.99990.98820.99020.98830.98770.98781.010
gbcGradient Boosting Classifier0.98700.99990.98720.98920.98690.98640.98656.781
dtDecision Tree Classifier0.98250.99080.98230.98540.98240.98160.98180.034
knnK Neighbors Classifier0.97860.99770.97910.98200.97860.97750.97770.137
lrLogistic Regression0.96950.99960.96990.97280.96900.96800.96822.375
ldaLinear Discriminant Analysis0.96560.99970.96600.97290.96520.96390.96430.032
ridgeRidge Classifier0.71870.00000.71020.68620.65610.70500.71210.018
svmSVM - Linear Kernel0.71410.00000.71210.77190.69720.70040.72010.095
adaAda Boost Classifier0.18260.68500.18180.10070.11650.14270.23380.226
dummyDummy Classifier0.04680.50000.04550.00220.00420.00000.00000.026
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "rf Random Forest Classifier 0.9955 1.0000 0.9955 0.9963 \n", + "nb Naive Bayes 0.9948 1.0000 0.9949 0.9954 \n", + "et Extra Trees Classifier 0.9948 1.0000 0.9948 0.9957 \n", + "qda Quadratic Discriminant Analysis 0.9922 1.0000 0.9922 0.9930 \n", + "lightgbm Light Gradient Boosting Machine 0.9883 0.9999 0.9882 0.9902 \n", + "gbc Gradient Boosting Classifier 0.9870 0.9999 0.9872 0.9892 \n", + "dt Decision Tree Classifier 0.9825 0.9908 0.9823 0.9854 \n", + "knn K Neighbors Classifier 0.9786 0.9977 0.9791 0.9820 \n", + "lr Logistic Regression 0.9695 0.9996 0.9699 0.9728 \n", + "lda Linear Discriminant Analysis 0.9656 0.9997 0.9660 0.9729 \n", + "ridge Ridge Classifier 0.7187 0.0000 0.7102 0.6862 \n", + "svm SVM - Linear Kernel 0.7141 0.0000 0.7121 0.7719 \n", + "ada Ada Boost Classifier 0.1826 0.6850 0.1818 0.1007 \n", + "dummy Dummy Classifier 0.0468 0.5000 0.0455 0.0022 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "rf 0.9954 0.9952 0.9953 0.611 \n", + "nb 0.9948 0.9946 0.9946 0.034 \n", + "et 0.9948 0.9946 0.9946 0.534 \n", + "qda 0.9922 0.9918 0.9919 0.035 \n", + "lightgbm 0.9883 0.9877 0.9878 1.010 \n", + "gbc 0.9869 0.9864 0.9865 6.781 \n", + "dt 0.9824 0.9816 0.9818 0.034 \n", + "knn 0.9786 0.9775 0.9777 0.137 \n", + "lr 0.9690 0.9680 0.9682 2.375 \n", + "lda 0.9652 0.9639 0.9643 0.032 \n", + "ridge 0.6561 0.7050 0.7121 0.018 \n", + "svm 0.6972 0.7004 0.7201 0.095 \n", + "ada 0.1165 0.1427 0.2338 0.226 \n", + "dummy 0.0042 0.0000 0.0000 0.026 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "CCVV6JlQim2A" + }, + "source": [ + "#### **2.1 Model Performance using data \"Normalization\"**" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "424154f0a3a147ef8168c882e2fa0828", + "82499bfe63f44bc0aae73f91bc6fb978", + 
"19e9ca6460034820b935b5e9ca8b26ac", + "a18cf2c481544c7da684a9fb97dbbe1b", + "4bdb923ebb8346e094c63efc2803c68a", + "fd7caca5c81a40ec83f6a8d941eac0d0" + ] + }, + "id": "Atd6jNvmim2A", + "outputId": "fe97434f-f13c-4820-bea7-f10a6f56be21" + }, + "source": [ + "## Commonly used techniques: clipping, log scaling, z-score, minmax, maxabs, robust\n", + "s = setup(data=cropDataSet, target='label', normalize = True, normalize_method = 'zscore', silent=True)\n", + "cm = compare_models()\n" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
nbNaive Bayes0.99350.99990.99320.99480.99330.99320.99330.035
etExtra Trees Classifier0.99350.99990.99320.99480.99330.99320.99330.534
qdaQuadratic Discriminant Analysis0.99280.99990.99230.99430.99260.99250.99260.035
rfRandom Forest Classifier0.99221.00000.99170.99390.99190.99180.99190.631
lightgbmLight Gradient Boosting Machine0.99221.00000.99200.99340.99220.99180.99191.050
dtDecision Tree Classifier0.98640.99290.98600.98810.98610.98570.98580.034
gbcGradient Boosting Classifier0.98570.99990.98530.98810.98530.98500.98526.821
knnK Neighbors Classifier0.97210.99780.97220.97700.97170.97070.97100.137
ldaLinear Discriminant Analysis0.96690.99970.96690.97440.96640.96530.96570.033
lrLogistic Regression0.96560.99950.96520.96960.96510.96390.96420.226
svmSVM - Linear Kernel0.89730.00000.89790.93730.90400.89240.89530.070
ridgeRidge Classifier0.73100.00000.72980.70510.67730.71810.72450.017
adaAda Boost Classifier0.18320.68840.17730.09390.11080.13980.22640.226
dummyDummy Classifier0.05200.50000.04550.00270.00510.00000.00000.029
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "nb Naive Bayes 0.9935 0.9999 0.9932 0.9948 \n", + "et Extra Trees Classifier 0.9935 0.9999 0.9932 0.9948 \n", + "qda Quadratic Discriminant Analysis 0.9928 0.9999 0.9923 0.9943 \n", + "rf Random Forest Classifier 0.9922 1.0000 0.9917 0.9939 \n", + "lightgbm Light Gradient Boosting Machine 0.9922 1.0000 0.9920 0.9934 \n", + "dt Decision Tree Classifier 0.9864 0.9929 0.9860 0.9881 \n", + "gbc Gradient Boosting Classifier 0.9857 0.9999 0.9853 0.9881 \n", + "knn K Neighbors Classifier 0.9721 0.9978 0.9722 0.9770 \n", + "lda Linear Discriminant Analysis 0.9669 0.9997 0.9669 0.9744 \n", + "lr Logistic Regression 0.9656 0.9995 0.9652 0.9696 \n", + "svm SVM - Linear Kernel 0.8973 0.0000 0.8979 0.9373 \n", + "ridge Ridge Classifier 0.7310 0.0000 0.7298 0.7051 \n", + "ada Ada Boost Classifier 0.1832 0.6884 0.1773 0.0939 \n", + "dummy Dummy Classifier 0.0520 0.5000 0.0455 0.0027 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "nb 0.9933 0.9932 0.9933 0.035 \n", + "et 0.9933 0.9932 0.9933 0.534 \n", + "qda 0.9926 0.9925 0.9926 0.035 \n", + "rf 0.9919 0.9918 0.9919 0.631 \n", + "lightgbm 0.9922 0.9918 0.9919 1.050 \n", + "dt 0.9861 0.9857 0.9858 0.034 \n", + "gbc 0.9853 0.9850 0.9852 6.821 \n", + "knn 0.9717 0.9707 0.9710 0.137 \n", + "lda 0.9664 0.9653 0.9657 0.033 \n", + "lr 0.9651 0.9639 0.9642 0.226 \n", + "svm 0.9040 0.8924 0.8953 0.070 \n", + "ridge 0.6773 0.7181 0.7245 0.017 \n", + "ada 0.1108 0.1398 0.2264 0.226 \n", + "dummy 0.0051 0.0000 0.0000 0.029 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "WtiL4kV2uPHr" + }, + "source": [ + "**minmax : scales and translates each feature individually such that it is in the range of 0 – 1.**" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "3326cab329d342979aca08e4ce37d5cb", + 
"62f0feb68ba4429ca76a68e9b6bac62d", + "942f83712fd84bc2b2020e89df1a44ce", + "3c7626fe583a4cfc9b958fb4ddd2e15c", + "9a97b2b50ca949bf96f9a52599a2333c", + "524f9ac1f5b4436ca47a6e9be1686d04" + ] + }, + "id": "2a9HLuShuLZK", + "outputId": "8bb323b6-1efe-4b2d-f193-2802691fba02" + }, + "source": [ + "## Commonly used techniques: clipping, log scaling, z-score, minmax, maxabs, robust\n", + "s = setup(data=cropDataSet, target='label', normalize = True, normalize_method = 'minmax', silent=True)\n", + "cm = compare_models()\n" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
rfRandom Forest Classifier0.99611.00000.99620.99660.99610.99590.99590.626
nbNaive Bayes0.99351.00000.99350.99480.99340.99320.99330.037
qdaQuadratic Discriminant Analysis0.99221.00000.99210.99310.99220.99180.99190.034
etExtra Trees Classifier0.99161.00000.99130.99270.99140.99110.99120.524
lightgbmLight Gradient Boosting Machine0.98640.99990.98610.98830.98610.98570.98580.977
dtDecision Tree Classifier0.98510.99220.98510.98630.98490.98430.98440.036
gbcGradient Boosting Classifier0.98440.99990.98450.98620.98420.98370.98386.813
knnK Neighbors Classifier0.97860.99850.97860.98170.97820.97750.97770.131
ldaLinear Discriminant Analysis0.96620.99970.96640.97240.96560.96460.96500.033
lrLogistic Regression0.92400.99690.92140.94110.91770.92030.92150.186
svmSVM - Linear Kernel0.90120.00000.89870.92610.90020.89650.89810.067
ridgeRidge Classifier0.68090.00000.67390.64180.61220.66540.67280.019
adaAda Boost Classifier0.18190.68720.17270.09260.10940.13810.22390.234
dummyDummy Classifier0.05200.50000.04550.00270.00510.00000.00000.024
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "rf Random Forest Classifier 0.9961 1.0000 0.9962 0.9966 \n", + "nb Naive Bayes 0.9935 1.0000 0.9935 0.9948 \n", + "qda Quadratic Discriminant Analysis 0.9922 1.0000 0.9921 0.9931 \n", + "et Extra Trees Classifier 0.9916 1.0000 0.9913 0.9927 \n", + "lightgbm Light Gradient Boosting Machine 0.9864 0.9999 0.9861 0.9883 \n", + "dt Decision Tree Classifier 0.9851 0.9922 0.9851 0.9863 \n", + "gbc Gradient Boosting Classifier 0.9844 0.9999 0.9845 0.9862 \n", + "knn K Neighbors Classifier 0.9786 0.9985 0.9786 0.9817 \n", + "lda Linear Discriminant Analysis 0.9662 0.9997 0.9664 0.9724 \n", + "lr Logistic Regression 0.9240 0.9969 0.9214 0.9411 \n", + "svm SVM - Linear Kernel 0.9012 0.0000 0.8987 0.9261 \n", + "ridge Ridge Classifier 0.6809 0.0000 0.6739 0.6418 \n", + "ada Ada Boost Classifier 0.1819 0.6872 0.1727 0.0926 \n", + "dummy Dummy Classifier 0.0520 0.5000 0.0455 0.0027 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "rf 0.9961 0.9959 0.9959 0.626 \n", + "nb 0.9934 0.9932 0.9933 0.037 \n", + "qda 0.9922 0.9918 0.9919 0.034 \n", + "et 0.9914 0.9911 0.9912 0.524 \n", + "lightgbm 0.9861 0.9857 0.9858 0.977 \n", + "dt 0.9849 0.9843 0.9844 0.036 \n", + "gbc 0.9842 0.9837 0.9838 6.813 \n", + "knn 0.9782 0.9775 0.9777 0.131 \n", + "lda 0.9656 0.9646 0.9650 0.033 \n", + "lr 0.9177 0.9203 0.9215 0.186 \n", + "svm 0.9002 0.8965 0.8981 0.067 \n", + "ridge 0.6122 0.6654 0.6728 0.019 \n", + "ada 0.1094 0.1381 0.2239 0.234 \n", + "dummy 0.0051 0.0000 0.0000 0.024 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "ms4-H0buufKC" + }, + "source": [ + "**robust : scales and translates each feature according to the Interquartile range. 
When the dataset contains outliers, robust scaler often gives better results.**" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "5c642b3b0cf241b4b506c4aca79c361e", + "8cb9bb2280d34ab7949b4cb69f446ca4", + "2919f3677c134e74bf57badfe652fdfe" + ] + }, + "id": "SjtgooljudSZ", + "outputId": "0667f94f-00a6-45a8-b6fa-8d98adc6adc5" + }, + "source": [ + "## Commonly used techniques: clipping, log scaling, z-score, minmax, maxabs, robust\n", + "s = setup(data=cropDataSet, target='label', normalize = True, normalize_method = 'robust', silent=True)\n", + "cm = compare_models()\n" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
rfRandom Forest Classifier0.99481.00000.99520.99550.99480.99460.99460.627
lightgbmLight Gradient Boosting Machine0.99421.00000.99410.99490.99410.99390.99391.084
nbNaive Bayes0.99350.99990.99390.99430.99350.99320.99320.034
etExtra Trees Classifier0.99350.99990.99370.99430.99350.99320.99320.516
qdaQuadratic Discriminant Analysis0.98960.99990.98990.99080.98960.98910.98920.031
gbcGradient Boosting Classifier0.98770.99990.98780.98930.98750.98710.98727.245
dtDecision Tree Classifier0.98310.99110.98340.98460.98300.98230.98240.032
knnK Neighbors Classifier0.97660.99780.97760.98030.97620.97550.97570.128
lrLogistic Regression0.96620.99950.96680.96980.96600.96460.96480.257
ldaLinear Discriminant Analysis0.96360.99960.96470.96980.96300.96190.96230.031
svmSVM - Linear Kernel0.91610.00000.91440.94230.91980.91210.91390.069
ridgeRidge Classifier0.66410.00000.64950.62230.58900.64750.65580.018
adaAda Boost Classifier0.21050.70230.20000.12670.14240.16900.26410.241
dummyDummy Classifier0.04940.50000.04550.00240.00470.00000.00000.023
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "rf Random Forest Classifier 0.9948 1.0000 0.9952 0.9955 \n", + "lightgbm Light Gradient Boosting Machine 0.9942 1.0000 0.9941 0.9949 \n", + "nb Naive Bayes 0.9935 0.9999 0.9939 0.9943 \n", + "et Extra Trees Classifier 0.9935 0.9999 0.9937 0.9943 \n", + "qda Quadratic Discriminant Analysis 0.9896 0.9999 0.9899 0.9908 \n", + "gbc Gradient Boosting Classifier 0.9877 0.9999 0.9878 0.9893 \n", + "dt Decision Tree Classifier 0.9831 0.9911 0.9834 0.9846 \n", + "knn K Neighbors Classifier 0.9766 0.9978 0.9776 0.9803 \n", + "lr Logistic Regression 0.9662 0.9995 0.9668 0.9698 \n", + "lda Linear Discriminant Analysis 0.9636 0.9996 0.9647 0.9698 \n", + "svm SVM - Linear Kernel 0.9161 0.0000 0.9144 0.9423 \n", + "ridge Ridge Classifier 0.6641 0.0000 0.6495 0.6223 \n", + "ada Ada Boost Classifier 0.2105 0.7023 0.2000 0.1267 \n", + "dummy Dummy Classifier 0.0494 0.5000 0.0455 0.0024 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "rf 0.9948 0.9946 0.9946 0.627 \n", + "lightgbm 0.9941 0.9939 0.9939 1.084 \n", + "nb 0.9935 0.9932 0.9932 0.034 \n", + "et 0.9935 0.9932 0.9932 0.516 \n", + "qda 0.9896 0.9891 0.9892 0.031 \n", + "gbc 0.9875 0.9871 0.9872 7.245 \n", + "dt 0.9830 0.9823 0.9824 0.032 \n", + "knn 0.9762 0.9755 0.9757 0.128 \n", + "lr 0.9660 0.9646 0.9648 0.257 \n", + "lda 0.9630 0.9619 0.9623 0.031 \n", + "svm 0.9198 0.9121 0.9139 0.069 \n", + "ridge 0.5890 0.6475 0.6558 0.018 \n", + "ada 0.1424 0.1690 0.2641 0.241 \n", + "dummy 0.0047 0.0000 0.0000 0.023 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "oWMPU3KMim2B" + }, + "source": [ + "---\n", + "### **2.2 Model Performance using \"Feature Selection\"**\n", + "---" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "f122f577289f4a93bfc6acd2bf23606b", + "70fa5ddb71044f61b83db783b5ab375e", + 
"08f8fdf2810e4c17855a725463b4f4a3", + "d299f7a26ebf45c188a3f24c9ba05974", + "6b18966bb05c4e418f177138db323181", + "fc462dcdd16d4084be2b9846ec39e172" + ] + }, + "id": "43l42fj_im2C", + "outputId": "5bb360be-901a-47b9-ea1d-f55966728b11" + }, + "source": [ + "s = setup(data=cropDataSet, target='label', feature_selection = True, feature_selection_threshold = 0.6, silent=True)\n", + "cm = compare_models()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
rfRandom Forest Classifier0.98960.99990.98960.99110.98950.98910.98920.631
nbNaive Bayes0.98830.99990.98790.99010.98790.98770.98790.030
etExtra Trees Classifier0.98770.99990.98750.98930.98750.98710.98720.510
qdaQuadratic Discriminant Analysis0.98510.99980.98470.98680.98480.98430.98440.030
lightgbmLight Gradient Boosting Machine0.98380.99970.98400.98590.98380.98300.98310.912
dtDecision Tree Classifier0.97920.98910.97940.98130.97900.97820.97830.031
gbcGradient Boosting Classifier0.97860.99980.97810.98260.97880.97750.97776.166
knnK Neighbors Classifier0.96690.99690.96610.97040.96640.96530.96550.125
lrLogistic Regression0.94480.99850.94370.95050.94460.94210.94242.338
ldaLinear Discriminant Analysis0.94480.99930.94440.95170.94320.94210.94260.032
svmSVM - Linear Kernel0.56730.00000.56710.59950.52950.54690.57430.120
ridgeRidge Classifier0.53480.00000.51790.48230.45440.51170.52360.017
adaAda Boost Classifier0.17670.67500.16820.09130.10700.13260.22230.219
dummyDummy Classifier0.05200.50000.04550.00270.00510.00000.00000.024
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "rf Random Forest Classifier 0.9896 0.9999 0.9896 0.9911 \n", + "nb Naive Bayes 0.9883 0.9999 0.9879 0.9901 \n", + "et Extra Trees Classifier 0.9877 0.9999 0.9875 0.9893 \n", + "qda Quadratic Discriminant Analysis 0.9851 0.9998 0.9847 0.9868 \n", + "lightgbm Light Gradient Boosting Machine 0.9838 0.9997 0.9840 0.9859 \n", + "dt Decision Tree Classifier 0.9792 0.9891 0.9794 0.9813 \n", + "gbc Gradient Boosting Classifier 0.9786 0.9998 0.9781 0.9826 \n", + "knn K Neighbors Classifier 0.9669 0.9969 0.9661 0.9704 \n", + "lr Logistic Regression 0.9448 0.9985 0.9437 0.9505 \n", + "lda Linear Discriminant Analysis 0.9448 0.9993 0.9444 0.9517 \n", + "svm SVM - Linear Kernel 0.5673 0.0000 0.5671 0.5995 \n", + "ridge Ridge Classifier 0.5348 0.0000 0.5179 0.4823 \n", + "ada Ada Boost Classifier 0.1767 0.6750 0.1682 0.0913 \n", + "dummy Dummy Classifier 0.0520 0.5000 0.0455 0.0027 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "rf 0.9895 0.9891 0.9892 0.631 \n", + "nb 0.9879 0.9877 0.9879 0.030 \n", + "et 0.9875 0.9871 0.9872 0.510 \n", + "qda 0.9848 0.9843 0.9844 0.030 \n", + "lightgbm 0.9838 0.9830 0.9831 0.912 \n", + "dt 0.9790 0.9782 0.9783 0.031 \n", + "gbc 0.9788 0.9775 0.9777 6.166 \n", + "knn 0.9664 0.9653 0.9655 0.125 \n", + "lr 0.9446 0.9421 0.9424 2.338 \n", + "lda 0.9432 0.9421 0.9426 0.032 \n", + "svm 0.5295 0.5469 0.5743 0.120 \n", + "ridge 0.4544 0.5117 0.5236 0.017 \n", + "ada 0.1070 0.1326 0.2223 0.219 \n", + "dummy 0.0051 0.0000 0.0000 0.024 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "1yxgZDazvZcS" + }, + "source": [ + "**When Threshold is increased to 0.8**" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "0c746ea40f204ab399fb8b1c9244da46", + "017e0f0f2fbe478f9a3b1045d92a72de", + "447d58fbe53745a79d8bfc43cba7a3e4", + 
"6569f12f7f1b43f6acd5eaeb1867205d", + "4af4d5e36f174f23b592040a83ea4392", + "80f1ef7f786640cfac147d9ec65a5ad8" + ] + }, + "id": "8rzW7L-WvghD", + "outputId": "1ff7083c-281b-4e5e-fb94-51e9e0cb501e" + }, + "source": [ + "s = setup(data=cropDataSet, target='label', feature_selection = True, feature_selection_threshold = 0.8, silent=True)\n", + "cm = compare_models()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
rfRandom Forest Classifier0.99221.00000.99200.99350.99210.99180.99190.612
etExtra Trees Classifier0.99091.00000.99060.99230.99080.99050.99050.521
qdaQuadratic Discriminant Analysis0.98961.00000.98960.99090.98950.98910.98920.030
nbNaive Bayes0.98900.99990.98900.99050.98890.98840.98850.030
gbcGradient Boosting Classifier0.98640.99990.98630.98820.98640.98570.98586.559
dtDecision Tree Classifier0.98440.99180.98450.98650.98430.98370.98380.031
lightgbmLight Gradient Boosting Machine0.98440.99990.98460.98630.98430.98370.98380.908
knnK Neighbors Classifier0.97460.99870.97490.97860.97440.97340.97370.124
ldaLinear Discriminant Analysis0.96750.99960.96820.97390.96710.96600.96630.030
lrLogistic Regression0.95970.99950.96000.96470.95910.95780.95811.995
ridgeRidge Classifier0.70890.00000.70240.70060.65690.69480.70210.021
svmSVM - Linear Kernel0.68940.00000.68790.75550.67310.67440.69420.089
adaAda Boost Classifier0.18390.68800.18180.09820.11420.14190.23030.221
dummyDummy Classifier0.05000.50000.04550.00250.00480.00000.00000.022
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "rf Random Forest Classifier 0.9922 1.0000 0.9920 0.9935 \n", + "et Extra Trees Classifier 0.9909 1.0000 0.9906 0.9923 \n", + "qda Quadratic Discriminant Analysis 0.9896 1.0000 0.9896 0.9909 \n", + "nb Naive Bayes 0.9890 0.9999 0.9890 0.9905 \n", + "gbc Gradient Boosting Classifier 0.9864 0.9999 0.9863 0.9882 \n", + "dt Decision Tree Classifier 0.9844 0.9918 0.9845 0.9865 \n", + "lightgbm Light Gradient Boosting Machine 0.9844 0.9999 0.9846 0.9863 \n", + "knn K Neighbors Classifier 0.9746 0.9987 0.9749 0.9786 \n", + "lda Linear Discriminant Analysis 0.9675 0.9996 0.9682 0.9739 \n", + "lr Logistic Regression 0.9597 0.9995 0.9600 0.9647 \n", + "ridge Ridge Classifier 0.7089 0.0000 0.7024 0.7006 \n", + "svm SVM - Linear Kernel 0.6894 0.0000 0.6879 0.7555 \n", + "ada Ada Boost Classifier 0.1839 0.6880 0.1818 0.0982 \n", + "dummy Dummy Classifier 0.0500 0.5000 0.0455 0.0025 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "rf 0.9921 0.9918 0.9919 0.612 \n", + "et 0.9908 0.9905 0.9905 0.521 \n", + "qda 0.9895 0.9891 0.9892 0.030 \n", + "nb 0.9889 0.9884 0.9885 0.030 \n", + "gbc 0.9864 0.9857 0.9858 6.559 \n", + "dt 0.9843 0.9837 0.9838 0.031 \n", + "lightgbm 0.9843 0.9837 0.9838 0.908 \n", + "knn 0.9744 0.9734 0.9737 0.124 \n", + "lda 0.9671 0.9660 0.9663 0.030 \n", + "lr 0.9591 0.9578 0.9581 1.995 \n", + "ridge 0.6569 0.6948 0.7021 0.021 \n", + "svm 0.6731 0.6744 0.6942 0.089 \n", + "ada 0.1142 0.1419 0.2303 0.221 \n", + "dummy 0.0048 0.0000 0.0000 0.022 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "affIBZhevkSS" + }, + "source": [ + "**When Threshold is decreased to 0.4**" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "db4e51edffaf466c8a1a412095446f57", + "51ccf98d9bb54a0cbf3df2fbd90c82b6", + "c8ae01a51cd44aca9c56fbae5d6a4a0c", + 
"c6af45d2d3244894ab43aa11587569fb", + "f569da0783864292890fb8bf352b1a0d", + "2b4cc526625e4736834375327176a117" + ] + }, + "id": "xW6UHzRBvpuX", + "outputId": "5f62672f-5437-4555-82b4-71b3b08a101a" + }, + "source": [ + "s = setup(data=cropDataSet, target='label', feature_selection = True, feature_selection_threshold = 0.4, silent=True)\n", + "cm = compare_models()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
nbNaive Bayes0.96100.99890.95840.96820.95990.95910.95960.031
qdaQuadratic Discriminant Analysis0.95840.99880.95590.96590.95740.95640.95690.032
rfRandom Forest Classifier0.95710.99810.95450.96180.95660.95510.95540.591
etExtra Trees Classifier0.94870.99770.94600.95460.94800.94620.94650.531
lightgbmLight Gradient Boosting Machine0.94740.99700.94460.95330.94730.94480.94520.843
gbcGradient Boosting Classifier0.94610.99760.94290.95210.94560.94350.94385.157
dtDecision Tree Classifier0.93960.96840.93690.94460.93900.93670.93700.030
knnK Neighbors Classifier0.93570.99120.93230.94510.93320.93260.93320.126
ldaLinear Discriminant Analysis0.89340.99570.89070.90680.88780.88830.88950.029
lrLogistic Regression0.83820.99080.83780.84590.83250.83040.83141.979
svmSVM - Linear Kernel0.33590.00000.33980.28460.28040.30520.36550.121
ridgeRidge Classifier0.26970.00000.26830.12500.14970.23460.24780.019
adaAda Boost Classifier0.23390.70320.22730.16420.17470.19390.30300.209
dummyDummy Classifier0.05130.50000.04550.00260.00500.00000.00000.021
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "nb Naive Bayes 0.9610 0.9989 0.9584 0.9682 \n", + "qda Quadratic Discriminant Analysis 0.9584 0.9988 0.9559 0.9659 \n", + "rf Random Forest Classifier 0.9571 0.9981 0.9545 0.9618 \n", + "et Extra Trees Classifier 0.9487 0.9977 0.9460 0.9546 \n", + "lightgbm Light Gradient Boosting Machine 0.9474 0.9970 0.9446 0.9533 \n", + "gbc Gradient Boosting Classifier 0.9461 0.9976 0.9429 0.9521 \n", + "dt Decision Tree Classifier 0.9396 0.9684 0.9369 0.9446 \n", + "knn K Neighbors Classifier 0.9357 0.9912 0.9323 0.9451 \n", + "lda Linear Discriminant Analysis 0.8934 0.9957 0.8907 0.9068 \n", + "lr Logistic Regression 0.8382 0.9908 0.8378 0.8459 \n", + "svm SVM - Linear Kernel 0.3359 0.0000 0.3398 0.2846 \n", + "ridge Ridge Classifier 0.2697 0.0000 0.2683 0.1250 \n", + "ada Ada Boost Classifier 0.2339 0.7032 0.2273 0.1642 \n", + "dummy Dummy Classifier 0.0513 0.5000 0.0455 0.0026 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "nb 0.9599 0.9591 0.9596 0.031 \n", + "qda 0.9574 0.9564 0.9569 0.032 \n", + "rf 0.9566 0.9551 0.9554 0.591 \n", + "et 0.9480 0.9462 0.9465 0.531 \n", + "lightgbm 0.9473 0.9448 0.9452 0.843 \n", + "gbc 0.9456 0.9435 0.9438 5.157 \n", + "dt 0.9390 0.9367 0.9370 0.030 \n", + "knn 0.9332 0.9326 0.9332 0.126 \n", + "lda 0.8878 0.8883 0.8895 0.029 \n", + "lr 0.8325 0.8304 0.8314 1.979 \n", + "svm 0.2804 0.3052 0.3655 0.121 \n", + "ridge 0.1497 0.2346 0.2478 0.019 \n", + "ada 0.1747 0.1939 0.3030 0.209 \n", + "dummy 0.0050 0.0000 0.0000 0.021 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "kt034D2wim2C" + }, + "source": [ + "---\n", + "### **2.3 Model Performance using \"Outlier Removal\"**\n", + "---" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "4d97448b0669441088bc1de94e9dc607", + "c91b2e4623f34177906f987bec76baf9", + 
"ac7d7c15b58e42feb475769f33a49f9d", + "4ec49eefe7b540309e3e519c7910f01b", + "5b2685d48b934e9cbbc7fab76fbe298c", + "29d19e3812564b86baa4871b47e78df9" + ] + }, + "id": "oAaDhJctim2D", + "outputId": "723da45e-33b0-44f3-99ad-5fdcddb76354" + }, + "source": [ + "s = setup(data=cropDataSet, target='label', remove_outliers = True, outliers_threshold = 0.05, silent=True)\n", + "cm = compare_models()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
rfRandom Forest Classifier0.99521.00000.99530.99570.99520.99500.99500.572
nbNaive Bayes0.99450.99990.99470.99490.99450.99430.99430.027
etExtra Trees Classifier0.99320.99990.99340.99360.99310.99280.99290.489
qdaQuadratic Discriminant Analysis0.99180.99990.99210.99230.99160.99140.99140.028
lightgbmLight Gradient Boosting Machine0.98970.99980.99010.99100.98980.98920.98930.917
dtDecision Tree Classifier0.98630.99280.98600.98790.98610.98570.98570.028
gbcGradient Boosting Classifier0.98430.99980.98470.98660.98420.98350.98366.434
knnK Neighbors Classifier0.97470.99940.97510.97750.97440.97340.97360.131
lrLogistic Regression0.96850.99950.96950.97100.96830.96700.96721.682
ldaLinear Discriminant Analysis0.96850.99970.96980.97460.96780.96700.96740.026
ridgeRidge Classifier0.72020.00000.70010.66120.65130.70640.71300.015
svmSVM - Linear Kernel0.69220.00000.69190.76540.67870.67670.70060.076
adaAda Boost Classifier0.20930.68280.20450.13260.14540.16580.27210.202
dummyDummy Classifier0.05400.50000.04550.00290.00550.00000.00000.022
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "rf Random Forest Classifier 0.9952 1.0000 0.9953 0.9957 \n", + "nb Naive Bayes 0.9945 0.9999 0.9947 0.9949 \n", + "et Extra Trees Classifier 0.9932 0.9999 0.9934 0.9936 \n", + "qda Quadratic Discriminant Analysis 0.9918 0.9999 0.9921 0.9923 \n", + "lightgbm Light Gradient Boosting Machine 0.9897 0.9998 0.9901 0.9910 \n", + "dt Decision Tree Classifier 0.9863 0.9928 0.9860 0.9879 \n", + "gbc Gradient Boosting Classifier 0.9843 0.9998 0.9847 0.9866 \n", + "knn K Neighbors Classifier 0.9747 0.9994 0.9751 0.9775 \n", + "lr Logistic Regression 0.9685 0.9995 0.9695 0.9710 \n", + "lda Linear Discriminant Analysis 0.9685 0.9997 0.9698 0.9746 \n", + "ridge Ridge Classifier 0.7202 0.0000 0.7001 0.6612 \n", + "svm SVM - Linear Kernel 0.6922 0.0000 0.6919 0.7654 \n", + "ada Ada Boost Classifier 0.2093 0.6828 0.2045 0.1326 \n", + "dummy Dummy Classifier 0.0540 0.5000 0.0455 0.0029 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "rf 0.9952 0.9950 0.9950 0.572 \n", + "nb 0.9945 0.9943 0.9943 0.027 \n", + "et 0.9931 0.9928 0.9929 0.489 \n", + "qda 0.9916 0.9914 0.9914 0.028 \n", + "lightgbm 0.9898 0.9892 0.9893 0.917 \n", + "dt 0.9861 0.9857 0.9857 0.028 \n", + "gbc 0.9842 0.9835 0.9836 6.434 \n", + "knn 0.9744 0.9734 0.9736 0.131 \n", + "lr 0.9683 0.9670 0.9672 1.682 \n", + "lda 0.9678 0.9670 0.9674 0.026 \n", + "ridge 0.6513 0.7064 0.7130 0.015 \n", + "svm 0.6787 0.6767 0.7006 0.076 \n", + "ada 0.1454 0.1658 0.2721 0.202 \n", + "dummy 0.0055 0.0000 0.0000 0.022 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "9IIR2eMyim2E" + }, + "source": [ + "\n", + "### **2.4 Model Performance using \"PCA\"**\n", + "---" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 488, + "referenced_widgets": [ + "03a1c790ef41418291e4f80ba7828a47", + "da2198944b6045e2ac84185ccacbe869", + 
"a025df127a9f49b482e5f95693de90c4", + "e803d5985cbf441ebb877da74cc47699", + "76bf50cb26144c4bbc0ebcb7fa71709e", + "c637685280d74a898eb266d991ccf636" + ] + }, + "id": "IbRChxn3im2E", + "outputId": "a66ce3f4-6b83-4cd2-b8ea-1c6392a36f29" + }, + "source": [ + "s = setup(data=cropDataSet, target='label', pca = True, pca_method = 'linear', silent=True)\n", + "cm = compare_models()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ModelAccuracyAUCRecallPrec.F1KappaMCCTT (Sec)
qdaQuadratic Discriminant Analysis0.98770.99990.98740.98870.98770.98710.98710.028
etExtra Trees Classifier0.98510.99980.98460.98680.98490.98430.98440.494
nbNaive Bayes0.98440.99990.98420.98690.98430.98370.98380.028
rfRandom Forest Classifier0.98370.99930.98340.98590.98380.98300.98310.620
lrLogistic Regression0.97990.99980.97930.98220.97960.97890.97901.740
knnK Neighbors Classifier0.97660.99840.97600.97900.97650.97550.97560.126
lightgbmLight Gradient Boosting Machine0.97140.99920.97120.97400.97140.97000.97021.007
dtDecision Tree Classifier0.95780.97790.95670.96230.95760.95570.95600.030
ldaLinear Discriminant Analysis0.95650.99940.95560.96330.95650.95440.95470.026
gbcGradient Boosting Classifier0.95580.99900.95520.96300.95650.95370.95406.285
svmSVM - Linear Kernel0.77780.00000.77560.76340.73940.76720.77290.067
ridgeRidge Classifier0.61530.00000.60270.53780.52690.59660.60740.014
adaAda Boost Classifier0.14490.62970.13700.08250.08590.09980.19430.206
dummyDummy Classifier0.05070.50000.04550.00260.00490.00000.00000.023
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " Model Accuracy AUC Recall Prec. \\\n", + "qda Quadratic Discriminant Analysis 0.9877 0.9999 0.9874 0.9887 \n", + "et Extra Trees Classifier 0.9851 0.9998 0.9846 0.9868 \n", + "nb Naive Bayes 0.9844 0.9999 0.9842 0.9869 \n", + "rf Random Forest Classifier 0.9837 0.9993 0.9834 0.9859 \n", + "lr Logistic Regression 0.9799 0.9998 0.9793 0.9822 \n", + "knn K Neighbors Classifier 0.9766 0.9984 0.9760 0.9790 \n", + "lightgbm Light Gradient Boosting Machine 0.9714 0.9992 0.9712 0.9740 \n", + "dt Decision Tree Classifier 0.9578 0.9779 0.9567 0.9623 \n", + "lda Linear Discriminant Analysis 0.9565 0.9994 0.9556 0.9633 \n", + "gbc Gradient Boosting Classifier 0.9558 0.9990 0.9552 0.9630 \n", + "svm SVM - Linear Kernel 0.7778 0.0000 0.7756 0.7634 \n", + "ridge Ridge Classifier 0.6153 0.0000 0.6027 0.5378 \n", + "ada Ada Boost Classifier 0.1449 0.6297 0.1370 0.0825 \n", + "dummy Dummy Classifier 0.0507 0.5000 0.0455 0.0026 \n", + "\n", + " F1 Kappa MCC TT (Sec) \n", + "qda 0.9877 0.9871 0.9871 0.028 \n", + "et 0.9849 0.9843 0.9844 0.494 \n", + "nb 0.9843 0.9837 0.9838 0.028 \n", + "rf 0.9838 0.9830 0.9831 0.620 \n", + "lr 0.9796 0.9789 0.9790 1.740 \n", + "knn 0.9765 0.9755 0.9756 0.126 \n", + "lightgbm 0.9714 0.9700 0.9702 1.007 \n", + "dt 0.9576 0.9557 0.9560 0.030 \n", + "lda 0.9565 0.9544 0.9547 0.026 \n", + "gbc 0.9565 0.9537 0.9540 6.285 \n", + "svm 0.7394 0.7672 0.7729 0.067 \n", + "ridge 0.5269 0.5966 0.6074 0.014 \n", + "ada 0.0859 0.0998 0.1943 0.206 \n", + "dummy 0.0049 0.0000 0.0000 0.023 " + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "YBbGvYyvyrLZ" + }, + "source": [ + "**kernel : dimensionality reduction through the use of RBF kernel.**" + ] + }, + { + "cell_type": "code", + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 182 + }, + "id": "4KhTwkKjy0ma", + "outputId": "59d8805f-1a7f-480f-de06-8a1dc68d5782" + }, + "source": [ + "s = 
setup(data=cropDataSet, target='label', pca = True, pca_method = 'kernel', silent=True)\n", + "cm = compare_models()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "error", + "ename": "NameError", + "evalue": "ignored", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mNameError\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0ms\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0msetup\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcropDataSet\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtarget\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m'label'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mpca\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mTrue\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mpca_method\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m'kernel'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0msilent\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 2\u001b[0m \u001b[0mcm\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcompare_models\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mNameError\u001b[0m: name 'setup' is not defined" + ] + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "VC3iI98s1BtE" + }, + "source": [ + "k_range = range(1,11)\n", + "scores = []\n", + "\n", + "for k in k_range:\n", + " knn = KNeighborsClassifier(n_neighbors = k)\n", + " knn.fit(X_train_scaled, y_train)\n", + " scores.append(knn.score(X_test_scaled, y_test))\n", + "\n", + "plt.xlabel('k')\n", + "plt.ylabel('accuracy')\n", + "plt.scatter(k_range, scores)\n", + "plt.vlines(k_range,0, scores, linestyle=\"dashed\")\n", + "plt.ylim(0.96,0.99)\n", + "plt.xticks([i for i in range(1,11)]);" + ], + 
"execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "from pycaret.datasets import get_data\n", + "from pycaret.classification import *\n", + "\n", + " # SN is 46\n", + "s = setup(data=cropDataSet, target='label', normalize = True, normalize_method = 'zscore', silent=True)\n", + "\n", + "nbModel = create_model('nb')\n", + "plot_model(nbModel, plot='confusion_matrix')\n" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 374 + }, + "id": "KgegJAMLEAJC", + "outputId": "36f8e68c-8c68-4ce9-9d22-5bd5d8e7d98a" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "error", + "ename": "ModuleNotFoundError", + "evalue": "ignored", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0;32mfrom\u001b[0m \u001b[0mpycaret\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdatasets\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mget_data\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 2\u001b[0m \u001b[0;32mfrom\u001b[0m \u001b[0mpycaret\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mclassification\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 3\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 4\u001b[0m \u001b[0;31m# SN is 46\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 5\u001b[0m \u001b[0ms\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0msetup\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcropDataSet\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtarget\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m'label'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnormalize\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0;32mTrue\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnormalize_method\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m'zscore'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0msilent\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mModuleNotFoundError\u001b[0m: No module named 'pycaret'", + "", + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0;32m\nNOTE: If your import is failing due to a missing package, you can\nmanually install dependencies using either !pip or !apt.\n\nTo view examples of installing some common dependencies, click the\n\"Open Examples\" button below.\n\u001b[0;31m---------------------------------------------------------------------------\u001b[0m\n" + ], + "errorDetails": { + "actions": [ + { + "action": "open_url", + "actionText": "Open Examples", + "url": "/notebooks/snippets/importing_libraries.ipynb" + } + ] + } + } + ] + }, + { + "cell_type": "code", + "source": [ + "sm = save_model(nbModel, 'nbModelFile')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "XxRIJFMPEzse", + "outputId": "f1f8a4ca-b8c6-42a4-d14b-e96a774978d4" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Transformation Pipeline and Model Successfully Saved\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "nbModel = load_model('nbModelFile')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "Z8ZTQv6XF8PJ", + "outputId": "50e10b43-d001-4e30-f21e-f81c42f71692" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Transformation Pipeline and Model Successfully Loaded\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "newDataSet = cropDataSet.iloc[:2]\n", + "newDataSet" + ], + "metadata": { + "colab": { + "base_uri": 
"https://localhost:8080/", + "height": 112 + }, + "id": "vbiV0Z5VGC12", + "outputId": "e3cd46e5-0caf-4ae8-8cd8-dcb12c49dac6" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NPKtemperaturehumidityphrainfalllabel
090424320.87974482.0027446.502985202.935536rice
185584121.77046280.3196447.038096226.655537rice
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " N P K temperature humidity ph rainfall label\n", + "0 90 42 43 20.879744 82.002744 6.502985 202.935536 rice\n", + "1 85 58 41 21.770462 80.319644 7.038096 226.655537 rice" + ] + }, + "metadata": {}, + "execution_count": 62 + } + ] + }, + { + "cell_type": "code", + "source": [ + "newDataSet1 = cropDataSet.iloc[500:502]\n", + "newDataSet1" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 112 + }, + "id": "61I1wItobd6_", + "outputId": "fd2632c3-229e-48e5-bdca-6b4a9167b6b2" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NPKtemperaturehumidityphrainfalllabel
5003491827.91095264.7093063.69286432.678919mothbeans
50122592327.32220651.2786884.37174636.503791mothbeans
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " N P K temperature humidity ph rainfall label\n", + "500 3 49 18 27.910952 64.709306 3.692864 32.678919 mothbeans\n", + "501 22 59 23 27.322206 51.278688 4.371746 36.503791 mothbeans" + ] + }, + "metadata": {}, + "execution_count": 61 + } + ] + }, + { + "cell_type": "code", + "source": [ + "newDataSet2 = cropDataSet.iloc[300:302]\n", + "newDataSet2" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 112 + }, + "id": "mmuuekEybkwB", + "outputId": "ecf861c9-46f4-47dc-a921-27cd37fcb2bf" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NPKtemperaturehumidityphrainfalllabel
30013602517.13692820.5954175.685972128.256862kidneybeans
30125701619.63474318.9070565.759237106.359818kidneybeans
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " N P K temperature humidity ph rainfall label\n", + "300 13 60 25 17.136928 20.595417 5.685972 128.256862 kidneybeans\n", + "301 25 70 16 19.634743 18.907056 5.759237 106.359818 kidneybeans" + ] + }, + "metadata": {}, + "execution_count": 60 + } + ] + }, + { + "cell_type": "code", + "source": [ + "newDataSet3 = cropDataSet.iloc[800:802]\n", + "newDataSet3" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 112 + }, + "id": "FVl0lHoUb50p", + "outputId": "a312fc93-b946-499c-9d6e-61af7d07a4c9" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NPKtemperaturehumidityphrainfalllabel
80032761528.05153663.4980227.60411043.357954lentil
80113612219.44084363.2777157.72883246.831301lentil
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " N P K temperature humidity ph rainfall label\n", + "800 32 76 15 28.051536 63.498022 7.604110 43.357954 lentil\n", + "801 13 61 22 19.440843 63.277715 7.728832 46.831301 lentil" + ] + }, + "metadata": {}, + "execution_count": 67 + } + ] + }, + { + "cell_type": "code", + "source": [ + "newDataSet4 = cropDataSet.iloc[1000:1002]\n", + "newDataSet4" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 112 + }, + "id": "anTWFEnCb-W5", + "outputId": "87187e93-6f31-4c62-d9cf-8b672cfadb3f" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NPKtemperaturehumidityphrainfalllabel
100091944629.36792476.2490016.14993492.828409banana
1001105955027.33369083.6767525.849076101.049479banana
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " N P K temperature humidity ph rainfall label\n", + "1000 91 94 46 29.367924 76.249001 6.149934 92.828409 banana\n", + "1001 105 95 50 27.333690 83.676752 5.849076 101.049479 banana" + ] + }, + "metadata": {}, + "execution_count": 68 + } + ] + }, + { + "cell_type": "code", + "source": [ + "frames = [newDataSet, newDataSet1, newDataSet2, newDataSet3, newDataSet4]\n", + "result = pd.concat(frames)\n", + "#display(result)\n", + "result" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 363 + }, + "id": "cMQJ2DPncP6K", + "outputId": "16352c64-d005-40b1-b3c3-2273778e60f5" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NPKtemperaturehumidityphrainfalllabel
090424320.87974482.0027446.502985202.935536rice
185584121.77046280.3196447.038096226.655537rice
5003491827.91095264.7093063.69286432.678919mothbeans
50122592327.32220651.2786884.37174636.503791mothbeans
30013602517.13692820.5954175.685972128.256862kidneybeans
30125701619.63474318.9070565.759237106.359818kidneybeans
80032761528.05153663.4980227.60411043.357954lentil
80113612219.44084363.2777157.72883246.831301lentil
100091944629.36792476.2490016.14993492.828409banana
1001105955027.33369083.6767525.849076101.049479banana
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " N P K temperature humidity ph rainfall label\n", + "0 90 42 43 20.879744 82.002744 6.502985 202.935536 rice\n", + "1 85 58 41 21.770462 80.319644 7.038096 226.655537 rice\n", + "500 3 49 18 27.910952 64.709306 3.692864 32.678919 mothbeans\n", + "501 22 59 23 27.322206 51.278688 4.371746 36.503791 mothbeans\n", + "300 13 60 25 17.136928 20.595417 5.685972 128.256862 kidneybeans\n", + "301 25 70 16 19.634743 18.907056 5.759237 106.359818 kidneybeans\n", + "800 32 76 15 28.051536 63.498022 7.604110 43.357954 lentil\n", + "801 13 61 22 19.440843 63.277715 7.728832 46.831301 lentil\n", + "1000 91 94 46 29.367924 76.249001 6.149934 92.828409 banana\n", + "1001 105 95 50 27.333690 83.676752 5.849076 101.049479 banana" + ] + }, + "metadata": {}, + "execution_count": 70 + } + ] + }, + { + "cell_type": "code", + "source": [ + "newPredictions = predict_model(nbModel, data = result)\n", + "newPredictions" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 363 + }, + "id": "bEz9ouhgHCRX", + "outputId": "c78cb74d-e09b-49b5-da8d-81c143031f13" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NPKtemperaturehumidityphrainfalllabelLabelScore
090424320.87974482.0027446.502985202.935536ricerice0.9982
185584121.77046280.3196447.038096226.655537ricerice0.9997
5003491827.91095264.7093063.69286432.678919mothbeansmothbeans1.0000
50122592327.32220651.2786884.37174636.503791mothbeansmothbeans0.9994
30013602517.13692820.5954175.685972128.256862kidneybeanskidneybeans0.9997
30125701619.63474318.9070565.759237106.359818kidneybeanskidneybeans0.9999
80032761528.05153663.4980227.60411043.357954lentillentil0.9998
80113612219.44084363.2777157.72883246.831301lentillentil1.0000
100091944629.36792476.2490016.14993492.828409bananabanana1.0000
1001105955027.33369083.6767525.849076101.049479bananabanana1.0000
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " N P K temperature ... rainfall label Label Score\n", + "0 90 42 43 20.879744 ... 202.935536 rice rice 0.9982\n", + "1 85 58 41 21.770462 ... 226.655537 rice rice 0.9997\n", + "500 3 49 18 27.910952 ... 32.678919 mothbeans mothbeans 1.0000\n", + "501 22 59 23 27.322206 ... 36.503791 mothbeans mothbeans 0.9994\n", + "300 13 60 25 17.136928 ... 128.256862 kidneybeans kidneybeans 0.9997\n", + "301 25 70 16 19.634743 ... 106.359818 kidneybeans kidneybeans 0.9999\n", + "800 32 76 15 28.051536 ... 43.357954 lentil lentil 0.9998\n", + "801 13 61 22 19.440843 ... 46.831301 lentil lentil 1.0000\n", + "1000 91 94 46 29.367924 ... 92.828409 banana banana 1.0000\n", + "1001 105 95 50 27.333690 ... 101.049479 banana banana 1.0000\n", + "\n", + "[10 rows x 10 columns]" + ] + }, + "metadata": {}, + "execution_count": 71 + } + ] + }, + { + "cell_type": "code", + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "# newPredictions ends with the columns 'label', 'Label', 'Score' (see the table above).\n", + "predicted = newPredictions.iloc[:,-2] # 'Label': predicted crop (2nd last column)\n", + "actual = newPredictions.iloc[:,-3] # 'label': ground-truth crop (3rd last column)\n", + "\n", + "# scatter(x, y) puts the actual labels on x and the predictions on y; axis labels must match.\n", + "plt.scatter(actual, predicted)\n", + "plt.xlabel('Actual')\n", + "plt.ylabel('Predicted')\n", + "plt.title('Actual Vs Predicted')\n", + "plt.savefig(\"result-scatter-plot.jpg\", dpi=300)\n", + "plt.show()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 376 + }, + "id": "QRYjUEz0HM5-", + "outputId": "0c3199a2-618c-4c18-8ec0-3a6531271b7a" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "plot_model(nbModel, plot='error')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 399, + "referenced_widgets": [ + "e353c2e9634a41cc9754b120750c37b2", + "396885cfdccc48bb8f1cfd0223c97aa5", + "0568e477bbb745e68f7bd06a18056d9e" + ] + }, + "id": "RIwgRM24HmYr", + "outputId": "b73f7c79-41bf-436c-dbfd-933b03610e4b" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "nbModel = create_model('nb', verbose=True)\n", + "plot_model(nbModel, plot='learning')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 376, + "referenced_widgets": [ + "0c7a96b7437d4f439ee58a7348112c07", + "3957ae44c0b64b01b4420040a5a107da", + "dac75abfd15a434bb8a399900709f4c6", + "d5fa15c649734224a62b0416f1589e4c", + "bd048ed3009f474a99c795838ae4e809", + "3adfd8382a004ba493cf96f2228d28ed" + ] + }, + "id": "rF9WUkQlH62o", + "outputId": "cdba6326-2d91-4346-929b-95e215a9f9ff" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "nbModel = create_model('nb', verbose=True)\n", + "plot_model(nbModel, plot='vc')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 376, + "referenced_widgets": [ + "ca525e1c57d541299c9b4862c1fea11d", + "1dcfa769f8254370a963327b6f74b159", + "723e82f233be473789f249ecf0703ee2", + "e31ab003321c43b49caec0a8a7dde1cd", + "4647c3143e1340ff84efd9f4b3851a2a", + "db6f2f19b0e043cc8a0f71a3f9b49095" + ] + }, + "id": "5VzE-IXfRUJy", + "outputId": "2bbc20a3-c374-4761-adff-6902a99b74b6" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "rfModel = create_model('rf', verbose=False)\n", + "plot_model(rfModel, plot='feature')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 478, + "referenced_widgets": [ + "a5c08029facf463a9683e5f23797fbcc", + "8257770e8802452db5e40e16c40c80da", + "b4c98f4b9fc646ebbf1e1c0d0ee9d3fc" + ] + }, + "id": "0tiJcVv5RooV", + "outputId": "196ef4da-4da5-44de-ff7a-06020022eb41" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "etModel = create_model('et', verbose=False)\n", + "plot_model(etModel, plot='feature')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 478, + "referenced_widgets": [ + "db14ff1586104c1bb34e607996c13318", + "50d16bc916de4be295898de3aca4a08d", + "315962e470d04c78a2afc0a866afc592" + ] + }, + "id": "BzkVfLQVTCEp", + "outputId": "ebe5ab3f-869f-4d38-88f9-435c9fa8081a" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "display_data", + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": {} + } + ] + } + ] +} \ No newline at end of file diff --git a/scripts/Crop Prediction Model/Readme.md b/scripts/Crop Prediction Model/Readme.md new file mode 100644 index 0000000..32e2ed1 --- /dev/null +++ b/scripts/Crop Prediction Model/Readme.md @@ -0,0 +1,11 @@ +# Crop Prediction Model + +A machine learning model that predicts the most suitable crop to grow on a particular piece of land based on factors such as humidity, pH, and rainfall. + +## Data set used + +The data set is taken from Kaggle and includes data for several crops. +Link: https://www.kaggle.com/datasets/atharvaingle/crop-recommendation-dataset + +## PyCaret +I used PyCaret to compare all the classification models and tuned them for the best results. diff --git a/scripts/Fetching trending stocks using nlp/Readme.md b/scripts/Fetching trending stocks using nlp/Readme.md new file mode 100644 index 0000000..a0b1c33 --- /dev/null +++ b/scripts/Fetching trending stocks using nlp/Readme.md @@ -0,0 +1,5 @@ +## How to run the app +To run the app, open a terminal in this directory and run the +command: `streamlit run app.py` + +Note: It can take 5-10 minutes to load and show the trending stocks. 
diff --git a/scripts/Fetching trending stocks using nlp/app.py b/scripts/Fetching trending stocks using nlp/app.py new file mode 100644 index 0000000..362f329 --- /dev/null +++ b/scripts/Fetching trending stocks using nlp/app.py @@ -0,0 +1,104 @@
+import pandas as pd
+import requests
+import spacy
+import streamlit as st
+import os
+
+from spacy import displacy
+from bs4 import BeautifulSoup
+import yfinance as yf
+import matplotlib
+
+st.title('Trending Stocks :zap:')
+
+# Feed that is always scanned in addition to the link supplied by the user.
+DEFAULT_RSS_URL = 'https://economictimes.indiatimes.com/markets/stocks/rssfeeds/2146842.cms'
+# Seconds to wait on a feed before giving up, so a dead server cannot hang the app.
+REQUEST_TIMEOUT = 30
+
+
+def extract_text_from_rss(rss_link):
+    """Collect the <title> tags of the built-in feed and of ``rss_link``.
+
+    Each feed is downloaded with requests and parsed with BeautifulSoup's lxml
+    parser. Returns a list of tags: the built-in feed's titles first, then the
+    titles found at ``rss_link``.
+    """
+    headings = []
+    for url in (DEFAULT_RSS_URL, rss_link):
+        response = requests.get(url, timeout=REQUEST_TIMEOUT)
+        soup = BeautifulSoup(response.content, features='lxml')
+        headings += soup.find_all('title')
+    return headings
+
+
+# Column-wise accumulator for the output table; stock_info() appends one value
+# to every list for each company it manages to quote.
+token_dict = {
+    'Org': [],
+    'Symbol': [],
+    'currentPrice': [],
+    'dayHigh': [],
+    'dayLow': [],
+    'forwardPE': [],
+    'dividendYield': []
+}
+# Keys read from the yfinance info mapping for each matched symbol.
+QUOTE_FIELDS = ('currentPrice', 'dayHigh', 'dayLow', 'forwardPE', 'dividendYield')
+nlp = spacy.load("en_core_web_sm")
+
+
+def stock_info(headings):
+    """Return a DataFrame of quote data for listed companies named in ``headings``.
+
+    Every named entity spaCy finds in a heading's text is searched for, as a
+    literal substring, in the 'Company Name' column of
+    ./data/ind_nifty500list.csv. The first matching row supplies the company
+    name and symbol, and the quote fields are read from yfinance for the
+    symbol with ".NS" appended.
+
+    Results accumulate in the module-level ``token_dict``. A company is added
+    only after every quote field has been read, so the lists in ``token_dict``
+    always have equal lengths and the DataFrame can be built.
+    """
+    stocks_df = pd.read_csv("./data/ind_nifty500list.csv")
+    company_names = stocks_df['Company Name']
+    for title in headings:
+        doc = nlp(title.text)
+        for entity in doc.ents:
+            if not entity.text:
+                continue
+            # regex=False: names such as "Affle (India)" must match literally
+            # rather than be compiled as a pattern.
+            matches = stocks_df[company_names.str.contains(entity.text, regex=False, na=False)]
+            if matches.empty:
+                continue
+            symbol = matches['Symbol'].values[0]
+            org_name = matches['Company Name'].values[0]
+            print(symbol+".NS")
+            try:
+                info = yf.Ticker(symbol+".NS").info
+                quote = {field: info[field] for field in QUOTE_FIELDS}
+            except Exception:
+                # Best effort: a failed lookup or a missing field skips this
+                # company instead of aborting the whole scan.
+                continue
+            token_dict['Org'].append(org_name)
+            token_dict['Symbol'].append(symbol)
+            for field in QUOTE_FIELDS:
+                token_dict[field].append(quote[field])
+    output_df = pd.DataFrame(token_dict)
+    return output_df
+
+
+user_input = st.text_input("Add your RSS link here!", "https://www.moneycontrol.com/rss/buzzingstocks.xml")
+
+fin_headings = extract_text_from_rss(user_input)
+
+output_df = stock_info(fin_headings)
+output_df.drop_duplicates(inplace=True)
+st.dataframe(output_df)
+
+with st.expander("Expand for Financial News!"):
+    for h in fin_headings:
+        st.markdown("* " + h.text)
diff --git a/scripts/Fetching trending stocks using nlp/data/History_102.txt b/scripts/Fetching trending stocks using nlp/data/History_102.txt new file mode 100644 index 0000000..68e6acb --- /dev/null +++ b/scripts/Fetching trending stocks using nlp/data/History_102.txt @@ -0,0 +1,53 @@ +0 Betancourt, Rómulo +The chief long-term effect was the prolonged divi- U.S. intromission in this oil-rich country, Betancourt +sion of Germany. The Western Allies had confronted the contributed in enduring ways to the institutionaliza- +Soviets and had maintained their commitments without tion of Venezuelan democracy. +having to resort to armed action. The blockade also Born in the town of Guatire in the state of Miranda +proved damaging to world opinion of the Soviet Union. to a family of modest means, he starting working at +Berlin, long perceived as a bastion of German-Prussian 14 years of age to put himself through high school, +militarism, had been transformed into a symbol of free- college, and law school. In 1928 he participated in stu- +dom. The allied presence in Berlin would be the source dent protests against the dictatorship of Juan Vicente +of almost constant difficulty for the East German state, Gómez, events marking him as a leading member of +as it provided an enclave of Western liberalism and eco- the “Generation of 28” dedicated to democratization +nomic prosperity that was a constant source of entice- and social reform. After being jailed by the Gómez +ment for the citizens of the communist state. 
West Berlin regime he went into exile and became active in various +would be a popular destination for East German emi- leftist political groups, including the Communist Party +grants over the course of the next decade, their massive of Costa Rica. +flight from the east stopped only by the erection of the At age 23 he penned the Plan of Barranquilla, a +Berlin Wall in 1961. Marxist-inspired document outlining his vision of +See also cold war. his homeland’s political future. After Gómez’s death +in 1936, he returned clandestinely to Venezuela and +Further reading: Eisenberg, Carolyn. Drawing the Line: became engaged in political activity against the mili- +The American Decision to Divide Germany, 1944–1949. tary regime. In 1940 he went into exile in Chile, where +New York: Cambridge University Press, 1996; Gaddis, he published Venezuelan Problems (Problemas Vene- +John Lewis. The Cold War: A New History. New York: zolanos). A year later he returned to Venezuela and +Penguin Press, 2005; Haydock, Michael. City Under Siege: founded AD, gathering around him a team commit- +The Berlin Blockade and Airlift, 1948–1949. Washington, ted to reform that formed the nucleus of the party and +D.C.: Brassey’s, 1999; Large, David Clay. Berlin. Berlin: skillfully using the press and other media to dissemi- +Basic Books, 2000; Parrish, Thomas. Berlin in the Bal- nate his ideas. +ance, 1945–1949: The Blockade, Airlift, the First Major On October 19, 1945, a coalition of AD reformers +Battle of the Cold War. Reading, MA: Addison-Wesley, 1999; and disgruntled army officers overthrew the military +Trachtenberg, Marc. A Constructed Peace: The Making of regime and installed Betancourt as president of a provi- +the European Settlement, 1945–1963. Princeton, NJ: Princ- sional government. During his first presidency (1945– +eton University Press, 1999. 48), Betancourt’s government instituted a wide range +of political, economic, and social reforms, including +Nicholas J. 
Schlosser universal suffrage; mechanisms for free and fair elec- +tions; an accord with foreign oil companies that guar- +anteed a reasonable profit, decent wages, and ensured +Betancourt, Rómulo +labor peace; agrarian reform; expansion of public edu- +(1908–1981) Venezuelan president cation and public health facilities; and related initia- +tives. Declining to run for a second successive term, in +One of the leading figures of 20th-century Venezuelan 1948 he transferred power to his successor, the novel- +history, Rómulo Betancourt is generally credited with ist and activist Rómulo Gallegos. Later that year, in +playing a pivotal role in helping to establish viable and December, the military in collusion with conservative +sustainable democratic institutions in Venezuela that elements overthrew the Gallegos government, ruling +endured from his second presidency (1959–64) to the Venezuela for the next 10 years under General Marcos +2000s. A moderate social reformer and forerunner of Pérez Jiménez. +latter-day Venezuelan president Hugo Chávez in his In 1958 a resurgent coalition of reformers and +advocacy of populist social democracy focusing on the army officers overthrew the Jiménez regime, installing +needs of the poor, Betancourt founded the political party a democratic AD-dominated government, with Betan- +Democratic Action (Acción Democrática, AD) in 1941, court again as president, which broadened and deep- +which would play a major role in subsequent Venezu- ened the reforms of the 1940s. Since 1958 Venezuela +elan political life. Threading a difficult line between the has been ruled by a succession of democratically elect- +far Left, the far Right, and the omnipresent specter of ed governments. 
Surviving an assassination attempt \ No newline at end of file diff --git a/scripts/Fetching trending stocks using nlp/data/ind_nifty500list.csv b/scripts/Fetching trending stocks using nlp/data/ind_nifty500list.csv new file mode 100644 index 0000000..0ef065f --- /dev/null +++ b/scripts/Fetching trending stocks using nlp/data/ind_nifty500list.csv @@ -0,0 +1,502 @@ +Company Name,Industry,Symbol,Series,ISIN Code +3M India Ltd.,CONSUMER GOODS,3MINDIA,EQ,INE470A01017 +ABB India Ltd.,INDUSTRIAL MANUFACTURING,ABB,EQ,INE117A01022 +ABB Power Products and Systems India Ltd.,INDUSTRIAL MANUFACTURING,POWERINDIA,EQ,INE07Y701011 +ACC Ltd.,CEMENT & CEMENT PRODUCTS,ACC,EQ,INE012A01025 +AIA Engineering Ltd.,INDUSTRIAL MANUFACTURING,AIAENG,EQ,INE212H01026 +APL Apollo Tubes Ltd.,METALS,APLAPOLLO,EQ,INE702C01027 +AU Small Finance Bank Ltd.,FINANCIAL SERVICES,AUBANK,EQ,INE949L01017 +Aarti Drugs Ltd.,PHARMA,AARTIDRUGS,EQ,INE767A01016 +Aarti Industries Ltd.,CHEMICALS,AARTIIND,EQ,INE769A01020 +Aavas Financiers Ltd.,FINANCIAL SERVICES,AAVAS,EQ,INE216P01012 +Abbott India Ltd.,PHARMA,ABBOTINDIA,EQ,INE358A01014 +Adani Enterprises Ltd.,METALS,ADANIENT,EQ,INE423A01024 +Adani Green Energy Ltd.,POWER,ADANIGREEN,EQ,INE364U01010 +Adani Ports and Special Economic Zone Ltd.,SERVICES,ADANIPORTS,EQ,INE742F01042 +Adani Total Gas Ltd.,OIL & GAS,ATGL,BE,INE399L01023 +Adani Transmission Ltd.,POWER,ADANITRANS,BE,INE931S01010 +Aditya Birla Capital Ltd.,FINANCIAL SERVICES,ABCAPITAL,EQ,INE674K01013 +Aditya Birla Fashion and Retail Ltd.,CONSUMER SERVICES,ABFRL,EQ,INE647O01011 +Advanced Enzyme Tech Ltd.,CONSUMER GOODS,ADVENZYMES,EQ,INE837H01020 +Aegis Logistics Ltd.,SERVICES,AEGISCHEM,EQ,INE208C01025 +Affle (India) Ltd.,IT,AFFLE,EQ,INE00WC01019 +Ajanta Pharmaceuticals Ltd.,PHARMA,AJANTPHARM,EQ,INE031B01049 +Akzo Nobel India Ltd.,CONSUMER GOODS,AKZOINDIA,EQ,INE133A01011 +Alembic Ltd.,PHARMA,ALEMBICLTD,EQ,INE426A01027 +Alembic Pharmaceuticals Ltd.,PHARMA,APLLTD,EQ,INE901L01018 +Alkem Laboratories 
Ltd.,PHARMA,ALKEM,EQ,INE540L01014 +Alkyl Amines Chemicals Ltd.,CHEMICALS,ALKYLAMINE,EQ,INE150B01039 +Alok Industries Ltd.,TEXTILES,ALOKINDS,EQ,INE270A01029 +Amara Raja Batteries Ltd.,AUTOMOBILE,AMARAJABAT,EQ,INE885A01032 +Amber Enterprises India Ltd.,CONSUMER GOODS,AMBER,EQ,INE371P01015 +Ambuja Cements Ltd.,CEMENT & CEMENT PRODUCTS,AMBUJACEM,EQ,INE079A01024 +Angel Broking Ltd.,FINANCIAL SERVICES,ANGELBRKG,EQ,INE732I01013 +Apollo Hospitals Enterprise Ltd.,HEALTHCARE SERVICES,APOLLOHOSP,EQ,INE437A01024 +Apollo Tyres Ltd.,AUTOMOBILE,APOLLOTYRE,EQ,INE438A01022 +Asahi India Glass Ltd.,AUTOMOBILE,ASAHIINDIA,EQ,INE439A01020 +Ashok Leyland Ltd.,AUTOMOBILE,ASHOKLEY,EQ,INE208A01029 +Ashoka Buildcon Ltd.,CONSTRUCTION,ASHOKA,EQ,INE442H01029 +Asian Paints Ltd.,CONSUMER GOODS,ASIANPAINT,EQ,INE021A01026 +Aster DM Healthcare Ltd.,HEALTHCARE SERVICES,ASTERDM,EQ,INE914M01019 +AstraZenca Pharma India Ltd.,PHARMA,ASTRAZEN,EQ,INE203A01020 +Astral Ltd.,INDUSTRIAL MANUFACTURING,ASTRAL,EQ,INE006I01046 +Atul Ltd.,CHEMICALS,ATUL,EQ,INE100A01010 +Aurobindo Pharma Ltd.,PHARMA,AUROPHARMA,EQ,INE406A01037 +Avanti Feeds Ltd.,CONSUMER GOODS,AVANTIFEED,EQ,INE871C01038 +Avenue Supermarts Ltd.,CONSUMER SERVICES,DMART,EQ,INE192R01011 +Axis Bank Ltd.,FINANCIAL SERVICES,AXISBANK,EQ,INE238A01034 +BASF India Ltd.,CHEMICALS,BASF,EQ,INE373A01013 +BEML Ltd.,INDUSTRIAL MANUFACTURING,BEML,EQ,INE258A01016 +BSE Ltd.,FINANCIAL SERVICES,BSE,EQ,INE118H01025 +Bajaj Auto Ltd.,AUTOMOBILE,BAJAJ-AUTO,EQ,INE917I01010 +Bajaj Consumer Care Ltd.,CONSUMER GOODS,BAJAJCON,EQ,INE933K01021 +Bajaj Electricals Ltd,CONSUMER GOODS,BAJAJELEC,EQ,INE193E01025 +Bajaj Finance Ltd.,FINANCIAL SERVICES,BAJFINANCE,EQ,INE296A01024 +Bajaj Finserv Ltd.,FINANCIAL SERVICES,BAJAJFINSV,EQ,INE918I01018 +Bajaj Holdings & Investment Ltd.,FINANCIAL SERVICES,BAJAJHLDNG,EQ,INE118A01012 +Balaji Amines Ltd.,CHEMICALS,BALAMINES,EQ,INE050E01027 +Balkrishna Industries Ltd.,AUTOMOBILE,BALKRISIND,EQ,INE787D01026 +Balmer Lawrie & Co. 
Ltd.,INDUSTRIAL MANUFACTURING,BALMLAWRIE,EQ,INE164A01016 +Balrampur Chini Mills Ltd.,CONSUMER GOODS,BALRAMCHIN,EQ,INE119A01028 +Bandhan Bank Ltd.,FINANCIAL SERVICES,BANDHANBNK,EQ,INE545U01014 +Bank of Baroda,FINANCIAL SERVICES,BANKBARODA,EQ,INE028A01039 +Bank of India,FINANCIAL SERVICES,BANKINDIA,EQ,INE084A01016 +Bank of Maharashtra.,FINANCIAL SERVICES,MAHABANK,EQ,INE457A01014 +Bata India Ltd.,CONSUMER GOODS,BATAINDIA,EQ,INE176A01028 +Bayer Cropscience Ltd.,FERTILISERS & PESTICIDES,BAYERCROP,EQ,INE462A01022 +Berger Paints India Ltd.,CONSUMER GOODS,BERGEPAINT,EQ,INE463A01038 +Bharat Dynamics Ltd.,INDUSTRIAL MANUFACTURING,BDL,EQ,INE171Z01018 +Bharat Electronics Ltd.,INDUSTRIAL MANUFACTURING,BEL,EQ,INE263A01024 +Bharat Forge Ltd.,INDUSTRIAL MANUFACTURING,BHARATFORG,EQ,INE465A01025 +Bharat Heavy Electricals Ltd.,INDUSTRIAL MANUFACTURING,BHEL,EQ,INE257A01026 +Bharat Petroleum Corporation Ltd.,OIL & GAS,BPCL,EQ,INE029A01011 +Bharat Rasayan Ltd.,FERTILISERS & PESTICIDES,BHARATRAS,EQ,INE838B01013 +Bharti Airtel Ltd.,TELECOM,BHARTIARTL,EQ,INE397D01024 +Biocon Ltd.,PHARMA,BIOCON,EQ,INE376G01013 +Birla Corporation Ltd.,CEMENT & CEMENT PRODUCTS,BIRLACORPN,EQ,INE340A01012 +Birlasoft Ltd.,IT,BSOFT,EQ,INE836A01035 +Bliss GVS Pharma Ltd.,PHARMA,BLISSGVS,EQ,INE416D01022 +Blue Dart Express Ltd.,SERVICES,BLUEDART,EQ,INE233B01017 +Blue Star Ltd.,CONSUMER GOODS,BLUESTARCO,EQ,INE472A01039 +Bombay Burmah Trading Corporation Ltd.,CONSUMER GOODS,BBTC,EQ,INE050A01025 +Bosch Ltd.,AUTOMOBILE,BOSCHLTD,EQ,INE323A01026 +Brigade Enterprises Ltd.,CONSTRUCTION,BRIGADE,EQ,INE791I01019 +Britannia Industries Ltd.,CONSUMER GOODS,BRITANNIA,EQ,INE216A01030 +Burger King India Ltd.,CONSUMER SERVICES,BURGERKING,EQ,INE07T201019 +CCL Products (I) Ltd.,CONSUMER GOODS,CCL,EQ,INE421D01022 +CESC Ltd.,POWER,CESC,EQ,INE486A01013 +CRISIL Ltd.,FINANCIAL SERVICES,CRISIL,EQ,INE007A01025 +CSB Bank Ltd.,FINANCIAL SERVICES,CSBBANK,EQ,INE679A01013 +Cadila Healthcare Ltd.,PHARMA,CADILAHC,EQ,INE010B01027 +Can Fin Homes 
Ltd.,FINANCIAL SERVICES,CANFINHOME,EQ,INE477A01020 +Canara Bank,FINANCIAL SERVICES,CANBK,EQ,INE476A01014 +Caplin Point Laboratories Ltd.,PHARMA,CAPLIPOINT,EQ,INE475E01026 +Capri Global Capital Ltd.,FINANCIAL SERVICES,CGCL,EQ,INE180C01026 +Carborundum Universal Ltd.,INDUSTRIAL MANUFACTURING,CARBORUNIV,EQ,INE120A01034 +Castrol India Ltd.,OIL & GAS,CASTROLIND,EQ,INE172A01027 +Ceat Ltd.,AUTOMOBILE,CEATLTD,EQ,INE482A01020 +Central Bank of India,FINANCIAL SERVICES,CENTRALBK,EQ,INE483A01010 +Central Depository Services (India) Ltd.,FINANCIAL SERVICES,CDSL,BE,INE736A01011 +Century Plyboards (India) Ltd.,CONSUMER GOODS,CENTURYPLY,EQ,INE348B01021 +Century Textile & Industries Ltd.,PAPER AND JUTE,CENTURYTEX,EQ,INE055A01016 +Cera Sanitaryware Ltd,CONSUMER GOODS,CERA,EQ,INE739E01017 +Chalet Hotels Ltd.,CONSUMER SERVICES,CHALET,EQ,INE427F01016 +Chambal Fertilizers & Chemicals Ltd.,FERTILISERS & PESTICIDES,CHAMBLFERT,EQ,INE085A01013 +Cholamandalam Financial Holdings Ltd.,FINANCIAL SERVICES,CHOLAHLDNG,EQ,INE149A01033 +Cholamandalam Investment and Finance Company Ltd.,FINANCIAL SERVICES,CHOLAFIN,EQ,INE121A01024 +Cipla Ltd.,PHARMA,CIPLA,EQ,INE059A01026 +City Union Bank Ltd.,FINANCIAL SERVICES,CUB,EQ,INE491A01021 +Coal India Ltd.,METALS,COALINDIA,EQ,INE522F01014 +Cochin Shipyard Ltd.,INDUSTRIAL MANUFACTURING,COCHINSHIP,EQ,INE704P01017 +Coforge Ltd.,IT,COFORGE,EQ,INE591G01017 +Colgate Palmolive (India) Ltd.,CONSUMER GOODS,COLPAL,EQ,INE259A01022 +Computer Age Management Services Ltd.,FINANCIAL SERVICES,CAMS,EQ,INE596I01012 +Container Corporation of India Ltd.,SERVICES,CONCOR,EQ,INE111A01025 +Coromandel International Ltd.,FERTILISERS & PESTICIDES,COROMANDEL,EQ,INE169A01031 +CreditAccess Grameen Ltd.,FINANCIAL SERVICES,CREDITACC,EQ,INE741K01010 +Crompton Greaves Consumer Electricals Ltd.,CONSUMER GOODS,CROMPTON,EQ,INE299U01018 +Cummins India Ltd.,INDUSTRIAL MANUFACTURING,CUMMINSIND,EQ,INE298A01020 +Cyient Ltd.,IT,CYIENT,EQ,INE136B01020 +DCB Bank Ltd.,FINANCIAL 
SERVICES,DCBBANK,EQ,INE503A01015 +DCM Shriram Ltd.,CONSUMER GOODS,DCMSHRIRAM,EQ,INE499A01024 +DLF Ltd.,CONSTRUCTION,DLF,EQ,INE271C01023 +Dabur India Ltd.,CONSUMER GOODS,DABUR,EQ,INE016A01026 +Dalmia Bharat Ltd.,CEMENT & CEMENT PRODUCTS,DALBHARAT,EQ,INE00R701025 +Deepak Nitrite Ltd.,CHEMICALS,DEEPAKNTR,EQ,INE288B01029 +Delta Corp Ltd.,CONSUMER SERVICES,DELTACORP,EQ,INE124G01033 +Dhani Services Ltd.,FINANCIAL SERVICES,DHANI,EQ,INE274G01010 +Dhanuka Agritech Ltd.,FERTILISERS & PESTICIDES,DHANUKA,EQ,INE435G01025 +Dilip Buildcon Ltd.,CONSTRUCTION,DBL,EQ,INE917M01012 +Dish TV India Ltd.,MEDIA ENTERTAINMENT & PUBLICATION,DISHTV,EQ,INE836F01026 +Dishman Carbogen Amcis Ltd.,PHARMA,DCAL,EQ,INE385W01011 +Divi's Laboratories Ltd.,PHARMA,DIVISLAB,EQ,INE361B01024 +Dixon Technologies (India) Ltd.,CONSUMER GOODS,DIXON,EQ,INE935N01020 +Dr. Lal Path Labs Ltd.,HEALTHCARE SERVICES,LALPATHLAB,EQ,INE600L01024 +Dr. Reddy's Laboratories Ltd.,PHARMA,DRREDDY,EQ,INE089A01023 +E.I.D. Parry (India) Ltd.,CONSUMER GOODS,EIDPARRY,EQ,INE126A01031 +EIH Ltd.,CONSUMER SERVICES,EIHOTEL,EQ,INE230A01023 +EPL Ltd.,INDUSTRIAL MANUFACTURING,EPL,EQ,INE255A01020 +Edelweiss Financial Services Ltd.,FINANCIAL SERVICES,EDELWEISS,EQ,INE532F01054 +Eicher Motors Ltd.,AUTOMOBILE,EICHERMOT,EQ,INE066A01021 +Elgi Equipments Ltd.,INDUSTRIAL MANUFACTURING,ELGIEQUIP,EQ,INE285A01027 +Emami Ltd.,CONSUMER GOODS,EMAMILTD,EQ,INE548C01032 +Endurance Technologies Ltd.,AUTOMOBILE,ENDURANCE,EQ,INE913H01037 +Engineers India Ltd.,CONSTRUCTION,ENGINERSIN,EQ,INE510A01028 +Equitas Holdings Ltd.,FINANCIAL SERVICES,EQUITAS,EQ,INE988K01017 +Eris Lifesciences Ltd.,PHARMA,ERIS,EQ,INE406M01024 +Escorts Ltd.,AUTOMOBILE,ESCORTS,EQ,INE042A01014 +Exide Industries Ltd.,AUTOMOBILE,EXIDEIND,EQ,INE302A01020 +FDC Ltd.,PHARMA,FDC,EQ,INE258B01022 +Federal Bank Ltd.,FINANCIAL SERVICES,FEDERALBNK,EQ,INE171A01029 +Fine Organic Industries Ltd.,CHEMICALS,FINEORG,EQ,INE686Y01026 +Finolex Cables Ltd.,INDUSTRIAL MANUFACTURING,FINCABLES,EQ,INE235A01022 +Finolex 
Industries Ltd.,INDUSTRIAL MANUFACTURING,FINPIPE,EQ,INE183A01024 +Firstsource Solutions Ltd.,IT,FSL,EQ,INE684F01012 +Fortis Healthcare Ltd.,HEALTHCARE SERVICES,FORTIS,EQ,INE061F01013 +Future Consumer Ltd.,CONSUMER SERVICES,FCONSUMER,EQ,INE220J01025 +Future Retail Ltd.,CONSUMER SERVICES,FRETAIL,EQ,INE752P01024 +GAIL (India) Ltd.,OIL & GAS,GAIL,EQ,INE129A01019 +GE Power India Ltd.,INDUSTRIAL MANUFACTURING,GEPIL,EQ,INE878A01011 +GMM Pfaudler Ltd.,INDUSTRIAL MANUFACTURING,GMMPFAUDLR,EQ,INE541A01023 +GMR Infrastructure Ltd.,CONSTRUCTION,GMRINFRA,EQ,INE776C01039 +Galaxy Surfactants Ltd.,CHEMICALS,GALAXYSURF,EQ,INE600K01018 +Garden Reach Shipbuilders & Engineers Ltd.,INDUSTRIAL MANUFACTURING,GRSE,EQ,INE382Z01011 +Garware Technical Fibres Ltd.,TEXTILES,GARFIBRES,EQ,INE276A01018 +General Insurance Corporation of India,FINANCIAL SERVICES,GICRE,EQ,INE481Y01014 +Gillette India Ltd.,CONSUMER GOODS,GILLETTE,EQ,INE322A01010 +Gland Pharma Ltd.,PHARMA,GLAND,EQ,INE068V01023 +Glaxosmithkline Pharmaceuticals Ltd.,PHARMA,GLAXO,EQ,INE159A01016 +Glenmark Pharmaceuticals Ltd.,PHARMA,GLENMARK,EQ,INE935A01035 +Godfrey Phillips India Ltd.,CONSUMER GOODS,GODFRYPHLP,EQ,INE260B01028 +Godrej Agrovet Ltd.,CONSUMER GOODS,GODREJAGRO,EQ,INE850D01014 +Godrej Consumer Products Ltd.,CONSUMER GOODS,GODREJCP,EQ,INE102D01028 +Godrej Industries Ltd.,CONSUMER GOODS,GODREJIND,EQ,INE233A01035 +Godrej Properties Ltd.,CONSTRUCTION,GODREJPROP,EQ,INE484J01027 +Granules India Ltd.,PHARMA,GRANULES,EQ,INE101D01020 +Graphite India Ltd.,INDUSTRIAL MANUFACTURING,GRAPHITE,EQ,INE371A01025 +Grasim Industries Ltd.,CEMENT & CEMENT PRODUCTS,GRASIM,EQ,INE047A01021 +Great Eastern Shipping Co. 
Ltd.,SERVICES,GESHIP,EQ,INE017A01032 +Greaves Cotton Ltd.,INDUSTRIAL MANUFACTURING,GREAVESCOT,EQ,INE224A01026 +Grindwell Norton Ltd.,INDUSTRIAL MANUFACTURING,GRINDWELL,EQ,INE536A01023 +Gujarat Alkalies & Chemicals Ltd.,CHEMICALS,GUJALKALI,EQ,INE186A01019 +Gujarat Ambuja Exports Ltd.,CONSUMER GOODS,GAEL,EQ,INE036B01030 +Gujarat Fluorochemicals Ltd.,CHEMICALS,FLUOROCHEM,EQ,INE09N301011 +Gujarat Gas Ltd.,OIL & GAS,GUJGASLTD,EQ,INE844O01030 +Gujarat Narmada Valley Fertilizers and Chemicals Ltd.,CHEMICALS,GNFC,EQ,INE113A01013 +Gujarat Pipavav Port Ltd.,SERVICES,GPPL,EQ,INE517F01014 +Gujarat State Fertilizers & Chemicals Ltd.,FERTILISERS & PESTICIDES,GSFC,EQ,INE026A01025 +Gujarat State Petronet Ltd.,OIL & GAS,GSPL,EQ,INE246F01010 +Gulf Oil Lubricants India Ltd.,OIL & GAS,GULFOILLUB,EQ,INE635Q01029 +H.E.G. Ltd.,INDUSTRIAL MANUFACTURING,HEG,EQ,INE545A01016 +HCL Technologies Ltd.,IT,HCLTECH,EQ,INE860A01027 +HDFC Asset Management Company Ltd.,FINANCIAL SERVICES,HDFCAMC,EQ,INE127D01025 +HDFC Bank Ltd.,FINANCIAL SERVICES,HDFCBANK,EQ,INE040A01034 +HDFC Life Insurance Company Ltd.,FINANCIAL SERVICES,HDFCLIFE,EQ,INE795G01014 +HFCL Ltd.,TELECOM,HFCL,BE,INE548A01028 +Happiest Minds Technologies Ltd.,IT,HAPPSTMNDS,EQ,INE419U01012 +Hatsun Agro Product Ltd.,CONSUMER GOODS,HATSUN,EQ,INE473B01035 +Havells India Ltd.,CONSUMER GOODS,HAVELLS,EQ,INE176B01034 +HeidelbergCement India Ltd.,CEMENT & CEMENT PRODUCTS,HEIDELBERG,EQ,INE578A01017 +Hemisphere Properties India Ltd.,CONSTRUCTION,HEMIPROP,EQ,INE0AJG01018 +Hero MotoCorp Ltd.,AUTOMOBILE,HEROMOTOCO,EQ,INE158A01026 +Himadri Speciality Chemical Ltd.,CHEMICALS,HSCL,EQ,INE019C01026 +Hindalco Industries Ltd.,METALS,HINDALCO,EQ,INE038A01020 +Hindustan Aeronautics Ltd.,INDUSTRIAL MANUFACTURING,HAL,EQ,INE066F01012 +Hindustan Copper Ltd.,METALS,HINDCOPPER,EQ,INE531E01026 +Hindustan Petroleum Corporation Ltd.,OIL & GAS,HINDPETRO,EQ,INE094A01015 +Hindustan Unilever Ltd.,CONSUMER GOODS,HINDUNILVR,EQ,INE030A01027 +Hindustan Zinc 
Ltd.,METALS,HINDZINC,EQ,INE267A01025 +Honeywell Automation India Ltd.,INDUSTRIAL MANUFACTURING,HONAUT,EQ,INE671A01010 +Housing & Urban Development Corporation Ltd.,FINANCIAL SERVICES,HUDCO,EQ,INE031A01017 +Housing Development Finance Corporation Ltd.,FINANCIAL SERVICES,HDFC,EQ,INE001A01036 +Huhtamaki India Ltd.,INDUSTRIAL MANUFACTURING,HUHTAMAKI,EQ,INE275B01026 +ICICI Bank Ltd.,FINANCIAL SERVICES,ICICIBANK,EQ,INE090A01021 +ICICI Lombard General Insurance Company Ltd.,FINANCIAL SERVICES,ICICIGI,EQ,INE765G01017 +ICICI Prudential Life Insurance Company Ltd.,FINANCIAL SERVICES,ICICIPRULI,EQ,INE726G01019 +ICICI Securities Ltd.,FINANCIAL SERVICES,ISEC,EQ,INE763G01038 +IDBI Bank Ltd.,FINANCIAL SERVICES,IDBI,EQ,INE008A01015 +IDFC First Bank Ltd.,FINANCIAL SERVICES,IDFCFIRSTB,EQ,INE092T01019 +IDFC Ltd.,FINANCIAL SERVICES,IDFC,EQ,INE043D01016 +IFB Industries Ltd.,CONSUMER GOODS,IFBIND,EQ,INE559A01017 +IIFL Finance Ltd.,FINANCIAL SERVICES,IIFL,EQ,INE530B01024 +IIFL Wealth Management Ltd.,FINANCIAL SERVICES,IIFLWAM,EQ,INE466L01020 +IOL Chem and Pharma Ltd.,PHARMA,IOLCP,EQ,INE485C01011 +IRB Infrastructure Developers Ltd.,CONSTRUCTION,IRB,EQ,INE821I01014 +IRCON International Ltd.,CONSTRUCTION,IRCON,EQ,INE962Y01021 +ITC Ltd.,CONSUMER GOODS,ITC,EQ,INE154A01025 +ITI Ltd.,TELECOM,ITI,EQ,INE248A01017 +India Cements Ltd.,CEMENT & CEMENT PRODUCTS,INDIACEM,EQ,INE383A01012 +Indiabulls Housing Finance Ltd.,FINANCIAL SERVICES,IBULHSGFIN,EQ,INE148I01020 +Indiabulls Real Estate Ltd.,CONSTRUCTION,IBREALEST,EQ,INE069I01010 +Indiamart Intermesh Ltd.,CONSUMER SERVICES,INDIAMART,EQ,INE933S01016 +Indian Bank,FINANCIAL SERVICES,INDIANB,EQ,INE562A01011 +Indian Energy Exchange Ltd.,FINANCIAL SERVICES,IEX,EQ,INE022Q01020 +Indian Hotels Co. 
Ltd.,CONSUMER SERVICES,INDHOTEL,EQ,INE053A01029 +Indian Oil Corporation Ltd.,OIL & GAS,IOC,EQ,INE242A01010 +Indian Overseas Bank,FINANCIAL SERVICES,IOB,EQ,INE565A01014 +Indian Railway Catering And Tourism Corporation Ltd.,SERVICES,IRCTC,EQ,INE335Y01012 +Indo Count Industries Ltd.,TEXTILES,ICIL,EQ,INE483B01026 +Indoco Remedies Ltd.,PHARMA,INDOCO,EQ,INE873D01024 +Indraprastha Gas Ltd.,OIL & GAS,IGL,EQ,INE203G01027 +Indus Towers Ltd.,TELECOM,INDUSTOWER,EQ,INE121J01017 +IndusInd Bank Ltd.,FINANCIAL SERVICES,INDUSINDBK,EQ,INE095A01012 +Infibeam Avenues Ltd.,IT,INFIBEAM,EQ,INE483S01020 +Info Edge (India) Ltd.,CONSUMER SERVICES,NAUKRI,EQ,INE663F01024 +Infosys Ltd.,IT,INFY,EQ,INE009A01021 +Ingersoll Rand (India) Ltd.,INDUSTRIAL MANUFACTURING,INGERRAND,EQ,INE177A01018 +Inox Leisure Ltd.,MEDIA ENTERTAINMENT & PUBLICATION,INOXLEISUR,EQ,INE312H01016 +Intellect Design Arena Ltd.,IT,INTELLECT,EQ,INE306R01017 +InterGlobe Aviation Ltd.,SERVICES,INDIGO,EQ,INE646L01027 +Ipca Laboratories Ltd.,PHARMA,IPCALAB,EQ,INE571A01020 +J.B. Chemicals & Pharmaceuticals Ltd.,PHARMA,JBCHEPHARM,EQ,INE572A01028 +J.K. 
Cement Ltd.,CEMENT & CEMENT PRODUCTS,JKCEMENT,EQ,INE823G01014 +JK Lakshmi Cement Ltd.,CEMENT & CEMENT PRODUCTS,JKLAKSHMI,EQ,INE786A01032 +JK Paper Ltd.,PAPER AND JUTE,JKPAPER,EQ,INE789E01012 +JK Tyre & Industries Ltd.,AUTOMOBILE,JKTYRE,EQ,INE573A01042 +JM Financial Ltd.,FINANCIAL SERVICES,JMFINANCIL,EQ,INE780C01023 +JSW Energy Ltd.,POWER,JSWENERGY,BE,INE121E01018 +JSW Steel Ltd.,METALS,JSWSTEEL,EQ,INE019A01038 +JTEKT India Ltd.,AUTOMOBILE,JTEKTINDIA,EQ,INE643A01035 +Jamna Auto Industries Ltd.,AUTOMOBILE,JAMNAAUTO,EQ,INE039C01032 +Jindal Saw Ltd.,METALS,JINDALSAW,EQ,INE324A01024 +Jindal Stainless (Hisar) Ltd.,METALS,JSLHISAR,EQ,INE455T01018 +Jindal Stainless Ltd.,METALS,JSL,EQ,INE220G01021 +Jindal Steel & Power Ltd.,METALS,JINDALSTEL,EQ,INE749A01030 +Johnson Controls - Hitachi Air Conditioning India Ltd.,CONSUMER GOODS,JCHAC,EQ,INE782A01015 +Jubilant Foodworks Ltd.,CONSUMER SERVICES,JUBLFOOD,EQ,INE797F01012 +Justdial Ltd.,CONSUMER SERVICES,JUSTDIAL,EQ,INE599M01018 +Jyothy Labs Ltd.,CONSUMER GOODS,JYOTHYLAB,EQ,INE668F01031 +K.P.R. 
Mill Ltd.,TEXTILES,KPRMILL,EQ,INE930H01023 +KEI Industries Ltd.,INDUSTRIAL MANUFACTURING,KEI,EQ,INE878B01027 +KNR Constructions Ltd.,CONSTRUCTION,KNRCON,EQ,INE634I01029 +KPIT Technologies Ltd.,IT,KPITTECH,EQ,INE04I401011 +KRBL Ltd.,CONSUMER GOODS,KRBL,EQ,INE001B01026 +KSB Ltd.,INDUSTRIAL MANUFACTURING,KSB,EQ,INE999A01015 +Kajaria Ceramics Ltd.,CONSUMER GOODS,KAJARIACER,EQ,INE217B01036 +Kalpataru Power Transmission Ltd.,POWER,KALPATPOWR,EQ,INE220B01022 +Kansai Nerolac Paints Ltd.,CONSUMER GOODS,KANSAINER,EQ,INE531A01024 +Karur Vysya Bank Ltd.,FINANCIAL SERVICES,KARURVYSYA,EQ,INE036D01028 +Kaveri Seed Company Ltd.,CONSUMER GOODS,KSCL,EQ,INE455I01029 +Kec International Ltd.,POWER,KEC,EQ,INE389H01022 +Kotak Mahindra Bank Ltd.,FINANCIAL SERVICES,KOTAKBANK,EQ,INE237A01028 +L&T Finance Holdings Ltd.,FINANCIAL SERVICES,L&TFH,EQ,INE498L01015 +L&T Technology Services Ltd.,IT,LTTS,EQ,INE010V01017 +LIC Housing Finance Ltd.,FINANCIAL SERVICES,LICHSGFIN,EQ,INE115A01026 +La Opala RG Ltd.,CONSUMER GOODS,LAOPALA,EQ,INE059D01020 +Lakshmi Machine Works Ltd.,INDUSTRIAL MANUFACTURING,LAXMIMACH,EQ,INE269B01029 +Larsen & Toubro Infotech Ltd.,IT,LTI,EQ,INE214T01019 +Larsen & Toubro Ltd.,CONSTRUCTION,LT,EQ,INE018A01030 +Laurus Labs Ltd.,PHARMA,LAURUSLABS,EQ,INE947Q01028 +Lemon Tree Hotels Ltd.,CONSUMER SERVICES,LEMONTREE,EQ,INE970X01018 +Linde India Ltd.,CHEMICALS,LINDEINDIA,EQ,INE473A01011 +Lupin Ltd.,PHARMA,LUPIN,EQ,INE326A01037 +Lux Industries Ltd.,TEXTILES,LUXIND,EQ,INE150G01020 +MAS Financial Services Ltd.,FINANCIAL SERVICES,MASFIN,EQ,INE348L01012 +MMTC Ltd.,SERVICES,MMTC,EQ,INE123F01029 +MOIL Ltd.,METALS,MOIL,EQ,INE490G01020 +MRF Ltd.,AUTOMOBILE,MRF,EQ,INE883A01011 +Mahanagar Gas Ltd.,OIL & GAS,MGL,EQ,INE002S01010 +Maharashtra Scooters Ltd.,FINANCIAL SERVICES,MAHSCOOTER,EQ,INE288A01013 +Maharashtra Seamless Ltd.,METALS,MAHSEAMLES,EQ,INE271B01025 +Mahindra & Mahindra Financial Services Ltd.,FINANCIAL SERVICES,M&MFIN,EQ,INE774D01024 +Mahindra & Mahindra 
Ltd.,AUTOMOBILE,M&M,EQ,INE101A01026 +Mahindra CIE Automotive Ltd.,INDUSTRIAL MANUFACTURING,MAHINDCIE,EQ,INE536H01010 +Mahindra Holidays & Resorts India Ltd.,CONSUMER SERVICES,MHRIL,EQ,INE998I01010 +Mahindra Logistics Ltd.,SERVICES,MAHLOG,EQ,INE766P01016 +Manappuram Finance Ltd.,FINANCIAL SERVICES,MANAPPURAM,EQ,INE522D01027 +Mangalore Refinery & Petrochemicals Ltd.,OIL & GAS,MRPL,EQ,INE103A01014 +Marico Ltd.,CONSUMER GOODS,MARICO,EQ,INE196A01026 +Maruti Suzuki India Ltd.,AUTOMOBILE,MARUTI,EQ,INE585B01010 +Max Financial Services Ltd.,FINANCIAL SERVICES,MFSL,EQ,INE180A01020 +Max Healthcare Institute Ltd.,HEALTHCARE SERVICES,MAXHEALTH,EQ,INE027H01010 +Mazagoan Dock Shipbuilders Ltd.,INDUSTRIAL MANUFACTURING,MAZDOCK,EQ,INE249Z01012 +Metropolis Healthcare Ltd.,HEALTHCARE SERVICES,METROPOLIS,EQ,INE112L01020 +MindTree Ltd.,IT,MINDTREE,EQ,INE018I01017 +Minda Corporation Ltd.,AUTOMOBILE,MINDACORP,EQ,INE842C01021 +Minda Industries Ltd.,AUTOMOBILE,MINDAIND,EQ,INE405E01023 +Mishra Dhatu Nigam Ltd.,METALS,MIDHANI,EQ,INE099Z01011 +Motilal Oswal Financial Services Ltd.,FINANCIAL SERVICES,MOTILALOFS,EQ,INE338I01027 +MphasiS Ltd.,IT,MPHASIS,EQ,INE356A01018 +Multi Commodity Exchange of India Ltd.,FINANCIAL SERVICES,MCX,EQ,INE745G01035 +Muthoot Finance Ltd.,FINANCIAL SERVICES,MUTHOOTFIN,EQ,INE414G01012 +NATCO Pharma Ltd.,PHARMA,NATCOPHARM,EQ,INE987B01026 +NBCC (India) Ltd.,CONSTRUCTION,NBCC,EQ,INE095N01031 +NCC Ltd.,CONSTRUCTION,NCC,EQ,INE868B01028 +NESCO Ltd.,SERVICES,NESCO,EQ,INE317F01035 +NHPC Ltd.,POWER,NHPC,EQ,INE848E01016 +NLC India Ltd.,POWER,NLCINDIA,EQ,INE589A01014 +NMDC Ltd.,METALS,NMDC,EQ,INE584A01023 +NOCIL Ltd.,CHEMICALS,NOCIL,EQ,INE163A01018 +NTPC Ltd.,POWER,NTPC,EQ,INE733E01010 +Narayana Hrudayalaya Ltd.,HEALTHCARE SERVICES,NH,EQ,INE410P01011 +National Aluminium Co. 
Ltd.,METALS,NATIONALUM,EQ,INE139A01034 +National Fertilizers Ltd.,FERTILISERS & PESTICIDES,NFL,EQ,INE870D01012 +Navin Fluorine International Ltd.,CHEMICALS,NAVINFLUOR,EQ,INE048G01026 +Nestle India Ltd.,CONSUMER GOODS,NESTLEIND,EQ,INE239A01016 +Network18 Media & Investments Ltd.,MEDIA ENTERTAINMENT & PUBLICATION,NETWORK18,EQ,INE870H01013 +Nilkamal Ltd.,INDUSTRIAL MANUFACTURING,NILKAMAL,EQ,INE310A01015 +Nippon Life India Asset Management Ltd.,FINANCIAL SERVICES,NAM-INDIA,EQ,INE298J01013 +Oberoi Realty Ltd.,CONSTRUCTION,OBEROIRLTY,EQ,INE093I01010 +Oil & Natural Gas Corporation Ltd.,OIL & GAS,ONGC,EQ,INE213A01029 +Oil India Ltd.,OIL & GAS,OIL,EQ,INE274J01014 +Oracle Financial Services Software Ltd.,IT,OFSS,EQ,INE881D01027 +Orient Electric Ltd.,CONSUMER GOODS,ORIENTELEC,EQ,INE142Z01019 +PI Industries Ltd.,FERTILISERS & PESTICIDES,PIIND,EQ,INE603J01030 +PNB Housing Finance Ltd.,FINANCIAL SERVICES,PNBHOUSING,EQ,INE572E01012 +PNC Infratech Ltd.,CONSTRUCTION,PNCINFRA,EQ,INE195J01029 +PVR Ltd.,MEDIA ENTERTAINMENT & PUBLICATION,PVR,EQ,INE191H01014 +Page Industries Ltd.,TEXTILES,PAGEIND,EQ,INE761H01022 +Persistent Systems Ltd.,IT,PERSISTENT,EQ,INE262H01013 +Petronet LNG Ltd.,OIL & GAS,PETRONET,EQ,INE347G01014 +Pfizer Ltd.,PHARMA,PFIZER,EQ,INE182A01018 +Phillips Carbon Black Ltd.,CHEMICALS,PHILIPCARB,EQ,INE602A01023 +Phoenix Mills Ltd.,CONSTRUCTION,PHOENIXLTD,EQ,INE211B01039 +Pidilite Industries Ltd.,CHEMICALS,PIDILITIND,EQ,INE318A01026 +Piramal Enterprises Ltd.,FINANCIAL SERVICES,PEL,EQ,INE140A01024 +Poly Medicure Ltd.,HEALTHCARE SERVICES,POLYMED,EQ,INE205C01021 +Polycab India Ltd.,INDUSTRIAL MANUFACTURING,POLYCAB,EQ,INE455K01017 +Polyplex Corporation Ltd.,INDUSTRIAL MANUFACTURING,POLYPLEX,EQ,INE633B01018 +Power Finance Corporation Ltd.,FINANCIAL SERVICES,PFC,EQ,INE134E01011 +Power Grid Corporation of India Ltd.,POWER,POWERGRID,EQ,INE752E01010 +Prestige Estates Projects Ltd.,CONSTRUCTION,PRESTIGE,EQ,INE811K01011 +Prince Pipes and Fittings Ltd.,INDUSTRIAL 
MANUFACTURING,PRINCEPIPE,EQ,INE689W01016 +Prism Johnson Ltd.,CEMENT & CEMENT PRODUCTS,PRSMJOHNSN,EQ,INE010A01011 +Procter & Gamble Health Ltd.,PHARMA,PGHL,EQ,INE199A01012 +Procter & Gamble Hygiene & Health Care Ltd.,CONSUMER GOODS,PGHH,EQ,INE179A01014 +Punjab National Bank,FINANCIAL SERVICES,PNB,EQ,INE160A01022 +Quess Corp Ltd.,SERVICES,QUESS,EQ,INE615P01015 +RBL Bank Ltd.,FINANCIAL SERVICES,RBLBANK,EQ,INE976G01028 +REC Ltd.,FINANCIAL SERVICES,RECLTD,EQ,INE020B01018 +RHI MAGNESITA INDIA LTD.,INDUSTRIAL MANUFACTURING,RHIM,EQ,INE743M01012 +RITES Ltd.,SERVICES,RITES,EQ,INE320J01015 +Radico Khaitan Ltd,CONSUMER GOODS,RADICO,EQ,INE944F01028 +Rail Vikas Nigam Ltd.,CONSTRUCTION,RVNL,EQ,INE415G01027 +Rain Industries Ltd,CHEMICALS,RAIN,EQ,INE855B01025 +Rajesh Exports Ltd.,CONSUMER GOODS,RAJESHEXPO,EQ,INE343B01030 +Rallis India Ltd.,FERTILISERS & PESTICIDES,RALLIS,EQ,INE613A01020 +Rashtriya Chemicals & Fertilizers Ltd.,FERTILISERS & PESTICIDES,RCF,EQ,INE027A01015 +Ratnamani Metals & Tubes Ltd.,METALS,RATNAMANI,EQ,INE703B01027 +Raymond Ltd.,TEXTILES,RAYMOND,EQ,INE301A01014 +Redington (India) Ltd.,SERVICES,REDINGTON,EQ,INE891D01026 +Relaxo Footwears Ltd.,CONSUMER GOODS,RELAXO,EQ,INE131B01039 +Reliance Industries Ltd.,OIL & GAS,RELIANCE,EQ,INE002A01018 +Responsive Industries Ltd.,CONSUMER GOODS,RESPONIND,EQ,INE688D01026 +Rossari Biotech Ltd.,CHEMICALS,ROSSARI,EQ,INE02A801020 +Route Mobile Ltd.,IT,ROUTE,EQ,INE450U01017 +SBI Cards and Payment Services Ltd.,FINANCIAL SERVICES,SBICARD,EQ,INE018E01016 +SBI Life Insurance Company Ltd.,FINANCIAL SERVICES,SBILIFE,EQ,INE123W01016 +SIS Ltd.,SERVICES,SIS,EQ,INE285J01028 +SJVN Ltd.,POWER,SJVN,EQ,INE002L01015 +SKF India Ltd.,INDUSTRIAL MANUFACTURING,SKFINDIA,EQ,INE640A01023 +SRF Ltd.,CHEMICALS,SRF,EQ,INE647A01010 +Sanofi India Ltd.,PHARMA,SANOFI,EQ,INE058A01010 +Schaeffler India Ltd.,INDUSTRIAL MANUFACTURING,SCHAEFFLER,EQ,INE513A01014 +Schneider Electric Infrastructure Ltd.,INDUSTRIAL MANUFACTURING,SCHNEIDER,EQ,INE839M01018 +Sequent 
Scientific Ltd.,PHARMA,SEQUENT,EQ,INE807F01027 +Sharda Cropchem Ltd.,FERTILISERS & PESTICIDES,SHARDACROP,EQ,INE221J01015 +Sheela Foam Ltd.,CONSUMER GOODS,SFL,EQ,INE916U01025 +Shilpa Medicare Ltd.,PHARMA,SHILPAMED,EQ,INE790G01031 +Shipping Corporation of India Ltd.,SERVICES,SCI,EQ,INE109A01011 +Shoppers Stop Ltd.,CONSUMER SERVICES,SHOPERSTOP,EQ,INE498B01024 +Shree Cement Ltd.,CEMENT & CEMENT PRODUCTS,SHREECEM,EQ,INE070A01015 +Shriram City Union Finance Ltd.,FINANCIAL SERVICES,SHRIRAMCIT,EQ,INE722A01011 +Shriram Transport Finance Co. Ltd.,FINANCIAL SERVICES,SRTRANSFIN,EQ,INE721A01013 +Siemens Ltd.,INDUSTRIAL MANUFACTURING,SIEMENS,EQ,INE003A01024 +Sobha Ltd.,CONSTRUCTION,SOBHA,EQ,INE671H01015 +Solar Industries India Ltd.,CHEMICALS,SOLARINDS,EQ,INE343H01029 +Solara Active Pharma Sciences Ltd.,PHARMA,SOLARA,EQ,INE624Z01016 +Sonata Software Ltd.,IT,SONATSOFTW,EQ,INE269A01021 +Spandana Sphoorty Financial Ltd.,FINANCIAL SERVICES,SPANDANA,EQ,INE572J01011 +Spicejet Ltd.,SERVICES,SPICEJET,EQ,INE285B01017 +Star Cement Ltd.,CEMENT & CEMENT PRODUCTS,STARCEMENT,EQ,INE460H01021 +State Bank of India,FINANCIAL SERVICES,SBIN,EQ,INE062A01020 +Steel Authority of India Ltd.,METALS,SAIL,EQ,INE114A01011 +Sterling And Wilson Solar Ltd.,CONSTRUCTION,SWSOLAR,EQ,INE00M201021 +Sterlite Technologies Ltd.,TELECOM,STLTECH,EQ,INE089C01029 +Strides Pharma Science Ltd.,PHARMA,STAR,EQ,INE939A01011 +Sudarshan Chemical Industries Ltd.,CHEMICALS,SUDARSCHEM,EQ,INE659A01023 +Sumitomo Chemical India Ltd.,FERTILISERS & PESTICIDES,SUMICHEM,EQ,INE258G01013 +Sun Pharma Advanced Research Company Ltd.,PHARMA,SPARC,EQ,INE232I01014 +Sun Pharmaceutical Industries Ltd.,PHARMA,SUNPHARMA,EQ,INE044A01036 +Sun TV Network Ltd.,MEDIA ENTERTAINMENT & PUBLICATION,SUNTV,EQ,INE424H01027 +Sundaram Clayton Ltd.,AUTOMOBILE,SUNCLAYLTD,EQ,INE105A01035 +Sundaram Finance Ltd.,FINANCIAL SERVICES,SUNDARMFIN,EQ,INE660A01013 +Sundram Fasteners Ltd.,AUTOMOBILE,SUNDRMFAST,EQ,INE387A01021 +Sunteck Realty 
Ltd.,CONSTRUCTION,SUNTECK,EQ,INE805D01034 +Suprajit Engineering Ltd.,AUTOMOBILE,SUPRAJIT,EQ,INE399C01030 +Supreme Industries Ltd.,INDUSTRIAL MANUFACTURING,SUPREMEIND,EQ,INE195A01028 +Supreme Petrochem Ltd.,CHEMICALS,SUPPETRO,EQ,INE663A01017 +Suven Pharmaceuticals Ltd.,PHARMA,SUVENPHAR,EQ,INE03QK01018 +Suzlon Energy Ltd.,INDUSTRIAL MANUFACTURING,SUZLON,EQ,INE040H01021 +Swan Energy Ltd.,TEXTILES,SWANENERGY,EQ,INE665A01038 +Symphony Ltd.,CONSUMER GOODS,SYMPHONY,EQ,INE225D01027 +Syngene International Ltd.,HEALTHCARE SERVICES,SYNGENE,EQ,INE398R01022 +TCI Express Ltd.,SERVICES,TCIEXP,EQ,INE586V01016 +TCNS Clothing Co. Ltd.,TEXTILES,TCNSBRANDS,EQ,INE778U01029 +TTK Prestige Ltd.,CONSUMER GOODS,TTKPRESTIG,EQ,INE690A01010 +TV18 Broadcast Ltd.,MEDIA ENTERTAINMENT & PUBLICATION,TV18BRDCST,EQ,INE886H01027 +TVS Motor Company Ltd.,AUTOMOBILE,TVSMOTOR,EQ,INE494B01023 +Tanla Platforms Ltd.,IT,TANLA,BE,INE483C01032 +Tasty Bite Eatables Ltd.,CONSUMER GOODS,TASTYBITE,EQ,INE488B01017 +Tata Chemicals Ltd.,CHEMICALS,TATACHEM,EQ,INE092A01019 +Tata Coffee Ltd.,CONSUMER GOODS,TATACOFFEE,EQ,INE493A01027 +Tata Communications Ltd.,TELECOM,TATACOMM,EQ,INE151A01013 +Tata Consultancy Services Ltd.,IT,TCS,EQ,INE467B01029 +Tata Consumer Products Ltd.,CONSUMER GOODS,TATACONSUM,EQ,INE192A01025 +Tata Elxsi Ltd.,IT,TATAELXSI,EQ,INE670A01012 +Tata Investment Corporation Ltd.,FINANCIAL SERVICES,TATAINVEST,EQ,INE672A01018 +Tata Motors Ltd DVR,AUTOMOBILE,TATAMTRDVR,EQ,IN9155A01020 +Tata Motors Ltd.,AUTOMOBILE,TATAMOTORS,EQ,INE155A01022 +Tata Power Co. 
Ltd.,POWER,TATAPOWER,EQ,INE245A01021 +Tata Steel Ltd.,METALS,TATASTEEL,EQ,INE081A01012 +Teamlease Services Ltd.,SERVICES,TEAMLEASE,EQ,INE985S01024 +Tech Mahindra Ltd.,IT,TECHM,EQ,INE669C01036 +The New India Assurance Company Ltd.,FINANCIAL SERVICES,NIACL,EQ,INE470Y01017 +The Ramco Cements Ltd.,CEMENT & CEMENT PRODUCTS,RAMCOCEM,EQ,INE331A01037 +Thermax Ltd.,INDUSTRIAL MANUFACTURING,THERMAX,EQ,INE152A01029 +Thyrocare Technologies Ltd.,HEALTHCARE SERVICES,THYROCARE,EQ,INE594H01019 +Timken India Ltd.,INDUSTRIAL MANUFACTURING,TIMKEN,EQ,INE325A01013 +Titan Company Ltd.,CONSUMER GOODS,TITAN,EQ,INE280A01028 +Torrent Pharmaceuticals Ltd.,PHARMA,TORNTPHARM,EQ,INE685A01028 +Torrent Power Ltd.,POWER,TORNTPOWER,EQ,INE813H01021 +Trent Ltd.,CONSUMER SERVICES,TRENT,EQ,INE849A01020 +Trident Ltd.,TEXTILES,TRIDENT,EQ,INE064C01022 +Triveni Turbine Ltd.,INDUSTRIAL MANUFACTURING,TRITURBINE,EQ,INE152M01016 +Tube Investments of India Ltd.,AUTOMOBILE,TIINDIA,EQ,INE974X01010 +UCO Bank,FINANCIAL SERVICES,UCOBANK,EQ,INE691A01018 +UFLEX Ltd.,INDUSTRIAL MANUFACTURING,UFLEX,EQ,INE516A01017 +UPL Ltd.,FERTILISERS & PESTICIDES,UPL,EQ,INE628A01036 +UTI Asset Management Company Ltd.,FINANCIAL SERVICES,UTIAMC,EQ,INE094J01016 +Ujjivan Financial Services Ltd.,FINANCIAL SERVICES,UJJIVAN,EQ,INE334L01012 +Ujjivan Small Finance Bank Ltd.,FINANCIAL SERVICES,UJJIVANSFB,EQ,INE551W01018 +UltraTech Cement Ltd.,CEMENT & CEMENT PRODUCTS,ULTRACEMCO,EQ,INE481G01011 +Union Bank of India,FINANCIAL SERVICES,UNIONBANK,EQ,INE692A01016 +United Breweries Ltd.,CONSUMER GOODS,UBL,EQ,INE686F01025 +United Spirits Ltd.,CONSUMER GOODS,MCDOWELL-N,EQ,INE854D01024 +V-Guard Industries Ltd.,CONSUMER GOODS,VGUARD,EQ,INE951I01027 +V-Mart Retail Ltd.,CONSUMER SERVICES,VMART,EQ,INE665J01013 +V.I.P. 
Industries Ltd.,CONSUMER GOODS,VIPIND,EQ,INE054A01027 +VST Industries Ltd.,CONSUMER GOODS,VSTIND,EQ,INE710A01016 +Vaibhav Global Ltd.,CONSUMER SERVICES,VAIBHAVGBL,EQ,INE884A01027 +Vakrangee Ltd.,IT,VAKRANGEE,EQ,INE051B01021 +Valiant Organics Ltd.,CHEMICALS,VALIANTORG,EQ,INE565V01010 +Vardhman Textiles Ltd.,TEXTILES,VTL,EQ,INE825A01012 +Varroc Engineering Ltd.,AUTOMOBILE,VARROC,EQ,INE665L01035 +Varun Beverages Ltd.,CONSUMER GOODS,VBL,EQ,INE200M01013 +Vedanta Ltd.,METALS,VEDL,EQ,INE205A01025 +Venky's (India) Ltd.,CONSUMER GOODS,VENKEYS,EQ,INE398A01010 +Vinati Organics Ltd.,CHEMICALS,VINATIORGA,EQ,INE410B01037 +Vodafone Idea Ltd.,TELECOM,IDEA,EQ,INE669E01016 +Voltas Ltd.,CONSUMER GOODS,VOLTAS,EQ,INE226A01021 +WABCO India Ltd.,AUTOMOBILE,WABCOINDIA,EQ,INE342J01019 +Welspun Corp Ltd.,METALS,WELCORP,EQ,INE191B01025 +Welspun India Ltd.,TEXTILES,WELSPUNIND,EQ,INE192B01031 +Westlife Development Ltd.,CONSUMER SERVICES,WESTLIFE,EQ,INE274F01020 +Whirlpool of India Ltd.,CONSUMER GOODS,WHIRLPOOL,EQ,INE716A01013 +Wipro Ltd.,IT,WIPRO,EQ,INE075A01022 +Wockhardt Ltd.,PHARMA,WOCKPHARMA,EQ,INE049B01025 +Yes Bank Ltd.,FINANCIAL SERVICES,YESBANK,EQ,INE528G01035 +Zee Entertainment Enterprises Ltd.,MEDIA ENTERTAINMENT & PUBLICATION,ZEEL,EQ,INE256A01028 +Zensar Technolgies Ltd.,IT,ZENSARTECH,EQ,INE520A01027 +Zydus Wellness Ltd.,CONSUMER GOODS,ZYDUSWELL,EQ,INE768C01010 +eClerx Services Ltd.,IT,ECLERX,BE,INE738I01010 diff --git a/scripts/Fetching trending stocks using nlp/data/ind_nifty50list.csv b/scripts/Fetching trending stocks using nlp/data/ind_nifty50list.csv new file mode 100644 index 0000000..f418a3d --- /dev/null +++ b/scripts/Fetching trending stocks using nlp/data/ind_nifty50list.csv @@ -0,0 +1,51 @@ +Company Name,Industry,Symbol,Series,ISIN Code +Adani Ports and Special Economic Zone Ltd.,SERVICES,ADANIPORTS,EQ,INE742F01042 +Asian Paints Ltd.,CONSUMER GOODS,ASIANPAINT,EQ,INE021A01026 +Axis Bank Ltd.,FINANCIAL SERVICES,AXISBANK,EQ,INE238A01034 +Bajaj Auto 
Ltd.,AUTOMOBILE,BAJAJ-AUTO,EQ,INE917I01010 +Bajaj Finance Ltd.,FINANCIAL SERVICES,BAJFINANCE,EQ,INE296A01024 +Bajaj Finserv Ltd.,FINANCIAL SERVICES,BAJAJFINSV,EQ,INE918I01018 +Bharat Petroleum Corporation Ltd.,OIL & GAS,BPCL,EQ,INE029A01011 +Bharti Airtel Ltd.,TELECOM,BHARTIARTL,EQ,INE397D01024 +Britannia Industries Ltd.,CONSUMER GOODS,BRITANNIA,EQ,INE216A01030 +Cipla Ltd.,PHARMA,CIPLA,EQ,INE059A01026 +Coal India Ltd.,METALS,COALINDIA,EQ,INE522F01014 +Divi's Laboratories Ltd.,PHARMA,DIVISLAB,EQ,INE361B01024 +Dr. Reddy's Laboratories Ltd.,PHARMA,DRREDDY,EQ,INE089A01023 +Eicher Motors Ltd.,AUTOMOBILE,EICHERMOT,EQ,INE066A01021 +Grasim Industries Ltd.,CEMENT & CEMENT PRODUCTS,GRASIM,EQ,INE047A01021 +HCL Technologies Ltd.,IT,HCLTECH,EQ,INE860A01027 +HDFC Bank Ltd.,FINANCIAL SERVICES,HDFCBANK,EQ,INE040A01034 +HDFC Life Insurance Company Ltd.,FINANCIAL SERVICES,HDFCLIFE,EQ,INE795G01014 +Hero MotoCorp Ltd.,AUTOMOBILE,HEROMOTOCO,EQ,INE158A01026 +Hindalco Industries Ltd.,METALS,HINDALCO,EQ,INE038A01020 +Hindustan Unilever Ltd.,CONSUMER GOODS,HINDUNILVR,EQ,INE030A01027 +Housing Development Finance Corporation Ltd.,FINANCIAL SERVICES,HDFC,EQ,INE001A01036 +ICICI Bank Ltd.,FINANCIAL SERVICES,ICICIBANK,EQ,INE090A01021 +ITC Ltd.,CONSUMER GOODS,ITC,EQ,INE154A01025 +Indian Oil Corporation Ltd.,OIL & GAS,IOC,EQ,INE242A01010 +IndusInd Bank Ltd.,FINANCIAL SERVICES,INDUSINDBK,EQ,INE095A01012 +Infosys Ltd.,IT,INFY,EQ,INE009A01021 +JSW Steel Ltd.,METALS,JSWSTEEL,EQ,INE019A01038 +Kotak Mahindra Bank Ltd.,FINANCIAL SERVICES,KOTAKBANK,EQ,INE237A01028 +Larsen & Toubro Ltd.,CONSTRUCTION,LT,EQ,INE018A01030 +Mahindra & Mahindra Ltd.,AUTOMOBILE,M&M,EQ,INE101A01026 +Maruti Suzuki India Ltd.,AUTOMOBILE,MARUTI,EQ,INE585B01010 +NTPC Ltd.,POWER,NTPC,EQ,INE733E01010 +Nestle India Ltd.,CONSUMER GOODS,NESTLEIND,EQ,INE239A01016 +Oil & Natural Gas Corporation Ltd.,OIL & GAS,ONGC,EQ,INE213A01029 +Power Grid Corporation of India Ltd.,POWER,POWERGRID,EQ,INE752E01010 +Reliance Industries Ltd.,OIL & 
GAS,RELIANCE,EQ,INE002A01018 +SBI Life Insurance Company Ltd.,FINANCIAL SERVICES,SBILIFE,EQ,INE123W01016 +Shree Cement Ltd.,CEMENT & CEMENT PRODUCTS,SHREECEM,EQ,INE070A01015 +State Bank of India,FINANCIAL SERVICES,SBIN,EQ,INE062A01020 +Sun Pharmaceutical Industries Ltd.,PHARMA,SUNPHARMA,EQ,INE044A01036 +Tata Consultancy Services Ltd.,IT,TCS,EQ,INE467B01029 +Tata Consumer Products Ltd.,CONSUMER GOODS,TATACONSUM,EQ,INE192A01025 +Tata Motors Ltd.,AUTOMOBILE,TATAMOTORS,EQ,INE155A01022 +Tata Steel Ltd.,METALS,TATASTEEL,EQ,INE081A01012 +Tech Mahindra Ltd.,IT,TECHM,EQ,INE669C01036 +Titan Company Ltd.,CONSUMER GOODS,TITAN,EQ,INE280A01028 +UPL Ltd.,FERTILISERS & PESTICIDES,UPL,EQ,INE628A01036 +UltraTech Cement Ltd.,CEMENT & CEMENT PRODUCTS,ULTRACEMCO,EQ,INE481G01011 +Wipro Ltd.,IT,WIPRO,EQ,INE075A01022 diff --git a/scripts/Fetching trending stocks using nlp/requirements.txt b/scripts/Fetching trending stocks using nlp/requirements.txt new file mode 100644 index 0000000..f589ab7 --- /dev/null +++ b/scripts/Fetching trending stocks using nlp/requirements.txt @@ -0,0 +1,4 @@ +spacy - en_core_web_sm model +requests +streamlit +yfinance \ No newline at end of file diff --git a/scripts/Script to fetch top IMBD listed movies/Readme.md b/scripts/Script to fetch top IMBD listed movies/Readme.md new file mode 100644 index 0000000..aadb229 --- /dev/null +++ b/scripts/Script to fetch top IMBD listed movies/Readme.md @@ -0,0 +1,8 @@ +# Script to fetch the top IMDb movies + +This script fetches the list of top-rated IMDb movies using Beautiful Soup. +## Simplest way to run + +Open IDLE, open the file, press F5, and enjoy ✔✔ + +The script will create a CSV file containing the fetched list. 
"""Scrape the IMDb top chart page and save it as ``imdb_top_250_movies.csv``.

Running this file fetches ``url``, extracts one record per chart row
(place, title, rating, year, director/cast string), prints every record and
writes them all to ``imdb_top_250_movies.csv`` in the current directory.
"""
import re

import pandas as pd

url = 'http://www.imdb.com/chart/top'

# A whitespace-normalised title cell looks like "<place>. <title> (<year>)".
# The year is anchored at the END of the cell so that parentheses inside a
# title cannot be mistaken for it.
_TITLE_CELL = re.compile(
    r'^(?P<place>\d+)\.\s*(?P<title>.*?)\s*\((?P<year>[^()]*)\)$')


def parse_title_cell(cell_text):
    """Split the text of one chart title cell into its three parts.

    Args:
        cell_text: Raw text of a ``td.titleColumn`` cell; any amount of
            whitespace/newlines between the parts is tolerated.

    Returns:
        A ``(place, movie_title, year)`` tuple of strings.

    Raises:
        ValueError: If the text does not look like "<place>. <title> (<year>)".
    """
    normalized = ' '.join(cell_text.split())
    match = _TITLE_CELL.match(normalized)
    if match is None:
        raise ValueError('Unrecognised title cell: %r' % (cell_text,))
    # The place is read from the text itself instead of being sliced by the
    # digit count of a 0-based loop index, which truncated it at rows 10, 100,
    # ... and left a stray leading space on the title.  Matching the dot after
    # the place explicitly also keeps dots that belong to the title.
    return match.group('place'), match.group('title'), match.group('year')


def fetch_top_movies(chart_url=url):
    """Download the chart page and return one dict per movie.

    Each dict has the keys ``place``, ``movie_title``, ``rating``, ``year``
    and ``star_cast``.

    Raises:
        requests.HTTPError: If the server answers with an error status.
        ValueError: If the title, crew and rating selectors return different
            numbers of elements, or a title cell cannot be parsed.
    """
    # Imported here so that parse_title_cell() stays importable (and testable)
    # on machines that do not have the scraping libraries installed.
    import requests
    from bs4 import BeautifulSoup

    response = requests.get(chart_url, timeout=30)
    # Fail loudly rather than parsing an error page into an empty CSV.
    response.raise_for_status()
    soup = BeautifulSoup(response.text, "html.parser")

    # NOTE(review): these selectors assume the table-based chart markup
    # (td.titleColumn / td.posterColumn) - confirm the page still serves it.
    title_cells = soup.select('td.titleColumn')
    crew = [a.attrs.get('title') for a in soup.select('td.titleColumn a')]
    ratings = [b.attrs.get('data-value')
               for b in soup.select('td.posterColumn span[name=ir]')]

    # The three lists are paired positionally, so a length mismatch would
    # attach ratings/cast to the wrong movie.
    if not (len(title_cells) == len(crew) == len(ratings)):
        raise ValueError(
            'Selector mismatch: %d titles, %d crew entries, %d ratings'
            % (len(title_cells), len(crew), len(ratings)))

    movie_records = []
    for cell, rating, star_cast in zip(title_cells, ratings, crew):
        place, movie_title, year = parse_title_cell(cell.get_text())
        movie_records.append({"place": place,
                              "movie_title": movie_title,
                              "rating": rating,
                              "year": year,
                              "star_cast": star_cast,
                              })
    return movie_records


def main():
    """Fetch the chart, print every entry and write the CSV file."""
    movie_records = fetch_top_movies()

    for movie in movie_records:
        print(movie['place'], '-', movie['movie_title'], '('+movie['year'] +
              ') -', 'Starring:', movie['star_cast'], movie['rating'])

    df = pd.DataFrame(movie_records)
    df.to_csv('imdb_top_250_movies.csv', index=False)


if __name__ == '__main__':
    main()
Ledger" +4,The Godfather Part II,8.984194506058763,1974,"Francis Ford Coppola (dir.), Al Pacino, Robert De Niro" +5,12 Angry Men,8.950378660821537,1957,"Sidney Lumet (dir.), Henry Fonda, Lee J. Cobb" +6,Schindler's List,8.937490356517953,1993,"Steven Spielberg (dir.), Liam Neeson, Ralph Fiennes" +7,The Lord of the Rings: The Return of the King,8.92747119693047,2003,"Peter Jackson (dir.), Elijah Wood, Viggo Mortensen" +8,Pulp Fiction,8.848600373629079,1994,"Quentin Tarantino (dir.), John Travolta, Uma Thurman" +9,The Lord of the Rings: The Fellowship of the Ring,8.807764305629757,2001,"Peter Jackson (dir.), Elijah Wood, Ian McKellen" +1," Il buono, il brutto, il cattivo",8.791317254914828,1966,"Sergio Leone (dir.), Clint Eastwood, Eli Wallach" +11,Forrest Gump,8.76765197219575,1994,"Robert Zemeckis (dir.), Tom Hanks, Robin Wright" +12,Fight Club,8.748855294854142,1999,"David Fincher (dir.), Brad Pitt, Edward Norton" +13,Inception,8.733239211175135,2010,"Christopher Nolan (dir.), Leonardo DiCaprio, Joseph Gordon-Levitt" +14,The Lord of the Rings: The Two Towers,8.732812731363351,2002,"Peter Jackson (dir.), Elijah Wood, Ian McKellen" +15,The Empire Strikes Back,8.700015179846625,1980,"Irvin Kershner (dir.), Mark Hamill, Harrison Ford" +16,The Matrix,8.669806873023978,1999,"Lana Wachowski (dir.), Keanu Reeves, Laurence Fishburne" +17,Goodfellas,8.65205609337949,1990,"Martin Scorsese (dir.), Robert De Niro, Ray Liotta" +18,One Flew Over the Cuckoo's Nest,8.639647532083753,1975,"Milos Forman (dir.), Jack Nicholson, Louise Fletcher" +19,Se7en,8.604249174368016,1995,"David Fincher (dir.), Morgan Freeman, Brad Pitt" +20,Shichinin no samurai,8.599072399250122,1954,"Akira Kurosawa (dir.), Toshirô Mifune, Takashi Shimura" +21,It's a Wonderful Life,8.595597467085389,1946,"Frank Capra (dir.), James Stewart, Donna Reed" +22,The Silence of the Lambs,8.588098006838871,1991,"Jonathan Demme (dir.), Jodie Foster, Anthony Hopkins" +23,Cidade de Deus,8.579576002977847,2002,"Fernando 
Meirelles (dir.), Alexandre Rodrigues, Leandro Firmino" +24,Saving Private Ryan,8.578595835275541,1998,"Steven Spielberg (dir.), Tom Hanks, Matt Damon" +25,La vita è bella,8.567330756535378,1997,"Roberto Benigni (dir.), Roberto Benigni, Nicoletta Braschi" +26,Interstellar,8.56303060608984,2014,"Christopher Nolan (dir.), Matthew McConaughey, Anne Hathaway" +27,The Green Mile,8.56163218111644,1999,"Frank Darabont (dir.), Tom Hanks, Michael Clarke Duncan" +28,Star Wars,8.550952471373744,1977,"George Lucas (dir.), Mark Hamill, Harrison Ford" +29,Terminator 2: Judgment Day,8.536034536114844,1991,"James Cameron (dir.), Arnold Schwarzenegger, Linda Hamilton" +30,Back to the Future,8.517634371526357,1985,"Robert Zemeckis (dir.), Michael J. Fox, Christopher Lloyd" +31,Sen to Chihiro no kamikakushi,8.515957661934813,2001,"Hayao Miyazaki (dir.), Daveigh Chase, Suzanne Pleshette" +32,Psycho,8.508100171700699,1960,"Alfred Hitchcock (dir.), Anthony Perkins, Janet Leigh" +33,The Pianist,8.506140125815184,2002,"Roman Polanski (dir.), Adrien Brody, Thomas Kretschmann" +34,Gisaengchung,8.497547306878936,2019,"Bong Joon Ho (dir.), Song Kang-ho, Lee Sun-kyun" +35,Léon,8.496742949795678,1994,"Luc Besson (dir.), Jean Reno, Gary Oldman" +36,The Lion King,8.488303334526902,1994,"Roger Allers (dir.), Matthew Broderick, Jeremy Irons" +37,Gladiator,8.48613057086782,2000,"Ridley Scott (dir.), Russell Crowe, Joaquin Phoenix" +38,American History X,8.483038321302992,1998,"Tony Kaye (dir.), Edward Norton, Edward Furlong" +39,The Departed,8.475406175977735,2006,"Martin Scorsese (dir.), Leonardo DiCaprio, Matt Damon" +40,The Usual Suspects,8.472974613205455,1995,"Bryan Singer (dir.), Kevin Spacey, Gabriel Byrne" +41,The Prestige,8.468754981826935,2006,"Christopher Nolan (dir.), Christian Bale, Hugh Jackman" +42,Whiplash,8.46419492410809,2014,"Damien Chazelle (dir.), Miles Teller, J.K. 
Simmons" +43,Casablanca,8.463536574401392,1942,"Michael Curtiz (dir.), Humphrey Bogart, Ingrid Bergman" +44,The Intouchables,8.45389376019163,2011,"Olivier Nakache (dir.), François Cluzet, Omar Sy" +45,Seppuku,8.452823221120253,1962,"Masaki Kobayashi (dir.), Tatsuya Nakadai, Akira Ishihama" +46,Hotaru no haka,8.452312496213862,1988,"Isao Takahata (dir.), Tsutomu Tatsumi, Ayano Shiraishi" +47,Modern Times,8.448896098758617,1936,"Charles Chaplin (dir.), Charles Chaplin, Paulette Goddard" +48,Once Upon a Time in the West,8.445557033237119,1968,"Sergio Leone (dir.), Henry Fonda, Charles Bronson" +49,Rear Window,8.436516529285429,1954,"Alfred Hitchcock (dir.), James Stewart, Grace Kelly" +50,Alien,8.434191515187006,1979,"Ridley Scott (dir.), Sigourney Weaver, Tom Skerritt" +51,City Lights,8.43400078426509,1931,"Charles Chaplin (dir.), Charles Chaplin, Virginia Cherrill" +52,Nuovo Cinema Paradiso,8.432330911775702,1988,"Giuseppe Tornatore (dir.), Philippe Noiret, Enzo Cannavale" +53,Apocalypse Now,8.424316691843506,1979,"Francis Ford Coppola (dir.), Martin Sheen, Marlon Brando" +54,Memento,8.423001092607869,2000,"Christopher Nolan (dir.), Guy Pearce, Carrie-Anne Moss" +55,Raiders of the Lost Ark,8.40875402873324,1981,"Steven Spielberg (dir.), Harrison Ford, Karen Allen" +56,Django Unchained,8.405712989541973,2012,"Quentin Tarantino (dir.), Jamie Foxx, Christoph Waltz" +57,WALL·E,8.393874760771658,2008,"Andrew Stanton (dir.), Ben Burtt, Elissa Knight" +58,The Lives of Others,8.385260120005508,2006,"Florian Henckel von Donnersmarck (dir.), Ulrich Mühe, Martina Gedeck" +59,Sunset Blvd,8.381538331508562,1950,"Billy Wilder (dir.), William Holden, Gloria Swanson" +60,Paths of Glory,8.372273172821316,1957,"Stanley Kubrick (dir.), Kirk Douglas, Ralph Meeker" +61,The Shining,8.366253580048621,1980,"Stanley Kubrick (dir.), Jack Nicholson, Shelley Duvall" +62,The Great Dictator,8.366139448005406,1940,"Charles Chaplin (dir.), Charles Chaplin, Paulette Goddard" +63,Avengers: Infinity 
War,8.35982850807831,2018,"Anthony Russo (dir.), Robert Downey Jr., Chris Hemsworth" +64,Witness for the Prosecution,8.359818706084797,1957,"Billy Wilder (dir.), Tyrone Power, Marlene Dietrich" +65,Aliens,8.343195944781366,1986,"James Cameron (dir.), Sigourney Weaver, Michael Biehn" +66,American Beauty,8.33434708795025,1999,"Sam Mendes (dir.), Kevin Spacey, Annette Bening" +67,Spider-Man: Into the Spider-Verse,8.333401167582558,2018,"Bob Persichetti (dir.), Shameik Moore, Jake Johnson" +68,Dr Strangelove or: How I Learned to Stop Worrying and Love the Bomb,8.33088130513012,1964,"Stanley Kubrick (dir.), Peter Sellers, George C. Scott" +69,The Dark Knight Rises,8.327616707512922,2012,"Christopher Nolan (dir.), Christian Bale, Tom Hardy" +70,Oldeuboi,8.320293271332895,2003,"Park Chan-wook (dir.), Choi Min-sik, Yoo Ji-tae" +71,Joker,8.316498373495666,2019,"Todd Phillips (dir.), Joaquin Phoenix, Robert De Niro" +72,Amadeus,8.315915050787167,1984,"Milos Forman (dir.), F. Murray Abraham, Tom Hulce" +73,Inglourious Basterds,8.314304876708752,2009,"Quentin Tarantino (dir.), Brad Pitt, Diane Kruger" +74,Toy Story,8.314113950777616,1995,"John Lasseter (dir.), Tom Hanks, Tim Allen" +75,Coco,8.314063119617284,2017,"Lee Unkrich (dir.), Anthony Gonzalez, Gael García Bernal" +76,Braveheart,8.313879864301272,1995,"Mel Gibson (dir.), Mel Gibson, Sophie Marceau" +77,Das Boot,8.312114822300837,1981,"Wolfgang Petersen (dir.), Jürgen Prochnow, Herbert Grönemeyer" +78,Avengers: Endgame,8.303857104770678,2019,"Anthony Russo (dir.), Robert Downey Jr., Chris Evans" +79,Mononoke-hime,8.303350373225244,1997,"Hayao Miyazaki (dir.), Yôji Matsuda, Yuriko Ishida" +80,Top Gun: Maverick,8.299656428177661,2022,"Joseph Kosinski (dir.), Tom Cruise, Jennifer Connelly" +81,Once Upon a Time in America,8.297673313570954,1984,"Sergio Leone (dir.), Robert De Niro, James Woods" +82,Good Will Hunting,8.288839571210985,1997,"Gus Van Sant (dir.), Robin Williams, Matt Damon" +83,Kimi no na 
wa,8.279527211534438,2016,"Makoto Shinkai (dir.), Ryûnosuke Kamiki, Mone Kamishiraishi" +84,Requiem for a Dream,8.275746143325462,2000,"Darren Aronofsky (dir.), Ellen Burstyn, Jared Leto" +85,Toy Story 3,8.274002958042601,2010,"Lee Unkrich (dir.), Tom Hanks, Tim Allen" +86,Singin' in the Rain,8.273688160960239,1952,"Stanley Donen (dir.), Gene Kelly, Donald O'Connor" +87,3 Idiots,8.27343895400716,2009,"Rajkumar Hirani (dir.), Aamir Khan, Madhavan" +88,Tengoku to jigoku,8.269244396218957,1963,"Akira Kurosawa (dir.), Toshirô Mifune, Yutaka Sada" +89,Star Wars: Episode VI - Return of the Jedi,8.265672583109295,1983,"Richard Marquand (dir.), Mark Hamill, Harrison Ford" +90,2001: A Space Odyssey,8.263722837501648,1968,"Stanley Kubrick (dir.), Keir Dullea, Gary Lockwood" +91,Eternal Sunshine of the Spotless Mind,8.263099458543415,2004,"Michel Gondry (dir.), Jim Carrey, Kate Winslet" +92,Capharnaüm,8.262183579687944,2018,"Nadine Labaki (dir.), Zain Al Rafeea, Yordanos Shiferaw" +93,Reservoir Dogs,8.261877143221772,1992,"Quentin Tarantino (dir.), Harvey Keitel, Tim Roth" +94,Jagten,8.2561157078314,2012,"Thomas Vinterberg (dir.), Mads Mikkelsen, Thomas Bo Larsen" +95,Citizen Kane,8.254669534194218,1941,"Orson Welles (dir.), Orson Welles, Joseph Cotten" +96,Lawrence of Arabia,8.253946628118202,1962,"David Lean (dir.), Peter O'Toole, Alec Guinness" +97,M - Eine Stadt sucht einen Mörder,8.253238146338694,1931,"Fritz Lang (dir.), Peter Lorre, Ellen Widmann" +98,Idi i smotri,8.251420306430981,1985,"Elem Klimov (dir.), Aleksey Kravchenko, Olga Mironova" +99,North by Northwest,8.249599981496104,1959,"Alfred Hitchcock (dir.), Cary Grant, Eva Marie Saint" +10, Vertigo,8.245985214386339,1958,"Alfred Hitchcock (dir.), James Stewart, Kim Novak" +101,Le fabuleux destin d'Amélie Poulain,8.243743793901526,2001,"Jean-Pierre Jeunet (dir.), Audrey Tautou, Mathieu Kassovitz" +102,A Clockwork Orange,8.242211458589265,1971,"Stanley Kubrick (dir.), Malcolm McDowell, Patrick Magee" +103,The 
Apartment,8.239281256451196,1960,"Billy Wilder (dir.), Jack Lemmon, Shirley MacLaine" +104,Double Indemnity,8.238818471235854,1944,"Billy Wilder (dir.), Fred MacMurray, Barbara Stanwyck" +105,Full Metal Jacket,8.238456878568147,1987,"Stanley Kubrick (dir.), Matthew Modine, R. Lee Ermey" +106,Ikiru,8.23798294621132,1952,"Akira Kurosawa (dir.), Takashi Shimura, Nobuo Kaneko" +107,Scarface,8.235119483708974,1983,"Brian De Palma (dir.), Al Pacino, Michelle Pfeiffer" +108,Hamilton,8.233902143761393,2020,"Thomas Kail (dir.), Lin-Manuel Miranda, Phillipa Soo" +109,The Sting,8.227720387044808,1973,"George Roy Hill (dir.), Paul Newman, Robert Redford" +110,To Kill a Mockingbird,8.22688247095639,1962,"Robert Mulligan (dir.), Gregory Peck, John Megna" +111,Heat,8.224713767308861,1995,"Michael Mann (dir.), Al Pacino, Robert De Niro" +112,Up,8.22448044743651,2009,"Pete Docter (dir.), Edward Asner, Jordan Nagai" +113,Incendies,8.22394925673602,2010,"Denis Villeneuve (dir.), Lubna Azabal, Mélissa Désormeaux-Poulin" +114,Taxi Driver,8.223682833598346,1976,"Martin Scorsese (dir.), Robert De Niro, Jodie Foster" +115,Metropolis,8.222147904524576,1927,"Fritz Lang (dir.), Brigitte Helm, Alfred Abel" +116,Jodaeiye Nader az Simin,8.221637434217634,2011,"Asghar Farhadi (dir.), Payman Maadi, Leila Hatami" +117,LA Confidential,8.221290450710068,1997,"Curtis Hanson (dir.), Kevin Spacey, Russell Crowe" +118,Snatch,8.218544453436461,2000,"Guy Ritchie (dir.), Jason Statham, Brad Pitt" +119,Die Hard,8.218114462560006,1988,"John McTiernan (dir.), Bruce Willis, Alan Rickman" +120,Ladri di biciclette,8.218014560920595,1948,"Vittorio De Sica (dir.), Lamberto Maggiorani, Enzo Staiola" +121,Indiana Jones and the Last Crusade,8.216887862218428,1989,"Steven Spielberg (dir.), Harrison Ford, Sean Connery" +122,Taare Zameen Par,8.211373183282015,2007,"Aamir Khan (dir.), Darsheel Safary, Aamir Khan" +123,1917,8.21133123154053,2019,"Sam Mendes (dir.), Dean-Charles Chapman, George MacKay" +124,Der 
Untergang,8.203691553618699,2004,"Oliver Hirschbiegel (dir.), Bruno Ganz, Alexandra Maria Lara" +125,Per qualche dollaro in più,8.201642263500739,1965,"Sergio Leone (dir.), Clint Eastwood, Lee Van Cleef" +126,Batman Begins,8.199707665814062,2005,"Christopher Nolan (dir.), Christian Bale, Michael Caine" +127,Dangal,8.199353048642266,2016,"Nitesh Tiwari (dir.), Aamir Khan, Sakshi Tanwar" +128,The Kid,8.193437246113863,1921,"Charles Chaplin (dir.), Charles Chaplin, Edna Purviance" +129,Some Like It Hot,8.191815028455801,1959,"Billy Wilder (dir.), Marilyn Monroe, Tony Curtis" +130,The Father,8.180891914462121,2020,"Florian Zeller (dir.), Anthony Hopkins, Olivia Colman" +131,All About Eve,8.18055449735846,1950,"Joseph L. Mankiewicz (dir.), Bette Davis, Anne Baxter" +132,Green Book,8.176065254686911,2018,"Peter Farrelly (dir.), Viggo Mortensen, Mahershala Ali" +133,The Wolf of Wall Street,8.174646007238417,2013,"Martin Scorsese (dir.), Leonardo DiCaprio, Jonah Hill" +134,Judgment at Nuremberg,8.169857701876323,1961,"Stanley Kramer (dir.), Spencer Tracy, Burt Lancaster" +135,Ran,8.165124750988024,1985,"Akira Kurosawa (dir.), Tatsuya Nakadai, Akira Terao" +136,Casino,8.16384693356473,1995,"Martin Scorsese (dir.), Robert De Niro, Sharon Stone" +137,Pan's Labyrinth,8.162216796596542,2006,"Guillermo del Toro (dir.), Ivana Baquero, Ariadna Gil" +138,Unforgiven,8.161285749661333,1992,"Clint Eastwood (dir.), Clint Eastwood, Gene Hackman" +139,There Will Be Blood,8.158139227908475,2007,"Paul Thomas Anderson (dir.), Daniel Day-Lewis, Paul Dano" +140,The Truman Show,8.156133825512999,1998,"Peter Weir (dir.), Jim Carrey, Ed Harris" +141,Spider-Man: No Way Home,8.154271501504828,2021,"Jon Watts (dir.), Tom Holland, Zendaya" +142,The Sixth Sense,8.153644018061344,1999,"M. 
Night Shyamalan (dir.), Bruce Willis, Haley Joel Osment" +143,A Beautiful Mind,8.151958642702523,2001,"Ron Howard (dir.), Russell Crowe, Ed Harris" +144,Yôjinbô,8.149441946227604,1961,"Akira Kurosawa (dir.), Toshirô Mifune, Eijirô Tôno" +145,Monty Python and the Holy Grail,8.149418337645502,1975,"Terry Gilliam (dir.), Graham Chapman, John Cleese" +146,Shutter Island,8.147920850516051,2010,"Martin Scorsese (dir.), Leonardo DiCaprio, Emily Mortimer" +147,The Treasure of the Sierra Madre,8.147899273502375,1948,"John Huston (dir.), Humphrey Bogart, Walter Huston" +148,Jurassic Park,8.145815384957087,1993,"Steven Spielberg (dir.), Sam Neill, Laura Dern" +149,Rashômon,8.141873464083456,1950,"Akira Kurosawa (dir.), Toshirô Mifune, Machiko Kyô" +150,The Great Escape,8.141454504516688,1963,"John Sturges (dir.), Steve McQueen, James Garner" +151,Kill Bill: Vol 1,8.137930323856532,2003,"Quentin Tarantino (dir.), Uma Thurman, David Carradine" +152,No Country for Old Men,8.137294099145311,2007,"Ethan Coen (dir.), Tommy Lee Jones, Javier Bardem" +153,Finding Nemo,8.131489521838844,2003,"Andrew Stanton (dir.), Albert Brooks, Ellen DeGeneres" +154,The Elephant Man,8.129687394303057,1980,"David Lynch (dir.), Anthony Hopkins, John Hurt" +155,The Thing,8.129630076311827,1982,"John Carpenter (dir.), Kurt Russell, Wilford Brimley" +156,Chinatown,8.128352284641188,1974,"Roman Polanski (dir.), Jack Nicholson, Faye Dunaway" +157,Raging Bull,8.127333632413476,1980,"Martin Scorsese (dir.), Robert De Niro, Cathy Moriarty" +158,Gone with the Wind,8.124456666611811,1939,"Victor Fleming (dir.), Clark Gable, Vivien Leigh" +159,V for Vendetta,8.12424187910994,2005,"James McTeigue (dir.), Hugo Weaving, Natalie Portman" +160,Inside Out,8.122570067781727,2015,"Pete Docter (dir.), Amy Poehler, Bill Hader" +161,"Lock, Stock and Two Smoking Barrels",8.12173025139722,1998,"Guy Ritchie (dir.), Jason Flemyng, Dexter Fletcher" +162,Dial M for Murder,8.119878686504563,1954,"Alfred Hitchcock (dir.), Ray 
Milland, Grace Kelly" +163,El secreto de sus ojos,8.117651293315738,2009,"Juan José Campanella (dir.), Ricardo Darín, Soledad Villamil" +164,Hauru no ugoku shiro,8.115624825415054,2004,"Hayao Miyazaki (dir.), Chieko Baishô, Takuya Kimura" +165,The Bridge on the River Kwai,8.112312089657408,1957,"David Lean (dir.), William Holden, Alec Guinness" +166,"Three Billboards Outside Ebbing, Missouri",8.11180581282161,2017,"Martin McDonagh (dir.), Frances McDormand, Woody Harrelson" +167,Trainspotting,8.111012714060038,1996,"Danny Boyle (dir.), Ewan McGregor, Ewen Bremner" +168,Warrior,8.103573815451904,2011,"Gavin O'Connor (dir.), Tom Hardy, Nick Nolte" +169,Gran Torino,8.102946223213968,2008,"Clint Eastwood (dir.), Clint Eastwood, Bee Vang" +170,Fargo,8.102476828261098,1996,"Joel Coen (dir.), William H. Macy, Frances McDormand" +171,Prisoners,8.100260206669939,2013,"Denis Villeneuve (dir.), Hugh Jackman, Jake Gyllenhaal" +172,Tonari no Totoro,8.093760524076421,1988,"Hayao Miyazaki (dir.), Hitoshi Takagi, Noriko Hidaka" +173,Million Dollar Baby,8.089354641611278,2004,"Clint Eastwood (dir.), Hilary Swank, Clint Eastwood" +174,Catch Me If You Can,8.088688040707636,2002,"Steven Spielberg (dir.), Leonardo DiCaprio, Tom Hanks" +175,The Gold Rush,8.08630381102749,1925,"Charles Chaplin (dir.), Charles Chaplin, Mack Swain" +176,Bacheha-Ye aseman,8.085742862289964,1997,"Majid Majidi (dir.), Mohammad Amir Naji, Amir Farrokh Hashemian" +177,Blade Runner,8.08512367471186,1982,"Ridley Scott (dir.), Harrison Ford, Rutger Hauer" +178,On the Waterfront,8.082300380081083,1954,"Elia Kazan (dir.), Marlon Brando, Karl Malden" +179,12 Years a Slave,8.079856793348362,2013,"Steve McQueen (dir.), Chiwetel Ejiofor, Michael Kenneth Williams" +180,Before Sunrise,8.079848472748038,1995,"Richard Linklater (dir.), Ethan Hawke, Julie Delpy" +181,The Third Man,8.079374406547796,1949,"Carol Reed (dir.), Orson Welles, Joseph Cotten" +182,Smultronstället,8.078607432909374,1957,"Ingmar Bergman (dir.), Victor 
Sjöström, Bibi Andersson" +183,Harry Potter and the Deathly Hallows: Part 2,8.078244849335574,2011,"David Yates (dir.), Daniel Radcliffe, Emma Watson" +184,Ben-Hur,8.077815479798078,1959,"William Wyler (dir.), Charlton Heston, Jack Hawkins" +185,The General,8.07725341901528,1926,"Clyde Bruckman (dir.), Buster Keaton, Marion Mack" +186,Gone Girl,8.077053402716771,2014,"David Fincher (dir.), Ben Affleck, Rosamund Pike" +187,The Deer Hunter,8.075143836236032,1978,"Michael Cimino (dir.), Robert De Niro, Christopher Walken" +188,The Grand Budapest Hotel,8.074432324406573,2014,"Wes Anderson (dir.), Ralph Fiennes, F. Murray Abraham" +189,In the Name of the Father,8.074001896468923,1993,"Jim Sheridan (dir.), Daniel Day-Lewis, Pete Postlethwaite" +190,Barry Lyndon,8.073307191432082,1975,"Stanley Kubrick (dir.), Ryan O'Neal, Marisa Berenson" +191,Le salaire de la peur,8.071867620825236,1953,"Henri-Georges Clouzot (dir.), Yves Montand, Charles Vanel" +192,Sherlock Jr,8.069182202089088,1924,"Buster Keaton (dir.), Buster Keaton, Kathryn McGuire" +193,Mr Smith Goes to Washington,8.06915181187886,1939,"Frank Capra (dir.), James Stewart, Jean Arthur" +194,Klaus,8.068841487089509,2019,"Sergio Pablos (dir.), Jason Schwartzman, J.K. 
Simmons" +195,Hacksaw Ridge,8.068833473421833,2016,"Mel Gibson (dir.), Andrew Garfield, Sam Worthington" +196,Salinui chueok,8.068460190213838,2003,"Bong Joon Ho (dir.), Song Kang-ho, Kim Sang-kyung" +197,Relatos salvajes,8.066744033091398,2014,"Damián Szifron (dir.), Darío Grandinetti, María Marull" +198,Det sjunde inseglet,8.065430978302158,1957,"Ingmar Bergman (dir.), Max von Sydow, Gunnar Björnstrand" +199,Room,8.063938187223517,2015,"Lenny Abrahamson (dir.), Brie Larson, Jacob Tremblay" +200,Mad Max: Fury Road,8.063343714785574,2015,"George Miller (dir.), Tom Hardy, Charlize Theron" +201,Mary and Max,8.061811350659532,2009,"Adam Elliot (dir.), Toni Collette, Philip Seymour Hoffman" +202,How to Train Your Dragon,8.061497205303745,2010,"Dean DeBlois (dir.), Jay Baruchel, Gerard Butler" +203,The Big Lebowski,8.060531219315328,1998,"Joel Coen (dir.), Jeff Bridges, John Goodman" +204,"Monsters, Inc",8.059667990461328,2001,"Pete Docter (dir.), Billy Crystal, John Goodman" +205,Jaws,8.0595308057808,1975,"Steven Spielberg (dir.), Roy Scheider, Robert Shaw" +206,Tôkyô monogatari,8.056986153500892,1953,"Yasujirô Ozu (dir.), Chishû Ryû, Chieko Higashiyama" +207,La passion de Jeanne d'Arc,8.056015533653978,1928,"Carl Theodor Dreyer (dir.), Maria Falconetti, Eugene Silvain" +208,Dead Poets Society,8.055487981598707,1989,"Peter Weir (dir.), Robin Williams, Robert Sean Leonard" +209,Hotel Rwanda,8.051682768802205,2004,"Terry George (dir.), Don Cheadle, Sophie Okonedo" +210,Ford v Ferrari,8.047474874327822,2019,"James Mangold (dir.), Matt Damon, Christian Bale" +211,Rocky,8.046544605623975,1976,"John G. 
Avildsen (dir.), Sylvester Stallone, Talia Shire" +212,Platoon,8.045946390941978,1986,"Oliver Stone (dir.), Charlie Sheen, Tom Berenger" +213,Stand by Me,8.040321912000634,1986,"Rob Reiner (dir.), Wil Wheaton, River Phoenix" +214,Pather Panchali,8.040246837371546,1955,"Satyajit Ray (dir.), Kanu Bannerjee, Karuna Bannerjee" +215,The Terminator,8.040158995355188,1984,"James Cameron (dir.), Arnold Schwarzenegger, Linda Hamilton" +216,Spotlight,8.04003040240906,2015,"Tom McCarthy (dir.), Mark Ruffalo, Michael Keaton" +217,Logan,8.038010113121434,2017,"James Mangold (dir.), Hugh Jackman, Patrick Stewart" +218,Rush,8.037705957537115,2013,"Ron Howard (dir.), Daniel Brühl, Chris Hemsworth" +219,Ratatouille,8.037216148638704,2007,"Brad Bird (dir.), Brad Garrett, Lou Romano" +220,Network,8.036234010584907,1976,"Sidney Lumet (dir.), Faye Dunaway, William Holden" +221,Into the Wild,8.034616300670839,2007,"Sean Penn (dir.), Emile Hirsch, Vince Vaughn" +222,Everything Everywhere All at Once,8.034103724035578,2022,"Dan Kwan (dir.), Michelle Yeoh, Stephanie Hsu" +223,The Wizard of Oz,8.032405154395828,1939,"Victor Fleming (dir.), Judy Garland, Frank Morgan" +224,Before Sunset,8.03077024373811,2004,"Richard Linklater (dir.), Ethan Hawke, Julie Delpy" +225,Groundhog Day,8.029212910376621,1993,"Harold Ramis (dir.), Bill Murray, Andie MacDowell" +226,The Exorcist,8.027624182007811,1973,"William Friedkin (dir.), Ellen Burstyn, Max von Sydow" +227,Jai Bhim,8.027076286702933,2021,"T.J. Gnanavel (dir.), Suriya, Lijo Mol Jose" +228,The Best Years of Our Lives,8.025182051180233,1946,"William Wyler (dir.), Myrna Loy, Dana Andrews" +229,The Incredibles,8.02511110727724,2004,"Brad Bird (dir.), Craig T. Nelson, Samuel L. 
Jackson" +230,To Be or Not to Be,8.025020325839856,1942,"Ernst Lubitsch (dir.), Carole Lombard, Jack Benny" +231,La battaglia di Algeri,8.02430455669616,1966,"Gillo Pontecorvo (dir.), Brahim Hadjadj, Jean Martin" +232,Hachi: A Dog's Tale,8.02243899720676,2009,"Lasse Hallström (dir.), Richard Gere, Joan Allen" +233,The Grapes of Wrath,8.02146531567852,1940,"John Ford (dir.), Henry Fonda, Jane Darwell" +234,Rebecca,8.021406112274061,1940,"Alfred Hitchcock (dir.), Laurence Olivier, Joan Fontaine" +235,Pirates of the Caribbean: The Curse of the Black Pearl,8.021137206786229,2003,"Gore Verbinski (dir.), Johnny Depp, Geoffrey Rush" +236,Amores perros,8.021048633968682,2000,"Alejandro G. Iñárritu (dir.), Emilio Echevarría, Gael García Bernal" +237,Babam ve Oglum,8.020817645877138,2005,"Çagan Irmak (dir.), Çetin Tekindor, Fikret Kuskan" +238,La haine,8.02048531313721,1995,"Mathieu Kassovitz (dir.), Vincent Cassel, Hubert Koundé" +239,Cool Hand Luke,8.019859704116232,1967,"Stuart Rosenberg (dir.), Paul Newman, George Kennedy" +240,Les quatre cents coups,8.016215939497515,1959,"François Truffaut (dir.), Jean-Pierre Léaud, Albert Rémy" +241,Persona,8.014912330620977,1966,"Ingmar Bergman (dir.), Bibi Andersson, Liv Ullmann" +242,Ah-ga-ssi,8.013566726616054,2016,"Park Chan-wook (dir.), Kim Min-hee, Ha Jung-woo" +243,It Happened One Night,8.013124254730636,1934,"Frank Capra (dir.), Clark Gable, Claudette Colbert" +244,The Sound of Music,8.012883390986223,1965,"Robert Wise (dir.), Julie Andrews, Christopher Plummer" +245,Life of Brian,8.01243613072654,1979,"Terry Jones (dir.), Graham Chapman, John Cleese" +246,Dersu Uzala,8.008622707042678,1975,"Akira Kurosawa (dir.), Maksim Munzuk, Yuriy Solomin" +247,The Help,8.004953799401568,2011,"Tate Taylor (dir.), Viola Davis, Emma Stone" +248,Gandhi,8.004866178479936,1982,"Richard Attenborough (dir.), Ben Kingsley, John Gielgud" +249,Aladdin,8.004818115680994,1992,"Ron Clements (dir.), Scott Weinger, Robin Williams" +250,The Iron 
Giant,8.003732372543244,1999,"Brad Bird (dir.), Eli Marienthal, Harry Connick Jr." diff --git a/scripts/Script to fetch top IMBD listed movies/requirements.txt b/scripts/Script to fetch top IMBD listed movies/requirements.txt new file mode 100644 index 0000000..f8b61a8 --- /dev/null +++ b/scripts/Script to fetch top IMBD listed movies/requirements.txt @@ -0,0 +1,3 @@ +requests +beautifulsoup4 +pandas \ No newline at end of file diff --git a/scripts/Simple Sentiment analysis using spacy/sentiment_analysis.ipynb b/scripts/Simple Sentiment analysis using spacy/sentiment_analysis.ipynb new file mode 100644 index 0000000..d6f3c7d --- /dev/null +++ b/scripts/Simple Sentiment analysis using spacy/sentiment_analysis.ipynb @@ -0,0 +1,138 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [], + "collapsed_sections": [] + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + } + }, + "cells": [ + { + "cell_type": "code", + "execution_count": 14, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "Cd5CzPSIVspD", + "outputId": "0edab2ce-0706-440c-be56-752051c6095b" + }, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n", + "Collecting spacytextblob\n", + " Downloading spacytextblob-4.0.0-py3-none-any.whl (4.5 kB)\n", + "Requirement already satisfied: spacy<4.0,>=3.0 in /usr/local/lib/python3.7/dist-packages (from spacytextblob) (3.4.2)\n", + "Requirement already satisfied: textblob<0.16.0,>=0.15.3 in /usr/local/lib/python3.7/dist-packages (from spacytextblob) (0.15.3)\n", + "Requirement already satisfied: typer<0.5.0,>=0.3.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (0.4.2)\n", + "Requirement already satisfied: wasabi<1.1.0,>=0.9.1 in /usr/local/lib/python3.7/dist-packages
(from spacy<4.0,>=3.0->spacytextblob) (0.10.1)\n", + "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (2.0.7)\n", + "Requirement already satisfied: typing-extensions<4.2.0,>=3.7.4 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (4.1.1)\n", + "Requirement already satisfied: srsly<3.0.0,>=2.4.3 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (2.4.5)\n", + "Requirement already satisfied: setuptools in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (57.4.0)\n", + "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (21.3)\n", + "Requirement already satisfied: pathy>=0.3.5 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (0.6.2)\n", + "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (1.0.9)\n", + "Requirement already satisfied: jinja2 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (2.11.3)\n", + "Requirement already satisfied: pydantic!=1.8,!=1.8.1,<1.11.0,>=1.7.4 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (1.10.2)\n", + "Requirement already satisfied: spacy-loggers<2.0.0,>=1.0.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (1.0.3)\n", + "Requirement already satisfied: thinc<8.2.0,>=8.1.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (8.1.5)\n", + "Requirement already satisfied: catalogue<2.1.0,>=2.0.6 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (2.0.8)\n", + "Requirement already satisfied: requests<3.0.0,>=2.13.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (2.23.0)\n", + "Requirement already 
satisfied: langcodes<4.0.0,>=3.2.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (3.3.0)\n", + "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (4.64.1)\n", + "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.10 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (3.0.10)\n", + "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (3.0.8)\n", + "Requirement already satisfied: numpy>=1.15.0 in /usr/local/lib/python3.7/dist-packages (from spacy<4.0,>=3.0->spacytextblob) (1.21.6)\n", + "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from catalogue<2.1.0,>=2.0.6->spacy<4.0,>=3.0->spacytextblob) (3.10.0)\n", + "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /usr/local/lib/python3.7/dist-packages (from packaging>=20.0->spacy<4.0,>=3.0->spacytextblob) (3.0.9)\n", + "Requirement already satisfied: smart-open<6.0.0,>=5.2.1 in /usr/local/lib/python3.7/dist-packages (from pathy>=0.3.5->spacy<4.0,>=3.0->spacytextblob) (5.2.1)\n", + "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests<3.0.0,>=2.13.0->spacy<4.0,>=3.0->spacytextblob) (2.10)\n", + "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests<3.0.0,>=2.13.0->spacy<4.0,>=3.0->spacytextblob) (1.24.3)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests<3.0.0,>=2.13.0->spacy<4.0,>=3.0->spacytextblob) (2022.9.24)\n", + "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests<3.0.0,>=2.13.0->spacy<4.0,>=3.0->spacytextblob) (3.0.4)\n", + "Requirement already satisfied: nltk>=3.1 in /usr/local/lib/python3.7/dist-packages 
(from textblob<0.16.0,>=0.15.3->spacytextblob) (3.7)\n", + "Requirement already satisfied: joblib in /usr/local/lib/python3.7/dist-packages (from nltk>=3.1->textblob<0.16.0,>=0.15.3->spacytextblob) (1.2.0)\n", + "Requirement already satisfied: click in /usr/local/lib/python3.7/dist-packages (from nltk>=3.1->textblob<0.16.0,>=0.15.3->spacytextblob) (7.1.2)\n", + "Requirement already satisfied: regex>=2021.8.3 in /usr/local/lib/python3.7/dist-packages (from nltk>=3.1->textblob<0.16.0,>=0.15.3->spacytextblob) (2022.6.2)\n", + "Requirement already satisfied: blis<0.8.0,>=0.7.8 in /usr/local/lib/python3.7/dist-packages (from thinc<8.2.0,>=8.1.0->spacy<4.0,>=3.0->spacytextblob) (0.7.9)\n", + "Requirement already satisfied: confection<1.0.0,>=0.0.1 in /usr/local/lib/python3.7/dist-packages (from thinc<8.2.0,>=8.1.0->spacy<4.0,>=3.0->spacytextblob) (0.0.3)\n", + "Requirement already satisfied: MarkupSafe>=0.23 in /usr/local/lib/python3.7/dist-packages (from jinja2->spacy<4.0,>=3.0->spacytextblob) (2.0.1)\n", + "Installing collected packages: spacytextblob\n", + "Successfully installed spacytextblob-4.0.0\n" + ] + } + ], + "source": [ + "import spacy\n", + "!pip install spacytextblob" + ] + }, + { + "cell_type": "code", + "source": [ + "# Sample Texts\n", + "text_1 = \"I enjoy learning new stuff\"\n", + "text_2 = \"Yesterday was an amazing day\"\n", + "text_3 = \"The service at that store is bad\"\n", + "\n", + "texts = [text_1, text_2, text_3]" + ], + "metadata": { + "id": "9MhsKRgKXWWV" + }, + "execution_count": 16, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "import spacy\n", + "from spacytextblob.spacytextblob import SpacyTextBlob\n", + "nlp = spacy.load(\"en_core_web_sm\")\n", + "nlp.add_pipe(\"spacytextblob\")\n", + "\n", + "for text in texts:\n", + " doc = nlp(text)\n", + " print(f\"Text: {text}\\nSentiment_Analysis: {doc._.blob.polarity}, Subjectivity_Analysis: {doc._.blob.subjectivity}\")\n", + " 
print(\"=====================================================\")" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "MBNCVNjgXFxd", + "outputId": "29a4f7c8-fa9b-4bbd-beb9-f8c2d798bd05" + }, + "execution_count": 17, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Text: I enjoy learning new stuff\n", + "Sentiment_Analysis: 0.2681818181818182, Subjectivity_Analysis: 0.4772727272727273\n", + "=====================================================\n", + "Text: Yesterday was an amazing day\n", + "Sentiment_Analysis: 0.6000000000000001, Subjectivity_Analysis: 0.9\n", + "=====================================================\n", + "Text: The service at that store is bad\n", + "Sentiment_Analysis: -0.6999999999999998, Subjectivity_Analysis: 0.6666666666666666\n", + "=====================================================\n" + ] + } + ] + } + ] +} \ No newline at end of file