{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [], "authorship_tag": "ABX9TyN152Nrbyyqur9dFEmcG/dR", "include_colab_link": true }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "widgets": { "application/vnd.jupyter.widget-state+json": { "00e8d3fcbf2d458bafe70cc30d0f4d71": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_d7bf9f7e23424722ad51e66bb3d31f44", "IPY_MODEL_c9bd1206b2994609bd8b24dc3c886c3d", "IPY_MODEL_4d820a0721284de4be381f6bbe7c65d1" ], "layout": "IPY_MODEL_0dd480987916438a9035503b9239bf40" } }, "d7bf9f7e23424722ad51e66bb3d31f44": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_37023318069b4eef84f3d260f1ac50b0", "placeholder": "​", "style": "IPY_MODEL_c1b27f95737543d0986adf61b65727b6", "value": "Downloading (…)lve/main/config.json: 100%" } }, "c9bd1206b2994609bd8b24dc3c886c3d": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": 
"1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_46f00edbac234bbf8338cf348a1bcfbd", "max": 953, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_0d658060ac90494cb1919f07f0e9997a", "value": 953 } }, "4d820a0721284de4be381f6bbe7c65d1": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4d781dd1856e4ef7bbb61c2499fa877e", "placeholder": "​", "style": "IPY_MODEL_4196b57142dd48a886a9ace940eb0576", "value": " 953/953 [00:00<00:00, 13.4kB/s]" } }, "0dd480987916438a9035503b9239bf40": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, 
"right": null, "top": null, "visibility": null, "width": null } }, "37023318069b4eef84f3d260f1ac50b0": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "c1b27f95737543d0986adf61b65727b6": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "46f00edbac234bbf8338cf348a1bcfbd": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "0d658060ac90494cb1919f07f0e9997a": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "4d781dd1856e4ef7bbb61c2499fa877e": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": 
null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "4196b57142dd48a886a9ace940eb0576": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "cefb3a3a50df4328a3e1aa60badada6a": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_33e5462c902a4b288a2ae70f2969e45c", "IPY_MODEL_d343de84a884458ea45ae9165403ed4f", "IPY_MODEL_44906a4d83194bbb93b9c2baf26488b0" ], "layout": "IPY_MODEL_0833d76a8409412783b717428133224c" } }, "33e5462c902a4b288a2ae70f2969e45c": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_342fb5d6c1cf4e2ba8bfce1399e31220", "placeholder": "​", "style": 
"IPY_MODEL_2edb942445304bbf9b0459e5fa90e65a", "value": "Downloading (…)\"pytorch_model.bin\";: 100%" } }, "d343de84a884458ea45ae9165403ed4f": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_526ee09f2d484dcb847749a9783c988a", "max": 669491321, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_2654938824504c94b4df4e611c1ef86b", "value": 669491321 } }, "44906a4d83194bbb93b9c2baf26488b0": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4abeac3a7e5d4509bfe8f641c1a1282a", "placeholder": "​", "style": "IPY_MODEL_45c0f75862b342929e079aba2c4ac4b0", "value": " 669M/669M [00:14<00:00, 38.4MB/s]" } }, "0833d76a8409412783b717428133224c": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, 
"grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "342fb5d6c1cf4e2ba8bfce1399e31220": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "2edb942445304bbf9b0459e5fa90e65a": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "526ee09f2d484dcb847749a9783c988a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "2654938824504c94b4df4e611c1ef86b": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "4abeac3a7e5d4509bfe8f641c1a1282a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", 
"_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "45c0f75862b342929e079aba2c4ac4b0": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "3e3c80723f5f4711ac0c227236a1a201": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_408426c5dcf04f8082ec780d29029c70", "IPY_MODEL_435c05a24bf54d9cb91a3b4f2e9090d2", "IPY_MODEL_0e7711bc07e64d85b7ac8abc860a58ce" ], "layout": "IPY_MODEL_1e2a62f855e3494bb57a648336928846" } }, 
"408426c5dcf04f8082ec780d29029c70": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3c8df1db53ff4b43b8ccf14254f85d8f", "placeholder": "​", "style": "IPY_MODEL_7b60fcabf8a043aa8d89acafe180a4b3", "value": "Downloading (…)okenizer_config.json: 100%" } }, "435c05a24bf54d9cb91a3b4f2e9090d2": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_96b7996fb677443ba8c1069462715117", "max": 39, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_b567696494c34339ab1ae5aa8c181dcd", "value": 39 } }, "0e7711bc07e64d85b7ac8abc860a58ce": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_14ed949745fb4da48ff76534a5bc717d", "placeholder": "​", "style": "IPY_MODEL_2b937004c5d84052847af445e97f6bf1", "value": " 39.0/39.0 [00:00<00:00, 1.39kB/s]" } }, "1e2a62f855e3494bb57a648336928846": { 
"model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3c8df1db53ff4b43b8ccf14254f85d8f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": 
null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "7b60fcabf8a043aa8d89acafe180a4b3": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "96b7996fb677443ba8c1069462715117": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "b567696494c34339ab1ae5aa8c181dcd": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { 
"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "14ed949745fb4da48ff76534a5bc717d": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "2b937004c5d84052847af445e97f6bf1": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "455ed1b6ed1b46de9c0ae7bf7ec96610": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": 
"1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_1fe1ce8e634c4126af673f8944c04f0a", "IPY_MODEL_049258c530914ffc94d1e7b094200a82", "IPY_MODEL_7e8e512bba0f420d952111be7118ae32" ], "layout": "IPY_MODEL_e931fbbdaa8043b6b13e2ef99932df1b" } }, "1fe1ce8e634c4126af673f8944c04f0a": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cd9851e4c27c403b97b86627894da956", "placeholder": "​", "style": "IPY_MODEL_3db33dafa4064615ac12ba02bab0912f", "value": "Downloading (…)solve/main/vocab.txt: 100%" } }, "049258c530914ffc94d1e7b094200a82": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8fcb8f329cac4c688c5cfd2c00bb6cc0", "max": 871891, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_fddeb9d892fe47b4accd3d0b9ea6c71d", "value": 871891 } }, "7e8e512bba0f420d952111be7118ae32": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { 
"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c68fe70b5a464fb39f42595edd5eccb3", "placeholder": "​", "style": "IPY_MODEL_99715c01e04c4d55b5a3fd37a9f1a09b", "value": " 872k/872k [00:00<00:00, 1.92MB/s]" } }, "e931fbbdaa8043b6b13e2ef99932df1b": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "cd9851e4c27c403b97b86627894da956": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": 
"LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3db33dafa4064615ac12ba02bab0912f": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "8fcb8f329cac4c688c5cfd2c00bb6cc0": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, 
"justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "fddeb9d892fe47b4accd3d0b9ea6c71d": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "c68fe70b5a464fb39f42595edd5eccb3": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "99715c01e04c4d55b5a3fd37a9f1a09b": { 
"model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "5045cfb8d210405ea681b5a5aedd81c3": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_602e280b413a44f6b3fb594441e7c20b", "IPY_MODEL_c99995914494484c877419709f18b27d", "IPY_MODEL_e6ed602ce673438ba07f7c6cafdf38bf" ], "layout": "IPY_MODEL_40c6cca6491f40558168c9e3b1b122e9" } }, "602e280b413a44f6b3fb594441e7c20b": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_06e4ef984cae41669bb2639ebcd37725", "placeholder": "​", "style": "IPY_MODEL_765d919a626f41679c39eee4c13f6c44", "value": "Downloading (…)cial_tokens_map.json: 100%" } }, "c99995914494484c877419709f18b27d": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_58979a1334ab4f16b18d6113f403e931", "max": 112, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_e9f24b5c29ed416aadaddba33892e140", "value": 112 } }, "e6ed602ce673438ba07f7c6cafdf38bf": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e90ae2754c0441aa8a98c76034d4dc00", "placeholder": "​", "style": "IPY_MODEL_6237552000bc4a57a62f677b3027d909", "value": " 112/112 [00:00<00:00, 5.62kB/s]" } }, "40c6cca6491f40558168c9e3b1b122e9": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, 
"overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "06e4ef984cae41669bb2639ebcd37725": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "765d919a626f41679c39eee4c13f6c44": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "58979a1334ab4f16b18d6113f403e931": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "e9f24b5c29ed416aadaddba33892e140": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "e90ae2754c0441aa8a98c76034d4dc00": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, 
"grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "6237552000bc4a57a62f677b3027d909": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } } } } }, "cells": [ { "cell_type": "markdown", "metadata": { "id": "view-in-github", "colab_type": "text" }, "source": [ "\"Open" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "wQW6K0obfV9V", "outputId": "779eeeb4-20c4-49b2-d9c3-3947cc032cda" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n", "Requirement already satisfied: kaggle in /usr/local/lib/python3.8/dist-packages (1.5.12)\n", "Requirement already satisfied: certifi in /usr/local/lib/python3.8/dist-packages (from kaggle) (2022.12.7)\n", "Requirement already satisfied: six>=1.10 in /usr/local/lib/python3.8/dist-packages (from kaggle) (1.15.0)\n", "Requirement already satisfied: python-slugify in /usr/local/lib/python3.8/dist-packages (from kaggle) (8.0.1)\n", "Requirement already satisfied: tqdm in /usr/local/lib/python3.8/dist-packages (from kaggle) (4.64.1)\n", "Requirement already satisfied: requests in 
/usr/local/lib/python3.8/dist-packages (from kaggle) (2.25.1)\n", "Requirement already satisfied: urllib3 in /usr/local/lib/python3.8/dist-packages (from kaggle) (1.26.14)\n", "Requirement already satisfied: python-dateutil in /usr/local/lib/python3.8/dist-packages (from kaggle) (2.8.2)\n", "Requirement already satisfied: text-unidecode>=1.3 in /usr/local/lib/python3.8/dist-packages (from python-slugify->kaggle) (1.3)\n", "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.8/dist-packages (from requests->kaggle) (2.10)\n", "Requirement already satisfied: chardet<5,>=3.0.2 in /usr/local/lib/python3.8/dist-packages (from requests->kaggle) (4.0.0)\n" ] } ], "source": [ "# install kaggle to use kaggle sample data sets\n", "!pip install kaggle" ] }, { "cell_type": "code", "source": [ "!mkdir ~/.kaggle" ], "metadata": { "id": "jkuj__QBf1pB" }, "execution_count": 2, "outputs": [] }, { "cell_type": "code", "source": [ "# import the main libraries\n", "import pandas as pd\n", "import seaborn as sns\n", "import matplotlib.pyplot as plt" ], "metadata": { "id": "xXDJXFjOgjK4" }, "execution_count": 3, "outputs": [] }, { "cell_type": "code", "source": [ "# download lexicon to work with pretrained text data\n", "import nltk\n", "nltk.download('vader_lexicon')" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "DGyvjkSiprJi", "outputId": "bdf5a157-8c18-4b36-92be-4bc0afafa427" }, "execution_count": 4, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "[nltk_data] Downloading package vader_lexicon to /root/nltk_data...\n" ] }, { "output_type": "execute_result", "data": { "text/plain": [ "True" ] }, "metadata": {}, "execution_count": 4 } ] }, { "cell_type": "code", "source": [ "# import e.g. 
sentiment analyzer to categorise reviews\n", "from nltk.sentiment.vader import SentimentIntensityAnalyzer\n", "sentiments = SentimentIntensityAnalyzer()" ], "metadata": { "id": "CadX-IbPpWjl" }, "execution_count": 5, "outputs": [] }, { "cell_type": "code", "source": [ "# use e.g. the available Hotel_Reviews.csv file, download from kaggle or from https://github.com/spribylova/Python_Hotels\n", "# data = pd.read_csv(\"Hotel_Reviews.csv\")" ], "metadata": { "id": "jOGcID0Ope52" }, "execution_count": 6, "outputs": [] }, { "cell_type": "code", "source": [ "import pandas as pd\n", "url = \"https://raw.githubusercontent.com/spribylova/Python_Text_Sentiment/main/Hotel_Reviews.csv\"\n", "data = pd.read_csv(url)\n", "data" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 964 }, "id": "DJCPfxkJLnLB", "outputId": "5d7bc236-1dbe-47be-fc3c-65e4c782753e" }, "execution_count": 7, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " address \\\n", "0 Riviera San Nicol 11/a \n", "1 Riviera San Nicol 11/a \n", "2 Riviera San Nicol 11/a \n", "3 Riviera San Nicol 11/a \n", "4 Riviera San Nicol 11/a \n", "... ... \n", "35907 1088 Powdermill Rd \n", "35908 1088 Powdermill Rd \n", "35909 1088 Powdermill Rd \n", "35910 3747 29th St S E \n", "35911 3747 29th St S E \n", "\n", " categories city \\\n", "0 Hotels Mableton \n", "1 Hotels Mableton \n", "2 Hotels Mableton \n", "3 Hotels Mableton \n", "4 Hotels Mableton \n", "... ... ... \n", "35907 Cabins,Resorts & Vacation Cottages,Wedding Cha... Gatlinburg \n", "35908 Cabins,Resorts & Vacation Cottages,Wedding Cha... Gatlinburg \n", "35909 Cabins,Resorts & Vacation Cottages,Wedding Cha... 
Gatlinburg \n", "35910 Hotels-Apartment,Corporate Lodging,Hotels,Lodging Grand Rapids \n", "35911 Hotels-Apartment,Corporate Lodging,Hotels,Lodging Grand Rapids \n", "\n", " country latitude longitude \\\n", "0 US 45.421611 12.376187 \n", "1 US 45.421611 12.376187 \n", "2 US 45.421611 12.376187 \n", "3 US 45.421611 12.376187 \n", "4 US 45.421611 12.376187 \n", "... ... ... ... \n", "35907 US 35.754868 -83.457295 \n", "35908 US 35.754868 -83.457295 \n", "35909 US 35.754868 -83.457295 \n", "35910 US 42.909480 -85.573590 \n", "35911 US 42.909480 -85.573590 \n", "\n", " name postalCode province \\\n", "0 Hotel Russo Palace 30126 GA \n", "1 Hotel Russo Palace 30126 GA \n", "2 Hotel Russo Palace 30126 GA \n", "3 Hotel Russo Palace 30126 GA \n", "4 Hotel Russo Palace 30126 GA \n", "... ... ... ... \n", "35907 Elk Springs Resort 37738 TN \n", "35908 Elk Springs Resort 37738 TN \n", "35909 Elk Springs Resort 37738 TN \n", "35910 Extended Stay America Grand Rapids - Kentwood 49512 MI \n", "35911 Extended Stay America Grand Rapids - Kentwood 49512 MI \n", "\n", " reviews.date reviews.dateAdded reviews.doRecommend \\\n", "0 2013-09-22T00:00:00Z 2016-10-24T00:00:25Z NaN \n", "1 2015-04-03T00:00:00Z 2016-10-24T00:00:25Z NaN \n", "2 2014-05-13T00:00:00Z 2016-10-24T00:00:25Z NaN \n", "3 2013-10-27T00:00:00Z 2016-10-24T00:00:25Z NaN \n", "4 2015-03-05T00:00:00Z 2016-10-24T00:00:25Z NaN \n", "... ... ... ... \n", "35907 2012-03-20T00:00:00Z 2016-06-23T16:50:58Z NaN \n", "35908 2012-03-12T00:00:00Z 2016-06-23T16:50:58Z NaN \n", "35909 2015-11-03T00:00:00Z 2016-06-23T16:50:58Z NaN \n", "35910 NaN 2015-12-01T19:40:54Z NaN \n", "35911 NaN 2015-12-01T19:40:54Z NaN \n", "\n", " reviews.id reviews.rating \\\n", "0 NaN 4.0 \n", "1 NaN 5.0 \n", "2 NaN 5.0 \n", "3 NaN 5.0 \n", "4 NaN 5.0 \n", "... ... ... \n", "35907 NaN 5.0 \n", "35908 NaN 5.0 \n", "35909 NaN 5.0 \n", "35910 NaN 0.0 \n", "35911 NaN 0.0 \n", "\n", " reviews.text \\\n", "0 Pleasant 10 min walk along the sea front to th... 
\n", "1 Really lovely hotel. Stayed on the very top fl... \n", "2 Ett mycket bra hotell. Det som drog ner betyge... \n", "3 We stayed here for four nights in October. The... \n", "4 We stayed here for four nights in October. The... \n", "... ... \n", "35907 Best of the Best!!!! My family and I stayed in... \n", "35908 Amazing Vacation in Beautiful Cabin We stayed ... \n", "35909 My husband and I stayed at Tree Tops which is ... \n", "35910 to share your opinion of this businesswith YP ... \n", "35911 xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx \n", "\n", " reviews.title reviews.userCity reviews.username \\\n", "0 Good location away from the crouds NaN Russ (kent) \n", "1 Great hotel with Jacuzzi bath! NaN A Traveler \n", "2 Lugnt l��ge NaN Maud \n", "3 Good location on the Lido. NaN Julie \n", "4 ������ ��������������� NaN sungchul \n", "... ... ... ... \n", "35907 Amazing time (both times!!) Charlotte Chelsa K. \n", "35908 Amazing time (both times!!) Charlotte Heather D. \n", "35909 Amazing time (both times!!) Charlotte Carol W. \n", "35910 NaN NaN write a review \n", "35911 NaN NaN xxxxxxxxxxxxxx \n", "\n", " reviews.userProvince \n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "... ... \n", "35907 NC \n", "35908 NC \n", "35909 NC \n", "35910 NaN \n", "35911 NaN \n", "\n", "[35912 rows x 19 columns]" ], "text/html": [ "\n", "
\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
addresscategoriescitycountrylatitudelongitudenamepostalCodeprovincereviews.datereviews.dateAddedreviews.doRecommendreviews.idreviews.ratingreviews.textreviews.titlereviews.userCityreviews.usernamereviews.userProvince
0Riviera San Nicol 11/aHotelsMabletonUS45.42161112.376187Hotel Russo Palace30126GA2013-09-22T00:00:00Z2016-10-24T00:00:25ZNaNNaN4.0Pleasant 10 min walk along the sea front to th...Good location away from the croudsNaNRuss (kent)NaN
1Riviera San Nicol 11/aHotelsMabletonUS45.42161112.376187Hotel Russo Palace30126GA2015-04-03T00:00:00Z2016-10-24T00:00:25ZNaNNaN5.0Really lovely hotel. Stayed on the very top fl...Great hotel with Jacuzzi bath!NaNA TravelerNaN
2Riviera San Nicol 11/aHotelsMabletonUS45.42161112.376187Hotel Russo Palace30126GA2014-05-13T00:00:00Z2016-10-24T00:00:25ZNaNNaN5.0Ett mycket bra hotell. Det som drog ner betyge...Lugnt l��geNaNMaudNaN
3Riviera San Nicol 11/aHotelsMabletonUS45.42161112.376187Hotel Russo Palace30126GA2013-10-27T00:00:00Z2016-10-24T00:00:25ZNaNNaN5.0We stayed here for four nights in October. The...Good location on the Lido.NaNJulieNaN
4Riviera San Nicol 11/aHotelsMabletonUS45.42161112.376187Hotel Russo Palace30126GA2015-03-05T00:00:00Z2016-10-24T00:00:25ZNaNNaN5.0We stayed here for four nights in October. The...������ ���������������NaNsungchulNaN
............................................................
359071088 Powdermill RdCabins,Resorts & Vacation Cottages,Wedding Cha...GatlinburgUS35.754868-83.457295Elk Springs Resort37738TN2012-03-20T00:00:00Z2016-06-23T16:50:58ZNaNNaN5.0Best of the Best!!!! My family and I stayed in...Amazing time (both times!!)CharlotteChelsa K.NC
359081088 Powdermill RdCabins,Resorts & Vacation Cottages,Wedding Cha...GatlinburgUS35.754868-83.457295Elk Springs Resort37738TN2012-03-12T00:00:00Z2016-06-23T16:50:58ZNaNNaN5.0Amazing Vacation in Beautiful Cabin We stayed ...Amazing time (both times!!)CharlotteHeather D.NC
359091088 Powdermill RdCabins,Resorts & Vacation Cottages,Wedding Cha...GatlinburgUS35.754868-83.457295Elk Springs Resort37738TN2015-11-03T00:00:00Z2016-06-23T16:50:58ZNaNNaN5.0My husband and I stayed at Tree Tops which is ...Amazing time (both times!!)CharlotteCarol W.NC
359103747 29th St S EHotels-Apartment,Corporate Lodging,Hotels,LodgingGrand RapidsUS42.909480-85.573590Extended Stay America Grand Rapids - Kentwood49512MINaN2015-12-01T19:40:54ZNaNNaN0.0to share your opinion of this businesswith YP ...NaNNaNwrite a reviewNaN
359113747 29th St S EHotels-Apartment,Corporate Lodging,Hotels,LodgingGrand RapidsUS42.909480-85.573590Extended Stay America Grand Rapids - Kentwood49512MINaN2015-12-01T19:40:54ZNaNNaN0.0xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxNaNNaNxxxxxxxxxxxxxxNaN
\n", "

35912 rows × 19 columns

\n", "
\n", " \n", " \n", " \n", "\n", " \n", "
\n", "
\n", " " ] }, "metadata": {}, "execution_count": 7 } ] }, { "cell_type": "code", "source": [ "# the sample CSV file contains only one country value: US\n", "data[\"country\"].unique()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "7dcEw2OyQU_u", "outputId": "27b0f90e-aab0-4704-ed45-769e8946b782" }, "execution_count": 8, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "array(['US'], dtype=object)" ] }, "metadata": {}, "execution_count": 8 } ] }, { "cell_type": "code", "source": [ "# there are many unique US hotel names in the file\n", "data[\"name\"].unique()" ], "metadata": { "id": "kBHMcqUHQkHi", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "31ec5c66-546a-4b3f-c160-7e18310877bd" }, "execution_count": 9, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "array(['Hotel Russo Palace', 'Americas Best Value Inn', 'Intermezzo',\n", " 'Studio 6', 'Little Paradise Hotel', 'Comfort Suites',\n", " 'Thunderbird Executive Inn and Conference Center',\n", " 'Little Belt Inn Neihart',\n", " 'Hawthorn Suites By Wyndham Livermore Wine Country',\n", " 'Fairfield Inn By Marriott Binghamton', 'Howard Johnson',\n", " 'La Quinta', 'Days Inn El Reno Ok', 'Gresham Area Hotels',\n", " 'Berney Fly Bed and Breakfast', 'Polynesian Plaza',\n", " 'Hotel Vier Jahreszeiten KÜhlungsborn', 'The Point',\n", " 'The Houstonian Hotel', 'Best Western Plus Waterville Grand Hotel',\n", " 'The Amble Inn', 'Howard Johnson Inn Columbia',\n", " 'Osage Village Inn', 'Super 8 Columbia Dwntwn Sc',\n", " 'The Kingsport Inn',\n", " 'Azul Beach Hotel By Karisma Gourmet Inclusive', 'Red Roof Inn',\n", " 'Ocean Breeze Motel Apts', 'Days Inn Branson / Near The Strip',\n", " 'Country Lodge Motel', 'The Inn @ St. 
Botolph', 'Quality Inn',\n", " 'Comfort Suites Southport', 'Ramada', 'Ambassadors Inn and Suites',\n", " 'Tryp Dusseldorf Krefeld Hotel', 'Rodeway Inn',\n", " 'Centennial Bed and Breakfast',\n", " 'Americinn Lodge Suites Oscoda - Ausable River',\n", " 'Bridgetown Mill House Restaurant Inn', 'Gran Melia Victoria',\n", " 'Kaier Mansion', 'The National Conference Center',\n", " 'Holiday Inn Express & Suites Lenoir City (knoxville Area)',\n", " 'Manor Vail Lodge', 'Economy Inn',\n", " 'The Golden Hotel, An Ascend Hotel Collection Member',\n", " 'Hyatt Regency Reston', 'Glendale Gaslight Inn', 'Super 8',\n", " 'Motel 6', 'Country Inn Walker', 'Mt Gardner Inn',\n", " 'Hotel De La Ville', 'Econo Lodge St Robert',\n", " 'La Quinta Inn-houston', 'Best Western Plus',\n", " 'La Quinta Inn & Suites Auburn',\n", " 'The Citizen Hotel, Autograph Collection', 'Super 8 Ithaca',\n", " 'Big Mountain Lodge',\n", " 'Holiday Inn Express Atlanta Ne - I-85 Clairmont',\n", " 'Springhill Suites Columbia', 'Sportsmen Motel',\n", " 'North Country Inn B & B', 'Microtel of Ste Genevieve',\n", " 'Days Inn Barstow', 'Unionport Lodge No 333 F A M',\n", " 'Doubletree By Hilton Hotel Bay City - Riverfront',\n", " 'Hilton Garden Inn Burlington Downtown',\n", " 'Doubletree By Hilton West Palm Beach Airport',\n", " 'Courtyard Hattiesburg', 'Janmere Motel', 'Skidway Lake Motel',\n", " 'El Cortez', 'Enchanted Castle Hotel',\n", " 'Extended Stay America - Chicago - Westmont - Oak Brook',\n", " 'Extended Stay America', 'Econo Lodge', 'Hometown Inn',\n", " 'Days Inn Brookings', 'Pheasant Manor', 'Spirit Tree Inn B & B',\n", " 'Durango Travelodge', 'Americinn Lodge and Suites',\n", " 'Residence Inn Billings',\n", " 'Best Western Plus Arlington North Hotel and Suites',\n", " 'Knights Inn', 'La Quinta Inn and Suites Tucson - Reid Park',\n", " 'Staybridge Suites Tyler University Area',\n", " 'Country Inn and Suites By Carlson Corbin',\n", " 'Best Western Owasso Inn & Suites', 'Truckee Tahoe Htl Larkspur',\n", " 
'Wyndham Resort At Fairfield Mountains', 'Quality Inn Spearfish',\n", " 'The White House Inn', 'Inn At Queen Anne', 'Comfort Inn',\n", " 'Budget Inn South',\n", " 'Residence Inn By Marriott Irvine John Wayne Airport',\n", " 'Blue Top Inn', 'Days Inn Warren', 'Budget Host Inn',\n", " 'Howard Johnson Gallup', 'Desert Sands Motel',\n", " 'Davison St Guest House', 'Travelodge', 'Parkway Inn Jellico',\n", " 'Days Inn & Suites Vicksburg', 'Chippewa Hotel',\n", " 'Martin Mason Hotel', \"Comfort Inn and Suites O'fallon\",\n", " 'La Quinta Inn & Suites Dublin',\n", " 'Sheraton Mission Valley San Diego Hotel', 'The Bluffs Inn Suites',\n", " 'Astro Motel', 'Best Western Luxury Inn',\n", " 'Extended Stay America San Diego - Carlsbad Village By The Sea',\n", " 'Seaside Oceanfront Inn & Restaurant', 'Lakeview Lodge',\n", " 'Extended Stay America - Los Angeles - Ontario Airport',\n", " 'Days Inn Marion', 'Protection Motel', 'Town Country Motel',\n", " 'Ramada Inn', 'Holiday Inn Canyon De Chelly', 'Lake Motel',\n", " 'Arcola Inn', 'Landmark Inn Lakes-mountain Region', 'Haltom Inn',\n", " 'Noyo Harbor Inn', 'Candlewood Suites West Springfield',\n", " \"Alyssa's Motel\", 'Holiday Inn Express & Suites Portland',\n", " 'Royal Inn', 'Columbia Gorge Riverside Lodge', 'Cypress Suites',\n", " 'Best Western Burlington Inn', 'Eldorado Suites Hotel',\n", " 'Bent Elbow', 'Penzion Accom', 'La Quinta Inn and Suites Sunrise',\n", " 'Americana Resort Properties', 'Knights Inn Aiken',\n", " 'Inroads Ireland Tours', 'Mansfield Plantation Inc',\n", " 'Holiday Inn Express Pinetop',\n", " 'Holiday Inn Express Howe (sturgis, Mi)',\n", " 'Deluxe Inn Merrillville', 'Super 8 Pittsburgh/monroeville',\n", " 'La Quinta Inn', 'Townplace Suites By Marriott', 'Cadillac Motel',\n", " 'Hyatt Regency Kathmandu', 'Mainsail Motel & Cottages',\n", " 'Fairfield Inn & Suites Peoria East',\n", " 'Holiday Inn Express and Suites Canyonville', 'Solstice',\n", " 'Country Inns Suites', 'Dead Broke Inn',\n", " 'Hampton Inn & 
Suites Crescent City', 'The Grove Seaside Hotel',\n", " 'Savaii Roberts Motels', 'The Alexandrian, Autograph Collection',\n", " 'Hotel Monaco Chicago, A Kimpton Hotel', 'Rips Country Inn',\n", " 'Holiday Inn Express Gatesville',\n", " 'Hilton Garden Inn Kauai Wailua Bay',\n", " 'Holiday Inn Express Hotel and Suites Memphis Southwind',\n", " 'Clarion', 'Mountain Lodge At Telluride - A Noble House Resort',\n", " 'Hampton Inn New Orleans - Downtown',\n", " 'Baymont Inn and Suites Enid', 'Quality Inn & Suites',\n", " 'Super 8 Carlisle-south', 'Americinn Coralville',\n", " 'Travelodge Shakopee', 'Hampton Inn Fayetteville Fort Bragg',\n", " 'Four Points-kansas', \"Cliff's Motor Inn\",\n", " 'Days Inn & Suites Castle Rock', 'Candlewood Suites Olathe',\n", " 'Holiday Inn Express', 'Super 8 Alamosa',\n", " \"The Miner's Inn Motel Restaurant\",\n", " 'Extended Stay America - Orlando Theme Parks - Vineland Rd.',\n", " 'White Cliff Manor Bed and Breakfast',\n", " 'Fiesta Inn Centro Historico', 'Pine Needles Golf Course',\n", " 'Days Inn Bloomington', 'Fairfield Inn/suites-marriott',\n", " 'Holiday Inn Express Hotel & Suites Hillview',\n", " 'Marquesa Hotel & Cafe Marquesa', 'Best Western',\n", " 'Mandarin Oriental Jakarta', 'Barber Joyce',\n", " 'Sunset Inn-yosemite Cabins', 'Ramada Vandalia',\n", " 'Holiday Inn Express & Suites Weslaco', 'Super 8 Elko Nv',\n", " 'Hotel Borgo Verde', 'Vista Hotel On Lake Tarpon',\n", " 'Miramar Boutique Hotel',\n", " 'Best Western Plus French Quarter Landmark Hotel',\n", " 'Red Carpet Inn', 'Adria Motor Inn', 'Quality Inn and Suites',\n", " 'Village Lodge', 'Super 8 Manhattan Ks', 'Olde Bridge Inn',\n", " 'Raintree Inn', 'Garden Bed and Breakfast', 'Alpine Motel',\n", " 'Wine Valley Lodge', 'Hilton Garden Inn Austin Nw - Arboretum',\n", " 'The Governor Hotel', 'Pullman Rail Journeys',\n", " 'Motor Inns of America', 'Profile Deluxe Motel',\n", " 'American Star Inn and Suites Atlantic City',\n", " 'Meadow Farm Bed and Breakfast', 'Days Inn 
Kuttawa',\n", " 'Hotel Relais De Margaux Golf and Spa',\n", " 'Hyatt Place San Antonio Airport - Quarry Market', 'Discovery Inn',\n", " 'Holiday Inn Lumberton North - I-95',\n", " 'Old Saco Inn Bed & Breakfast', 'Hotel Millersburg',\n", " 'Springhill Suites', 'Stratford Inn', 'Comfort Inn Livermore',\n", " 'Body Tuneup', 'Adobe Nido Bed & Breakfast',\n", " 'Tulip Inn Turin West', 'Hotel Portaventura', 'Relax Inn',\n", " 'Hotel Olcott', 'Radisson Hotel Hauppauge-long Island',\n", " 'Quality Inn & Suites Hanes Mall', 'Robins Roost Cabins',\n", " 'Hampton Inn', 'Candlewood Suites Huntersville',\n", " 'Super 8 Longmont / Del Camino', 'Holiday Inn Express Dahlonega',\n", " 'Briarcliff', 'Lake Hill Cabins', 'Warwick Denver',\n", " 'Econo Lodge Inn & Suites', 'Falls Motel',\n", " 'Holiday Inn Express Hotel and Stes Port Clinton-catawba Island',\n", " 'Berkshire By The Sea A Vri Resort', 'Days Inn Bangor Airport',\n", " 'Fireline Hotel', 'Brooks Donald L Jr', 'Days Inn Geneva',\n", " 'Fh Hotel Villa Fiesole', 'Clarion Inn', 'Porto Vista Hotel',\n", " 'The Litchfield Inn', \"Sam's Town Hotel & Gmblng Hall\",\n", " 'Hotel Deca - A Noble House Hotel',\n", " 'Boiling Springs Resort Canoe Rental', 'Advance Motel',\n", " 'Edgewater Inn & Cottages', 'Hilton Princess San Pedro Sula',\n", " 'Pelican Shores Inn', 'Hyatt Place Utica', 'Hotel Roc Lago Rojo',\n", " 'Amisos Hotel', 'Red Banks Motel', 'Hotel Guadalmedina',\n", " 'Intercontinental Hotels Resorts', 'Greektown Casino',\n", " 'The Kinney - Venice Beach', 'Scenic View Motel',\n", " 'Holiday Inn Rutland-killington Area',\n", " 'Plaza Hotel and Casino - Las Vegas', 'Monarch of Rancho Mirag',\n", " 'Seiling Motel', 'Quality Inn Johnson City', 'Fort Conde Inn',\n", " 'Regency Inn Motel', 'Super 8 Dallas South',\n", " 'Baymont Inn & Suites Griffin',\n", " 'Holiday Inn Express - Harrisburg East',\n", " 'Kilauea Lodge Restaurant', 'Dallas/fort Worth Marriott Solana',\n", " 'Old Wheeler Hotel', 'The Chestnut Boutique Hotel',\n", " 
'Red Fox Motel', 'The Inn On Negley',\n", " 'Wyndham Vacation Resorts Towers On The Grove',\n", " \"America's Best Value Inn\", 'Super 8 Kingston',\n", " 'Leakey Springs Cabins', 'Hotel Mc Call',\n", " 'Super 8 Worthington Minnesota', 'Quality Inn Near Six Flags',\n", " 'Americinn Lodge Suites Austin',\n", " 'Holiday Inn Spearfish-convention Center', 'Mar Mar Resort Tackle',\n", " 'Cambria Hotel & Suites', 'Best Western Hotel Goldenmile Milan',\n", " \"Rideout's Lakeside Lodge Cottages\",\n", " 'Days Inn Ruther Glen Kings Dominion Area',\n", " 'Pueblo Bonito Sunset Beach Resort & Spa - All Inclusive',\n", " 'Turf Motel', 'Homewood Suites By Hilton',\n", " 'Rangeland Court Motel & Rv', 'Red Roof Inn St Louis - Troy',\n", " 'Best Western Plus-seaport Inn', 'Hampton Inn Abilene',\n", " 'Aspen Alps', 'Holiday Inn Express Henderson',\n", " 'Country Inn and Suites By Carlson', 'Main Street Bed & Breakfast',\n", " 'Tidewater Inn', 'Uptown Motel', 'Villa Carlotta',\n", " 'Extended Stay America - Fort Lauderdale - Davie',\n", " 'Spruce Meadow Cabins', 'Silver Run Cabins',\n", " 'Jacksonville Plaza Hotel and Suites',\n", " 'Hawthorn Suites Dayton North',\n", " 'Suburban Extended Stay of Memphis Bartlett',\n", " 'Knights Inn Durango Co', 'Homewood Suites - Mall of America',\n", " 'Days Inn', 'Twelve Hotels & Residences',\n", " 'Embassy Suites By Hilton Houston Downtown', 'Super 8 Cloquet',\n", " 'Extended Stay America - Rockford - I-90', 'Bailey Hotel',\n", " 'Red Rest Inn', 'Colonial Inns of Ontario',\n", " 'Hotel Silken Siete Coronas', 'Corey Motel', 'Cherry Orchard Inn',\n", " 'Hotel Vorbach', 'Eden Park Guest House', 'Lakeway Resort & Spa',\n", " 'Knights Inn Amarillo Airport',\n", " 'La Quinta Inn and Suites Nashville Franklin', 'Close For You',\n", " 'Blue Jay Motel', 'Chelsea Inn', 'Whiteface Chalet',\n", " 'Homewood Suites', 'Super 8 Motel Fairmont', 'Great Basin Inn',\n", " 'Comfort Inn - Springfield', 'Stirling City Hotel',\n", " 'Sombrero Resort and Marina', 'Key 
West Inn - Clanton',\n", " 'Days Inn West Memphis', 'Worldwide Hospitality Supply Company',\n", " 'Plantation Inn', 'Comfort Suites South',\n", " 'Marriott Hotels Resorts Suites', 'Sybaris Pool Suites',\n", " \"Miss Kitty's Boarding House\", 'Sheraton Offenbach Hotel',\n", " 'Extended Stay America - Raleigh - Cary - Regency Parkway S',\n", " 'Suburban Extended Stay Warner Robins', 'Jvd Hotels',\n", " 'Holiday Inn-bayside', 'Pavilion Lodge', 'Ritz Hotel',\n", " 'Arrowhead Motel and Rv Park', 'Parkside Inn At Incline',\n", " 'Saddleback Motor Inn', 'Sherwood Hills Resort',\n", " 'Holiday Inn Express Hotel and Suites Raleigh-wakefield', 'Arion',\n", " 'Una Hotel Forte Dei Marmi', 'Days Inn Newton',\n", " \"A Swallow's Nest Motel\", 'Canyon Gate Motel', 'Cascabel',\n", " 'Hampton Inn & Suites Fort Worth-west-i-30',\n", " 'Fireside Inn Santa Cruz', 'Mandarin Oriental Hotel Group',\n", " 'Bellaire Motel Lodge', 'Palomar Washington Dc, A Kimpton Hotel',\n", " 'Bay Shores Yachttennisclub 514 2 Br Condo By Redawning',\n", " 'Hilton Santo Domingo', 'Atlantic House', 'Frontier Cabins Motel',\n", " 'Samui Cliff View Resort & Spa', 'Country Inn & Suites By Carlson',\n", " 'Hampton Inn-st Robert', 'Best Western Holiday Hills',\n", " 'Tiffany House Bed & Breakfast', 'Progress Management Co',\n", " 'Norwood Inn and Suites', 'Howard Johnson Inn - Newburgh',\n", " 'Holiday Inn Express Colton-riverside North', 'Sutton Bay Resort',\n", " 'La Quinta Inn Calhoun', 'Colonial Motel', 'Fairfield Inn Saginaw',\n", " 'Extended Stay America Philadelphia - Exton',\n", " 'Saco River Recreational Council', 'Ihg', 'Red Roof Inn Somerset',\n", " 'Wallowa Lake Vacation Rentals', 'Hotel Casena Dei Colli',\n", " 'Chalet Leon At Hector Falls',\n", " 'Fairfield Inn Suites Chattanooga South/east Ridge',\n", " 'Midvalley Motel', 'Ubaa Old Crawford Inn',\n", " 'Holiday Inn Express Hotel Suites Sedalia',\n", " 'Hampton Inn & Suites Syracuse/carrier Circle',\n", " 'Quality Inn and Suites 
Eugene-springfield',\n", " 'Four Points By Sheraton Memphis Southwind',\n", " 'Americinn Lodge Suites Princeton', 'Juniper Lane Guest House',\n", " 'Bosselmans Pump Pantry Motel',\n", " \"Harrah's Laughlin Hotel and Casino\",\n", " 'Americas Best Value Inn and Suites', 'Masters Inn',\n", " 'The Westin Europa and Regina', 'Super 8 Opelousas',\n", " 'Melia Paris Champs-elys��es', 'Sci�� On Martin',\n", " 'Springhill Suites By Marriott South Bend/mishawaka',\n", " 'Inn At The River',\n", " 'Country Inn and Suites By Carlson Charlotte University Place',\n", " 'Holiday Inn Express Eagle',\n", " 'Sir Walter Raleigh Inns of Greenbelt', 'Gardena Terrace Inn',\n", " 'Quality Suites Intercontinental Airport West', '1785 Inn',\n", " 'Best Western Knoxville Suites', 'The Jayakarta Bali',\n", " 'Holiday Inn Express Grove City (outlet Center)', 'Hotel Aura Sfo',\n", " 'Hampton Inn Bloomington West',\n", " 'Quality Inn & Suites Historic St. Charles',\n", " 'Best Western Plus San Marcos Inn', 'Budget Inn-santa Maria',\n", " 'Equestrian Estates Horse Farm Bed and Breakfast',\n", " 'Comfort Inn Deland - Near University', 'Boardroom Motel',\n", " 'Carleton Hotel', 'Wisconsin-aire Motel', 'High Desert Motel',\n", " 'Best Western of Long Beach', 'Days Inn Berea Ky',\n", " 'East Side Motel Cabins', 'Abbeville Inn',\n", " 'Comfort Suites Mount Vernon',\n", " 'Holiday Inn Express & Suites Phoenix Downtown - Ballpark',\n", " 'Holiday Inn Express Hotel Suites Cookeville', 'Fairbridge Inn',\n", " 'Four Seasons Country Inn', 'Gooding Hotel Bed Breakfast',\n", " 'Grand Hotel Cadenabbia', 'Pillar Hotels Resorts',\n", " 'Hotel An Der Philharmonie', 'Microtel Inn',\n", " 'Crestview Condominiums',\n", " 'Comfort Hotel Nation Pere Lachaise Paris 11', 'Cedar Crest Inn',\n", " 'Spring Fountain Motel', 'Innisbrook', 'Cougar Crest Lodge',\n", " 'Springhill Suites By Marriott Sarasota Bradenton',\n", " 'Fairfield Inn and Suites By Marriott Plainville',\n", " 'Holiday Inn Express Hotel & Suites 
Chicago-deerfield/lincolnshire',\n", " 'Camelback Resort Aquatopia Indoor Waterpark',\n", " \"Marriott's Mountainside At Park City\",\n", " 'Fairfield Inn & Suites Atlanta Perimeter Center',\n", " 'Hampton Inn Jackson Hole', 'Shoshone Lodge', 'Magton Inc',\n", " 'Quality Inn & Suites - Riverfront',\n", " 'Super 8 Schenect/albany Area', 'Intown Suites El Paso',\n", " 'Extended Stay America - Columbia - Northwest Harbison',\n", " 'Hilton San Diego Airport/harbor Island',\n", " 'Candlewood Suites Oklahoma City-moore',\n", " 'Holiday Inn Express & Suites Bay City', 'Rodeway Inn-tacoma',\n", " 'Western Inn-glacier Park', 'Americinn Lodge & Suites Appleton',\n", " 'Hampton Inn Sarasota - I-75 Bee Ridge', 'Amerihost Inn',\n", " 'Country Inn and Suites By Carlson Galena', 'Days Inn Suites',\n", " 'Hampton Inn Roanoke/salem', 'School House Motel', '1900 House',\n", " 'Excellence Riviera Cancun - Adults Only - All Inclusive',\n", " 'Hyatt Centric Arlington', 'Days Inn Bowling Green',\n", " 'Hotel Metropole', 'Inn & Suites', 'Anglers Inn',\n", " 'Super 8 Crete Ne', 'H��tel Marinca and Spa',\n", " 'Hyatt Place Pittsburgh Cranberry', 'Four Seasons Hotel St. 
Louis',\n", " 'El Dorado Seaside Suites By Karisma - All Inclusive',\n", " 'Courtyard San Marcos', 'Fairfield Inn Suites Spearfish',\n", " 'Best Western Hospitality Hotel and Suites',\n", " 'Hotel Adler Cavalieri', 'Royal Inn Motel', 'Ambiance',\n", " 'Rodeway Inn Bushnell', 'Microtel Inn By Wyndham Knoxville',\n", " 'Candlewood', 'Menehune Reservations',\n", " 'Staybridge Suites Chicago - Glenview', 'Riverside Lodge',\n", " 'Patalya Thermal Resort', 'H��tel Les Bruy��res',\n", " 'Comfort Inn Birmingham - Irondale', 'Super 8 Madison',\n", " 'Comfort Inn & Suites', 'Concord Apartments By Boq Lodging',\n", " 'Holiday Inn Express & Suites West Monroe',\n", " 'Double Eagle Hotel and Casino', 'Rainbow Motel',\n", " 'Country Inn & Suites By Carlson, Rocky Mount, Nc',\n", " 'Ip Casino Resort Spa', 'La Quinta Inn & Suites Bryant',\n", " 'Travelodge Anaheim Convention Center',\n", " 'Hampton Inn Tucson-airport', 'Beacon Motel', 'Super 8 Sallisaw',\n", " 'Wilshire Inn Motel', 'Palm Suites',\n", " 'Hampton Inn & Suites-downtown-tutwiler', 'Narcis',\n", " 'Econo Lodge Big Spring',\n", " 'La Quinta Inn and Suites Miami Cutler Bay',\n", " 'Candlewood Suites Fort Smith', 'Courtyard Burlington Harbor',\n", " 'Terrace Inns Suites', 'Rapid City Days Inn', 'Foxburg Inn',\n", " 'Aspen Haus Bed and Breakfast', \"Fort's Cedar View\",\n", " 'Best Western Eufaula Inn', 'Terry Peak Ski Area',\n", " 'Super 8 - Effingham', 'Best Western Plus Kelly Inn',\n", " 'Days Inn Fort Wayne', 'Courtyard Columbus Worthington',\n", " 'Super 8 Bradenton Sarasota Area', 'Chalfant House',\n", " 'Hotel Corpus Christi', 'Sleep Inn', 'Bay Haven Inn Bed Breakfast',\n", " 'Hampton Inn & Suites Millington',\n", " 'Holiday Inn Express Suites Woodland Hills',\n", " 'Best Western Plus Humboldt House Inn',\n", " 'Red Lion Anaheim Maingate Hotel', \"Albert's Motel\", 'Octagon Inn',\n", " 'Budget Inn', 'Towneplace Suites', 'Hitching Horse Inn',\n", " 'Homewood Suites By Hilton Indpls Airport / Plainfield In',\n", " 
'Kit Carson Lodge Restaurant', 'Watermark Bed Breakfast',\n", " 'Super 8 - Upland', 'Bailey House Bed & Breakfast',\n", " 'Microtel Inn Suites By Wyndham San Antonio By Seaworld',\n", " 'Comfort Hotel Bernau', 'Miami Executive Hotel',\n", " 'Extended Stay America Princeton - West Windsor',\n", " 'Mercure Curitiba Golden Hotel', 'Sheraton Baltimore North Hotels',\n", " 'Sids Resort', 'Hampton Inn & Suites Douglas',\n", " 'Comfort Inn Humboldt Bay', 'Super 8 Big Cabin Vinita Ok',\n", " 'Radisson Blu Conference and Airport Hotel',\n", " 'Days Inn North Columbia Ft. Jackson', 'Campanile Lyon Ecully',\n", " 'La Brea Hotel', 'Microtel Inn By Wyndham Southern Pines',\n", " 'Homewood Suites Dallas-market Center', 'Websters Manor',\n", " 'Holiday Inn Express & Suites Lawrence', 'Bethesda Gardens',\n", " 'Homestead Studio Suites', 'Bayside Resort Hotel',\n", " 'Super 8 Batesville Ar', 'Gateway Studios', 'Sunset Inn',\n", " 'Simpson House Inn', 'Longville Inn',\n", " 'A Bed & Breakfast In Cambridge', 'Clatskanie River Inn',\n", " 'Jellico Days Inn North Tennessee',\n", " 'Mountaintop Lodge Bed Breakfast', 'Inn At Mendenhall',\n", " 'Hampton Inn Waco', 'Roy-el Motel', 'Comfort Inn and Suites Bend',\n", " 'Eaglecrest Ski Area', 'Magnuson Hotel Summerton',\n", " 'La Quinta Inn and Suites Hopkinsville', 'Lindy Motel',\n", " 'Lighthouse Motel', 'Cal Neva Resort', 'Park Terrace Suites',\n", " 'Fairfield Inn & Suites Des Moines Airport',\n", " 'Super 8 Blackwell Ok', 'Sand Dunes Motel', 'Nantahala Cabins Inc',\n", " 'Holiday Inn', 'Holiday Inn & Suites Green Bay Stadium',\n", " 'Cliffrose Lodge Gardens',\n", " 'The Ritz-carlton Orlando, Grande Lakes', 'Super 8 Belle Fourche',\n", " 'Merritt House Inn', 'Comfort Suites Shreveport', 'Budget Host',\n", " 'Holiday Inn Express Hotel & Suites Bloomington-normal',\n", " 'Knights Inn - Wilmington', 'Pizza Hut', 'Comfort Inn Montgomery',\n", " 'Spinners Tailspin Inn', 'Triangle Motel',\n", " 'Residence Inn By Marriott Hartford Downtown',\n", 
" 'Great American Inn Suites', 'Hunting Lodge', 'Keyser Inn Inc',\n", " 'Patriots Inn', 'Super 8 Indianapolis',\n", " 'Holiday Inn Express Lubbock South', 'Stay Inn', 'Southside Motel',\n", " 'Residence Inn By Marriott Springdale', 'La Playa',\n", " 'Wingate By Wyndham Lagrange', 'Bear Cove Inn',\n", " 'Hyatt House Colorado Springs', 'Antlers Inn',\n", " 'Marylander Hotel Condo', 'Drury Inn & Suites Sikeston',\n", " 'Garden of The Gods Club & Resort',\n", " 'Sands Central Inn Hot Springs', 'Hamton Inn New Orleans Westbank',\n", " 'Holiday Inn Manhattan 6th Ave - Chelsea', 'Vacation Side Travel',\n", " 'Holiday Inn Express - Hillsboro', 'Sky Vue Motel',\n", " 'Blue Boar Inn', 'Hampton Inn Ft Chiswell',\n", " \"Fitzgerald's Restaurant\", 'Super 8 Fort Collins',\n", " 'Inter-hotel Orl��ans Nord', 'Best Western Rama Inn & Suites',\n", " 'Clarion Inn Strasburg - Lancaster', 'Red Roof Inn Erie',\n", " 'Holiday Inn Express & Suites South Portland',\n", " 'The Parkview Memphis', 'Club Quarters, Rockefeller Center',\n", " 'Hampton Inn Dublin', 'Agate Beach Motel', 'Newark Budget Inn',\n", " 'Knights Inn Eau Claire', 'Laurel Manor Motel',\n", " 'Hampton Inn and Suites Annapolis', 'Riverside Motel and Cabins',\n", " 'Mineola Motel', 'Towneplace Suites Albany University Area',\n", " 'Monterey Beach Dunes Inn',\n", " 'Drury Inn & Suites San Antonio Northwest Medical Center',\n", " 'H��tel Sezz Paris', 'Hudson Hotel - Book Direct',\n", " 'Super 8 Kansas City Airport', 'Best Western Hotel De Neuville',\n", " 'Mccamly Plaza Hotel', 'Wingate By Wyndham Pueblo',\n", " 'Days Inn Lincolnton', 'Hotel Roc Flamingo', 'Lexington Inn',\n", " 'Nippersink Country Club, Inc.', 'Sterling Motel',\n", " 'Campus Inn & Suites Eugene Downtown', 'Days Inn Branson Mo',\n", " 'Mt. 
Washington Bed and Breakfast', 'Super 8 Metropolis',\n", " 'Melody Lodge Cabins', \"Sand's Motel\", 'Travelodge Ruther Glen',\n", " 'Texan Inn', 'Hotel Garibaldi',\n", " 'Lake Raystown Resort Lodge & Conference Center', 'Central House',\n", " 'The Concorde Inn', 'Economy Motel',\n", " 'Hampton Inn Virginia Beach Oceanfront North', 'Irish House Hotel',\n", " 'Clubhouse At River Country Est', 'Sleep Inn At Harbour View',\n", " 'Hotel Lavonia', 'Courtyard By Marriott Rockaway Mount Arlington',\n", " 'Fiesta Inn and Suites', 'Hilton Garden Inn Oconomowoc',\n", " 'P K Motel', 'Candlewood Suites Indianapolis Northwest',\n", " 'Holiday Inn Fond Du Lac', 'Arizona Inn of Prescott Valley',\n", " 'Koehne Dexter Terrie',\n", " 'Microtel Inn and Suites By Wyndham Burlington',\n", " 'The Inn At Bella Vista', 'Brasstown Valley Golf Club',\n", " 'Quality Inn Long Beach Airport', 'Calloway Inn',\n", " 'Grandison Bed Breakfast', 'Days Inn Tallulah',\n", " 'Twin Gables of Woodstock', 'Happy Tails Hotel & Playland',\n", " 'Baymont Inn and Suites Boone',\n", " 'Springhill Suites Marriott Colorado Springs South',\n", " 'Brightwood Inn Country Inn', 'Motel 6 Fort Bragg',\n", " 'Westernaire Motel', 'Super 8 Columbia East',\n", " 'Holiday Inn Express Hotel and Suites Va Beach Oceanfront',\n", " 'Hotel Valencia Santana Row', 'New York Marriott Marquis',\n", " 'Holiday Inn Express & Suites Willows',\n", " 'Hampton Inn Grand Junction Downtown/historic Main Street',\n", " 'Holiday Inn Express Suites Floresville', 'Villager Inn Motel',\n", " 'Lamothe House', 'Dor-shada Resort By The Sea',\n", " 'Hi-way Inn of Kiowa', 'Sleep Inn Slidell',\n", " 'Knights Inn New Castle/wilmington',\n", " 'La Posada Lodge & Casitas, An Ascend Hotel Collection Member',\n", " 'Comfort Inn Huntingdon', 'Mericana Motel',\n", " 'Hilton Americas-houston', 'Casino Queen Rv Park',\n", " 'Quality Inn and Suites Irvine Spectrum',\n", " 'Marriott Springhill Marina', 'Hampton Inn Suites Columbus',\n", " 'Milliken Creek Inn', 
'Intown Suites Nashville North',\n", " 'The Desmond House Bed & Breakfast', 'The Booker-lewis',\n", " 'Shamrock Hill Inn', 'Econo Lodge Bellmawr',\n", " 'Crossland Economy Studios - Lake Charles - Sulphur',\n", " 'Hotel Columbia', 'Raton Pass Inn', 'Sumner Motor Inn',\n", " 'Days Inn-amarillo-medical Ctr', 'Best Western Silicon Valley Inn',\n", " 'Days Inn Lanham Washington Dc', 'Cliffs 7305 By Redawning',\n", " 'La Quinta Inn Auburn Worcester', 'Dockers Inn', 'Spring Bay Inn',\n", " 'Candlewood Suites Eugene Springfield', 'Anaheim Marriott Suites',\n", " 'Monarch Inn', 'Yakima Inn', 'Homeplace Inn and Suites',\n", " 'Innpoints Worldwide',\n", " 'Wingate By Wyndham Chantilly / Dulles Airport',\n", " 'Days Inn and Suites Albany', 'Holiday Inn Express San Clemente',\n", " 'The Westin Buckhead',\n", " 'Hyatt Place Atlanta/alpharetta/north Point Mall', 'Eldorado Inn',\n", " 'Americas Best Value Inn - Medical Center/airport', 'Outside Inn',\n", " 'Point Randall Resort', 'Courtyard By Marriott Downtown Boise',\n", " 'The Abbey Resort', 'Crossroads Hotel', 'Helios Resort',\n", " 'Best Western Plus Circle Inn',\n", " 'Fairfield Inn and Suites By Marriott Idaho Falls',\n", " 'Greenstay Hotel and Suites', 'Pine Shadows Motel',\n", " \"Beach Cove 411 Tower A Sierra's 1 Bedroom Condo By Prista Management\",\n", " 'Residence Inn By Marriott Fort Lauderdale Weston',\n", " 'Petretti Apartments',\n", " 'Extended Stay America - Bloomington - Normal',\n", " '40 Berkeley Hostel', 'La Quinta Inn & Suites Chicago Tinley Park',\n", " 'Welcome Inn Apartments', 'Candlewood Suites Lexington',\n", " 'Quinta Real Acapulco', 'Forest Hill Inn',\n", " 'Clarion Suites Philadelphia', \"Sportsmen's Lodge\",\n", " 'Port-o-call Motel',\n", " 'Drury Inn and Suites Columbus Convention Center',\n", " 'Avalon Hotel Group', 'Elba Sara Beach & Golf Resort',\n", " 'Good Nite Inn Rohnert Park', 'The Merritt Center and Lodge',\n", " 'Rustic Inn', 'Liberty Lodge', 'Comfort Suites Fort Pierce',\n", " 'Twin 
Pines Motel', 'Best Western Hartford Hotel & Suites',\n", " 'Courtyard By Marriott', 'La Quinta Inn and Suites Meridian',\n", " 'Residence Inn By Marriott Tucson Williams Centre',\n", " 'Hampton Inn Rockford', 'Red Roof Inn Cedar Rapids',\n", " 'Lewis River Inn', 'Tmc Resort Rentals',\n", " 'Homewood Suites By Hilton Albuquerque - Journal Center',\n", " 'Desert Motel Restaurant', 'Hyatt Dulles', 'West Side Motel',\n", " 'Casa Del Mar Inn Bandb',\n", " 'Holiday Inn Express and Suites Gahanna/columbus Airport E',\n", " 'Rodeway Inn Near Venice Beach', 'Citrus Hills Lodge Hernando',\n", " 'Econo Lodge Miles City', 'Atlanta Marriott Northwest At Galleria',\n", " 'Ibis Wuerzburg City', 'Hotel Eug��ne En Ville',\n", " \"Super 8 Chicago O'hare Airport\", 'Comfort Inn and Suites',\n", " 'Pine Motel', 'Nesco Manor Hotel', 'Busy B Ranch',\n", " 'Best Western University Inn & Suites', 'Rodeway Inn Airport',\n", " 'Starwood Resorts Hotel', 'City Express Irapuato',\n", " 'Days Inn Statesville', 'The Lake Point Conference Center',\n", " 'Super 8 Gretna', 'Royal Dutch Inn', 'Sea View Motel',\n", " 'Castle Kona Reef', 'Brookside Motel', 'Acorn Motor Inn',\n", " 'Torian Plum By Wyndham Vacation Rentals', 'The Savoy Hotel',\n", " 'Holiday Inn Express & Suites Crossville',\n", " 'Holiday Inn Express Hotel and Suites Hesperia',\n", " 'Best Western Saint-etienne Aeroport',\n", " 'Mission Sands Vacation Rentals', 'River Oaks Golf Villas',\n", " 'Holiday Inn Victorville', 'Quality Inn and Suites Big Rapids',\n", " 'Residence Inn Burlington Colchester', 'Wakonda Hotel & Bar',\n", " 'Inturotel Esmeralda Park', 'Knights Inn Carmel Hill',\n", " 'Five Seasuns Bed & Breakfast Inn', 'Summit At Big Sky',\n", " 'Holiday Inn Express Hotel and Suites Cambridge', 'Breakers Hotel',\n", " 'Holiday Inn Express Hotel & Suites Emporia', 'The Dec',\n", " 'Lazy T Motel', 'Cherokee Lodge Bed and Breakfast',\n", " 'Beach Haven Vacation Rental House', 'Sonoma Coast Villa Spa',\n", " 'Ambassador Inn 
Albuquerque', 'Quality Inn Gulfport',\n", " 'Super 8 Van Horn', 'Residence Inn By Marriott Deptford',\n", " 'Rock A Bye Inn',\n", " 'Holiday Inn Express Hotel and Suites Meadowlands Area',\n", " 'Sky-lit Motel', \"Simoni's Fremont Inn\", 'Elk Springs Resort',\n", " 'Extended Stay America Grand Rapids - Kentwood'], dtype=object)" ] }, "metadata": {}, "execution_count": 9 } ] }, { "cell_type": "code", "source": [ "# see the unique values in the rating column\n", "data[\"reviews.rating\"].unique()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "fYsFlry9R97A", "outputId": "3782f0f6-be8d-40cf-e201-995875a927d5" }, "execution_count": 29, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "array([4. , 5. , 3. , 1. , 2. , 0. , 4.1 , 4.9 , 4.8 , 3.4 , 2.4 ,\n", " 3.1 , 3.2 , 3.3 , 4.15, 4.4 , 4.6 , 3.75, 3.95, 3.55, 3.8 , 2.9 ,\n", " 3.35, 3.15, 4.2 , 4.5 , 3.9 , 1.3 , 4.3 , 4.7 , 2.8 , 1.5 , 3.7 ,\n", " 2.7 , 2.5 , 3.5 , 4.75])" ] }, "metadata": {}, "execution_count": 29 } ] }, { "cell_type": "code", "source": [ "# fill missing (null) hotel ratings with 0\n", "data['reviews.rating']=data['reviews.rating'].fillna(0)" ], "metadata": { "id": "30mgPjRvTr14" }, "execution_count": 11, "outputs": [] }, { "cell_type": "code", "source": [ "# rescale ratings above 5 (presumably given on a 10-point scale) onto the 5-point scale: x -> (x / 10) * 5\n", "# done with a boolean mask instead of a row loop, so it does not rely on the index labels being 0..len(data)-1\n", "above_five = data['reviews.rating'] > 5\n", "data.loc[above_five, 'reviews.rating'] = (data.loc[above_five, 'reviews.rating'] / 10) * 5" ], "metadata": { "id": "fUa0csNRT7NJ" }, "execution_count": 12, "outputs": [] }, { "cell_type": "code", "source": [ "# see the number of reviews for each rating number\n", "ratings = data[\"reviews.rating\"].value_counts()\n", "numbers = ratings.index\n", "quantity = ratings.values\n", "ratings" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "ssVh-6k-qmLD", "outputId":
"356fb62c-5e00-471f-c0f9-115a9da17085" }, "execution_count": 13, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "5.00 12772\n", "4.00 9755\n", "3.00 5709\n", "1.00 3068\n", "2.00 2979\n", "0.00 1199\n", "4.80 78\n", "4.60 56\n", "4.40 30\n", "4.30 26\n", "4.15 25\n", "3.75 24\n", "3.95 24\n", "4.20 22\n", "3.40 17\n", "4.10 14\n", "3.15 14\n", "4.50 13\n", "3.55 13\n", "3.35 12\n", "2.70 9\n", "3.10 7\n", "2.90 7\n", "4.70 6\n", "3.30 6\n", "4.90 6\n", "2.40 4\n", "3.80 3\n", "2.50 3\n", "3.20 2\n", "3.90 2\n", "3.70 2\n", "1.30 1\n", "2.80 1\n", "1.50 1\n", "3.50 1\n", "4.75 1\n", "Name: reviews.rating, dtype: int64" ] }, "metadata": {}, "execution_count": 13 } ] }, { "cell_type": "code", "source": [ "# round ratings to whole numbers and list the counts in the order 5, 4, 3, 2, 1 (the 0 bucket is left out)\n", "# note: round() sends exact halves to the nearest even number, so 4.5 is counted as 4 and 3.5 as 4\n", "ratings=data['reviews.rating'].round(0).value_counts()[[5,4,3,2,1]]\n", "ratings" ], "metadata": { "id": "udysK--Au3Yo", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "ca27afc9-d7b4-4e52-c9c1-caa4ce54a1ab" }, "execution_count": 14, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "5 12919\n", "4 9954\n", "3 5784\n", "2 2987\n", "1 3069\n", "Name: reviews.rating, dtype: int64" ] }, "metadata": {}, "execution_count": 14 } ] }, { "cell_type": "code", "source": [ "# rating values (used as pie labels) and their review counts (used as wedge sizes)\n", "numbers = ratings.index\n", "quantity = ratings.values" ], "metadata": { "id": "ebcAMh2ivv4m" }, "execution_count": 15, "outputs": [] }, { "cell_type": "code", "source": [ "# donut chart of the share of each rounded rating, one colour per rating in the order 5, 4, 3, 2, 1\n", "# per the counts above, 5 is the most common rating and 4-5 together are about two thirds of the rated reviews; 1-2 are under a fifth\n", "custom_colors = [\"tan\", \"beige\", 'silver', \"grey\", \"black\"]\n", "# set the font size before drawing so the wedge labels use it on the first run as well as on re-runs\n", "plt.rc('font', size=12)\n", "plt.figure(figsize=(5, 5))\n", "plt.pie(quantity, labels=numbers, colors=custom_colors)\n", "# a white disc over the centre turns the pie into a donut\n", "central_circle = plt.Circle((0, 0), 0.5, color='white')\n", "fig = plt.gcf()\n",
"fig.gca().add_artist(central_circle)\n", "plt.title(\"Hotel Reviews Ratings\", fontsize=20)\n", "plt.show()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 324 }, "id": "8E6BAJQsqhDN", "outputId": "7853a839-85be-4f05-d35e-30c7a926623a" }, "execution_count": 16, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "iVBORw0KGgoAAAANSUhEUgAAAR4AAAEzCAYAAADn+2w+AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/NK7nSAAAACXBIWXMAAAsTAAALEwEAmpwYAAAxWklEQVR4nO3dd3wc9Z3/8ddnd9XWljvuFYFxQVTTiygpXJSElEuOSyV3KXe5S1WSH1zKkrvLpZ2SHGmXhAuGI5CEVBLlAgFiYYMpbkTghmXkIhvkJtvSSlpp9/v7Y0awXiRZZWe+s7Of5+Oxj5VmZ2feWu1+9vv9ThNjDEop5aeI7QBKqeKjhUcp5TstPEop32nhUUr5TguPUsp3WniUUr7TwpMHInKLiBgRucp2ltESkRvdv+FG21nCQkRWiYjurzKAwBQe900/5D9JRFrc+RaOcV1W3xBZhSr71i0iO0Tkh2P9+4qdiFw1wOvbKyL7RORXInJlntazMh/vx2IUsx2gyDUCq9yfpwLXAB8A/lpELjLGPOdjll8DjwP7fVyn13YBK92f48D5wJuBN4nI3xhj7vV4/e9x16tyaOGxa5Ux5pb+X0QkAvwOeB3wL8D7/ApijDkKHPVrfT5pyX59AUTkJuDLwNcATwuPMWa3l8svZIHpao2ViFwrIn8UkcMi0iMi20XkKyIyMWuehW4Xq8b9PbspvipneXNF5DsistNd3iERuU9ELvDqbzDGZHj5G/oV6xGRuIjcLCKbRKRTRDpEZK2I/G3OfDe4f9M3B1qPiJSJyBER2S8iMXfaoGM8w30tRORD7jI+kDP9fe70pIiU5Tz2hNvNrMia9kYRecjN1+N2kRpF5MNDvX7D9D/u/UIRmZaT5U0icpf73ul0b+tF5KPul0L2vAZ4r/vr81nvo5aseV7Rpc/qBt4iIueISIOItLuvTaOIXDpQaBGZJSK3i0ibiHS574H3Zi8vZ/5T3W77Dnf+wyLSJCL/LSJTR/XK5VEoWjwi8iHg+0AnzrdYG3AV8P+AN4jIZcaYdqAd+CJwI7DA/blfS9byzgMeAKYA9wO/AqYBbwLWiMibjTF/8O4vAqA3+xcRmQQ8DJwLbAB+jPPF8VrgbhFZboz5nDv7b3BaL+8QkU8bY/pyln09MAmoH+CxE4zwtXjIvb8W+FHWYq517yuAS3C7l+6XwvnAamNMlzvtg8APgBdwWn8HgenAWTgtwO8NlXeEenN+/wqQAZ4AWoGJON3f/8L5Inh31rxfxHkNznYfb3entzM8K4DPAGuB24D5wFuBh0TkHGPMtv4ZRWS6O98C4BHgMWAmzmvxQO6CRWQW8BQwAfgD8EugHFjk/g3fAQ4NM6c3jDGBuAHGvd0yxK3dnWdh1vMWAD3AMWBJzjK/587/w5zpq5w/fcAcMWAH0A3U5Dw2G+cNuR8oy5p+i7ueq4b5t/bPf0vO9CjwR/exb+c8ttKd/pmc6eXuczLAOVnTf+DO//oB1t/gPladNe1Gd9qNY3wtduEUfsmatg+nKKWBf8uafr27zs9nTVvv/j+nD5B72jBf36vc5a4a4LHPuY81DfBY1QDTIsAd7nMuGuR/snCQHK94n2VlO+G1dh/7kDv9eznT/8ed/tWc6We7r9UJ7yXgI+60jw2QaRxQMZbPaj5uVlee84KYEdwWZj3vs+60/xhgmZNxClJXzofjFW+IrMf6PwxfH+Txj7mPvy5r2i2MrvCs4uWieiuwxZ3+bPYHD2fguQ94apDlne0+72tZ0y51p92bM+9Md1kbcqbfmPthGOVrcbs77Sz392Xu7/+I8y38WNa8t7qPXZo1bT1Oy3XyGN5L/R/ulqzX92s4LUaD0xq8dATLO8993hdypq/MfT/mPP6K91lWtjUDzF+C0wpblzWtFEjifOlWDvCcHzF44fmgF5/VfNwC19Uyxshgj7n95wU5k89z7x8eYFlHRGQjcCWwBHh6GBEuce8X5
PabXae790txmrFjUePesm3CKWDZA70X4LSGXtGXd5VkZQLAGPOYiGzH6WpONsYccR96p7uslcPIN5rX4mGcInYt8Becrgo4LZ6FwCdFpNIYc9x9rAN4MmuZPwHqgc0i8lOcLX+PGmMODCNvrgVAImfaEeAaY8ym3JndsY9P4wzun4rTOsg2ZxQZBrMud4IxpldEXsT5wux3Bk4XdZ37muVaA7w/Z9p9wH8A3xWR1+J0kR8FNhu3MtkWuMIzChPd+8E2A/dPnzTM5fUPvL3tJPONH+byhvJFY8wt7sDlHOBTwEeBn4vIXxlnsDk70wUMMOg8RKY7gC8BN+CMgYEzINoL3D2MfKN5LbLHeb7p3u81xmwXkYdwxjVqRGQdsBz4g8kaZzLGfENEDgIfxnktPo5TcBuBTxtjXvGBHUKjMeYqABGZgjOG8h3gdyJygTHmhf4Z3TG0p3DGQZ4E7gQO47QOJ+G07k4YGB+j9kGm9+F8MfTrf3+/OMj8r5hujNklIhfitPSuA97iPrRHRP7TGHPriNPmWRi2avW3DGYO8visnPmGu7zrjTEyxO2LQy5lBIwxGWPMHmPMx4BfAK8B/nmATN88Saarcxb9vzhjP+8FEJFzgWqcD/vBYUQb8WthjNkHbAOudLdgXcXLxWgNkAJexcstoYFaqncaYy7GKXy1OGMcVwL3i8gpw8j9CsaYw8aYHwGfBObyykHq9+MUnS8aYy4yxnzYGPM542yO/9lo1pknx9z7GYM8PuB0Y8wWY8zf4LyGK4CbcD7v/yUif5/3lCMUhsKz0b2/KvcB91vsHJzB0S1ZD6Xdx6O5z8HZiQ7ginwFHKE6nAHDL4jIBHfakzgFZESZjDF7cD7YF4nIGby8+feOYS5itK/FQ0AlzrjOJPd3jDFJd5nXcmIXbEDGmHZjzB+MMR/A6RpOwSlAY/HfOGNobxaRy7Kmn+be/3KA5+R2h/ul3fuB3kf5shVnjPIsEakc4PHLh3qyMabPGLPeGPNVoH+3izflN+LIhaHw3IXTdfiIiJyW89i/4WxSvMsY05M1vX9T4vwBlvdboBn4JxF53UArFJFLRMSTPVKNs9PZj3C+qercaW04Yx8rROTzAxVMEakSkUUDLHKle//3OG+8g8DvhxlntK9FfyvmZvf+oZzHzgTeiPN/OGHcTUSuFpGBxvmmu/fJYWYfkDEmzcvjPl/KeqjFvb8qJ8+5vPx35BrqfZQXxpgUTotrIs4WuexsZ+PsHU3O9PMla/+1LP2tozG9hnlhe3S7/4a7xeok87QwwFYEnPEAg9MsvQ1nz9TH3GlbgCk58/dvttyI8+b7HPDurMfPwhkbMjiDct8Fvg78FOeDaICZWfPfQh42p2c9PgvnzXEMdxMyTgFd6z5vO85+PF/Gab086U6/YYBlxXG6TCl3nlsHWeeNDLyJd0SvhfucKTitAQNsyXns8v7/NTlb3NzH24G9OF3O/8QZaO7/+9YBJcN4fa9ikM3p7uPi/u8N8Fp32mycQpLG2Vfpq+59yv1bDbAyZzmvdafvcOf/HPDPWY+vYvCtWoP971tw9rjOnjYDZzeF/i2h/4Gz9bAT51CXE7a4Ad/CaSX9CaeF92Xg5+60buAS65932wGyXqxRFx73sdfg7Ex1BKersgNnE+qkAeaNuv+8nTitpVe8SXG+Yb8CPINTBDqA59wPxLuAWNa8t5DHwuPOU+/OU581rRRn7OcxnGLSA+zGaVF8HJg6yLJu4+UP+/mDzHMjAxSekb4WWc9Z7y7vuznTS9znG+AfB3jeP7gfpp3uug7jFInPMMDm5EH+lv4P96oh5nmDO89TWdOW4WwRanM/1Otxxn4WMkDhcZ/zSZwvt/79aVqyHluV+55mFIXHnT4H50vmAE4B2YTTdf5rd3kfz5r3IpyNCU+7r18XzufhduBMPz/Xg93EDaqUKkAi8iWc4/quM8bcbzvPcGnhUaoAiMhs42wxzJ5WjdP6TQFzjDHdVsKNQ
hj241GqGKwTkR043d1OnJ03a3E2EH2okIoOaItHqYIgIgmczeALcXZVaMfZNeE/jTGrbOUaLS08SinfhWE/HqVUgdHCo5TynRYepZTvtPAopXynhUcp5TstPEop32nhUUr5TguPUsp3WniUUr7TwqOU8p0WHqWU77TwKKV8p4VHKeU7LTxKKd9p4VFK+U4Lj1LKd1p4lFK+08KjlPKdFh6llO+08CilfKeFRynlOy08Sinf6QX9VFETkRbgOJAG+owxK+wmKg5aeJSCq40xB22HKCba1VJK+U4Ljyp2BnhARNaLyAdthykW2tVSxe5yY0yriEwH/iQiW40xj9gOFXba4lFFzRjT6t63Ab8GLrSbqDhoi0cB0NRQHwfmAXPd2zxgGjAOqHBv8ZyfBehyb8kBfj4EtAJ7+2/VtXVHfPujTkJExgERY8xx9+fXAP9qOVZREGOM7QzKJ00N9eOA5cCZ7u0MYD5OoZnkU4xOnCK0B9gGPO3emqpr67p8ygCAiJyK08oB50v4bmPMl/zMUKy08IRUU0N9OXARsAI4HzgPOJ3gdq8zwHO8XIg2Ao9V19YdtZpKeUILT0g0NdRHcQrMte7tMqDcaqixSwPrgYfc26PVtXXddiOpfNDCU8CaGupPA64DXgXU4F93yZZu4DHgYeD+6tq6dZbzqFHSwlNgmhrqFwB/A9wAnGs5jm07gZ8DP62urXvadhg1fFp4CkBTQ/1s4O04Bediy3GCahvwM+Bn1bV1m22HUUPTwhNQTQ31JcDbgA8CVxDcQeEgagJuB1YGafO9epkWnoBpaqifBXzIvc20HKfQdQE/Bb6n40HBooUnIJoa6i8FPgK8FSixHCeM1gLfBH5VXVuXth2m2GnhsaipoV5wulOfwdkUrry3G/gG8APdNG+PFh5Lmhrqr8fZPf8s21mKVCvwJeC26tq6Xtthio0WHp81NdRfh1NwLrCdRQHQAvwbcId2wfyjhccnTQ31NcC/A5fbzqIG9BzwReCe6tq6jO0wYaeFx2NNDfWLgFuB19vOooZlE/CP1bV1j9sOEmZaeDzS1FBfCnwa+CzOaSRU4TDAbcBN1bV1h22HCSMtPB5oaqi/BvgezmknVOE6iLPFcWV1bZ1+UPJIC08eNTXUz8TZVPu3trOovFoDfLi6tq7JdpCw0MKTJ00N9e8Gvg1MtJ1FeaIP+DLwr9W1dX22wxQ6LTxj1NRQPxH4PtrKKRZrgXdW19Y9bztIIdMDD8egqaH+MpytIFp0isclwKamhvp32Q5SyLTFMwru2f6+gLPFKmo5jrLnJzhjP8dsByk0WnhGqKmhfiHOG+5Sy1FUMDyP0/VaaztIIdGu1gi4ex+vQ4uOetkiYFVTQ/3f2Q5SSLTFM0xNDfXvx9k3R09ZoQbzDeDTesjFyWnhOQl3POc/gY9bjqIKw/8BN+i4z9C08AzB3VT+U5wrOSg1XJuBN1TX1u20HSSotPAMoqmhvgr4HbDUdhZVkA4Bb62urWu0HSSItPAMoKmh/mzgAWC67SyqoPUAb6+urbvPdpCg0a1aOZoa6i8BVqFFR41dGfCLpob6t9kOEjRaeLLsfvo3lwN/IvxX5FT+KQHucY/lUy4tPK5ksvnaaadX3z+lavl621lU6ESBlU0N9R+wHSQotPDgFB2cgeT4pHmnXTF54RlrbGdSoRMBftDUUP9R20GCoOgLTzLZfA1O0akAEBGZvHDJpRPnnfaY3WQqhAT4r6aG+o/bDmJbUW/VcovO7xng1KTGmL6D259ed2xfi16rXOWbwTm+6x7bQWwp2sKTTDafDTwKjBtsHmNMqm3Lhqc7Xtyjl6JR+ZYCaqtr6x60HcSGoiw8yWTzKcBTwIKTzWuM6X7x2ac2dx7Yd573yVSROQ7UVNfWbbQdxG9FN8aTTDaXAr9iGEUHQETKZyy/YEl8yoynvU2milAl8H/uJZCKStEVHpzTlI7oonoiEp951sWnVkya9qxHmVTxmgHc39RQf
4rtIH4qqsKTTDZ/AhjVeVNEpHLWOZfNLZswZWueYyl1OnCfey22olA0hSeZbL4O+PpYliEiE+ecd8UppeMn7shTLKX6XYxzPp+iUBSDy8lk8xnAE+Tp0jPGmAN7nnq4o7fzeNH1zZXn3lldW3e37RBeC33hSSabJ+MUndPzuVxjMvv3PPFQX29X57x8LlcVvU7gouraulCPJ4a6q5VMNkeBn5HnogMgEpk178JrJVYe35fvZauiNg74ZVNDfaXtIF4KdeEBvgK82quFSyQyd/5Fr0pFS8tf9GodqiidAfzYdggvhbarlUw2Xwqsxofimkmnm3evfWBiurdnmtfrUkXlE9W1dd+yHcILoSw8yWRzGc4VPpf4tc5Mum/brsfun5Hp653k1zpV6PUA51XX1m22HSTfwtrV+gI+Fh2ASDR2xoJLXrMvEo3p1QVUvpQBdzQ11MdsB8m30BWeZLL5XOAzNtYdiZUsm3/Ja1okEu20sX4VSiuAm22HyLdQdbWSyeYYzsGf59jMkU71bNy19v4lJpN5xek2lBqFXpwu1zO2g+RL2Fo8n8Fy0QGIlpadO//i1zyLSMp2FhUKJcBtTQ31ofm8huYPSSabl+KM7QRCrKx8xfyLX70RkT7bWVQoXAR8xHaIfAlFVyuZbI4Aa4BLbGfJlUp2rN3zxIMX4pzwW6mx6AQWV9fWFfxOq2Fp8XyEABYdgNL4+EvmXnD1WpzTXSo1FuOAL9kOkQ8F3+JJJpsXAM8yxClMg6D72JHVresbr7CdYziipRVUTJxB2bjJlFRMoLRiIiUVlcTK4kRLyhEREPc7yxiMyZDpS9GXStLb1UGq6yi9XcdIJdvpOtpGb5fuYZBHGWBFoZ+1MAz7ByQIeNEBKJ8w+YrZ51zeuG/TmhrbWU4gEcZNmUN88hzGT51H+YRTiERLMJk0EokSiQ7vLRKNlVJSPp6KCc4FWDOZNCbdh0QiGGPoOX6IzsN7SR7ZR8fBXWTSvV7+VWEWAeqBa2wHGYuCbvEkk81VwFYKqIB2Hnph1Qt/efwqmxkisTIqpy9i0uwzGD9tASaTIRKNIRFvh6FMJkMm3YtEonQdfZH21i0ca2umr7vD0/WG1PWFfE32Qi88twM32s4xUh1tratefPapq3xdqQgTplcx7dQLqJg0A5PuI1pS5muEXOm+FCIRUl3HOLhzHUf3bdWW0PBtA86srq0ryK2mBVt4CrG1k+3Yvl2rDmzbeJXX64mVjWPK/LOYuvBcJBIhGrNbbAaT7kshCEdaN3OoZQM9HYdtRyoEH62urfu27RCjUciFZyXwXts5xqJ9b3PjoeeaPBnzKamYyKylV1I5/VTAEImWeLGavDOZNMZk6Dp2gP2bV9HVvt92pCA7CCyorq1L2g4yUgVZeJLJ5tNwWjsFvW+MMca079q+5vDzW/K2tStWGmf64suYPHcpSISIx+M2XjHGYNJ9dB5uZf+WP2sLaHAfq66tu9V2iJEq1MJzB/Ae2znywRiTObxz89r23c9dNpblRKIlnHLaRUxbdB4gw94aFXSZTAZMmqMv7OCFLY/Q16MD0Tl2AacV2lhPwRWeZLL5dGALBd7ayWaMSR/a0fTk0b07R7UT5Lip85h/bi2RWGnBdKlGKpNJYzJp9j/7Z47sDc2xkvnynurauv+1HWIkCrHw3Am823aOfDPG9B3YtmnD8f27LhzucyLREmYtv5pJs5YQiYWz4ORK96XoOtrGnk0Nuhn+Zc8AZ1XX1hXMh7mgDplIJpsXA++wncMLIhI75Yxzzh4/fc664cw/bspczrj674uq6ICzo2J88iwW17yPyXOX244TFGcCr7cdYiQKqvAAnyVEXaxcIlI2fdmK5eOmzRpyd/hpi85n4YVvIVY2rqiKTr9IJEo0Vsqs5dcw9+zrECm0t7EnbrIdYCQKpquVTDZPAfbhnA4y1IwxnfufXruz60hbdfZ0iUSZe9ZrqZxRRTRWNFe7HVKmr5fuzsO0PPlL0
qku23Fsu7S6tm6t7RDDUUhfFe+mCIoOgIiMm3X2JQvKJ0596STfsbI4VZe9gwkzT9OikyUSK6G8chqLr7yR8gmn2I5j2/ttBxiuQmrx/AWoPumMIWKMOdK64ZE2k+aMqktuIBIrIxINbU9zTIwxZNK97F5/Hx0Hd9mOY0sHMLO6ti7w5/wuiBZPMtl8IUVWdABEZPLc8181/bTL35WJlpRr0RmCiBCNlbJgxfXu3tpFaTzwNtshhqMgCg8F1ITMJ5ESKirmTI5ESyISKZR/lV2RaAnzz3t9MRefv7MdYDgC39VKJpsrgBeBUF9LOpdICeXlc4CIc+ItNSKZdC+71v22WLtdi6tr656zHWIohfA1WkuRFR2IUFY2Gy06oxeJlrDg/OuLdcD5fbYDnEwhFJ6/tR3Ab2VlsxCJatEZI4nGWHThXxMtLbrLm70n6JfCCXS4ZLJ5AvA62zn8VFJyCpFIqRadPBARIiVlLLrwrcW2k+Ec4GLbIYYS9P/Gm4Fy2yH8EotNIBYbX2wfEk9FIlHKxk1hzlmvsR3Fb2+0HWAoQX+H32A7gF9ESikpmapFxwORWAkTZp7OpOI6tusNtgMMJbDv8mSyeRxwre0cfikrmwlo98or0Vgps5dfQ6x8vO0oflnW1FAf2H0KAlt4gEtxrhkdeiUlU3Qw2QcSiTLvnFrbMfwU2FZPkAtPsK4/5ZFIpIxYbKJ2sXwQiUSpmDi9mE6noYVnFIqi8JSWzkC7WP7pP51GrKwoulxXNjXUT7QdYiCBLDzJZHM5cIHtHF6LxSZoF8sCiUSZubQgriY9ViXAq2yHGEggCw/OPgghPwWGuGM7Qf0XhFckEmXizNMpGzfFdhQ/XGo7wECC+q4PfTcrFpuIdrEskgizll1lO4UfRnUBAa9p4bEiQknJZG3tWBSJRBk3ZS4Vk2bajuK185oa6gN35rjAvfOTyeZSAr6791iVlEy2HUHhHMs1a9nVtmN4rQw4z3aIXIErPDiDyiE+qk/cQeUgvvTFRUSomHAKZeNDP9YTuO5WEN/9oe5mRaNFsRm3YIhEmLowcA2CfNPCMwxX2g7gpZKSSdraCRCJRJk8ZxkSkks+D0ILzzCcYzuAVyKRMkRC/QYvSAbDpNlLbcfw0tymhvpAnREtUIUnmWyOAzNs5/BKNDoB3YQePNFYKdNOXWE7htcW2w6QLVCFB1hoO4CXYrFxupdyQJVWTAj7ketaeIawyHYAr0QiZWhrJ7iMyTAh3Fem0MIzhNAWnmh0HFp4gisaK2XSnFCP85xuO0A2LTw+iUbHazcr4ComzSISDe0poLTFM4SFtgN4wTkCXa8CGnQm3ce4afNtx/DKaU0N9YH55gta4QlliycSKQeCfeFE5Zybedzk2bZjeKUCmGc7RD8tPD5wBpaD9lKrXCIRxk2ZazuGl+bYDtAvMJ+GZLJ5EjDJcgxPRCIVOr5TIMoqp9mO4KWptgP0C0zhIaTjOwCRSODOSqAGISKUVIT2itlaeAYQym6WHiJRWEwmQ8XE0O48r4VnANNtB/CCU3h0YLlQSCRKaUUgz4+eD4E5/0eQCk8od6DQFk9hiURjlFRMsB3DK9riGUAoP6HO/jtBepnVyZTGQ9vi0cIzgJAWnphu0SowJeU6uOw1LTweEwllDzLUYmVx2xG8EphTCgep8ITymAI9VKLwRGKh3f0hMG/GIBWeULZ49Ij0whPirnFgPmOBCUKwsuRNeN/DYRbhhQPtL9pOkW8iHK+2HcIlxgRjH5NksvnLwE22c+Rbeflc91gtVSi6u7upqAjMcEg+bTLGnGs7BGhXy3NBKexq+DKZjO0IXknbDtBPC49SOfr6+mxH8IoWngGEsvAYE9o3cWi1t7fbjuAVLTwDCGWfxJhe2xHUCL3wwgu2I3jlmO0A/YJUeA7bDuAFY9IYE9oxg1Das2eP7QheCcxnLEiF54DtAF7Qrlbh2blzp+0IXglv4RGRqIhsFJHfj/CpB/OdJQiMS
RPSXmQodXd3s3fvXtsxvBLewgN8DNgyiueFsvBkMr0Eq2GphtLd3c22bdtsx/DKEdsB+uX1EyEic4Fa4LZRPD2UhcfZkKBjPIWioqKC9evX247hldC2eL4FfIbRfdLa8hslODKZHtsR1DB1dHRw8GBIvwPDWHhE5PVAmzFmtF8XLwKh3PacTnfrHswFYuPGjbYjeCkw+wnks8VzGfBGEWkBfgpcIyJ3DffJ8XhVBmjNY57AcFo82t0KulQqxapVq2zH8FKz7QD98lZ4jDE3G2PmGmMWAjcADxtj3jXCxezOV54gyWS60QHm4Ovq6uKxxx6zHcMrR4wx4etq5UkoCw9kMCZlO4Q6iVgsxurVq23H8MoO2wGyeVJ4jDGrjDGvH8VTQ1p4oK/vuO7BHHAPPvhgmA8QDX/hGYPnbQfwSjqdtB1BDeHYsWPcc889tmN4KTDjOxC8wrPBdgCvGNOrLZ4AKysr449//KPtGF7SFs8Q/gJ02Q7hlXRau1tBtW7dOo4ePWo7hpeesx0gW6AKTzxe1QeEdkeKvr7AnJVAZTl27Bhf//rXbcfwUhp42naIbIEqPK4nbAfwijF9uhdzAPX29vL734/0mOaCstkY02k7RDYtPD7r7W3X7laAdHV1ceutt5JOB+bkfF540naAXEEsPIF7kfIpk0miezEHyw9+8APbEbwWuM9U4ApPPF71PCE9KVg/bfUEQyqVoqGhgRdfDN0ltHJp4RmmUHe3nEFmPWjUtnQ6zac//WnbMbyWBJ6xHSJXUAtP4Cp0fhlSqUPa6rGou7ubO++8k5aWFttRvLbRBPD8u0EtPKFu8UD/Pj2hHtAMtHQ6zec//3nbMfwQyIPPglp4nqQI+iK9vQe11WNBMpnkW9/6FgcOhHoosd8DtgMMJDDXTs+VTDY/CyyzncNrZWWziUTKEAnqd0D4HD58uHf+/PklnZ2B2rXFC53AFDPMUyOIyI+B/hP6nellsCC/239jO4AfUqnQb1EJlFQqxe9+97uSq6+++nER2W87j8cah1t0XCuB6zzKcoIgF557bQfwgzFpUintcvmht7eXZ555hpaWFlasWHHxTTfdVLlw4cJGAnRp3zxrGMnMxphH8Om8zIHtagEkk83bgdNt5/CDdrm819HRwa233kpv74mn9t69e/fWu+66K5NKpcLWtV9gjBnROa5EZCHw+2LuakGRtHpAu1xe6+3t5Re/+MUrig7A/Pnzl9x0001LLr744kcI0PXFx6hppEXHT0EvPD+3HcAvxqTp6XlBu1weSKVSPPzww+zatWvQeSKRSOS666678pOf/GTXlClT1voYzyu/sR1gKIHuagEkk83bgMW2c/glFptASclU7XLlSSqVYuvWrfz6178e0fOefvrpdb/97W9nZDKZeR5F89oZxpjtI32SdrVeVjTdLXAOp0inO7Tlkwd9fX0cPnyY++67b8TPPfvss1fcfPPN0xYvXryKwrve21OjLDr3AGuBM0Rkr4j8ff6juesqgBbPWQTsJEZ+KCubQyRSqi2fUcpkMnR1dfH973+fse6vs2/fvh133nlnsru7+6w8xfPaR40x37YdYiiBLzwAyWTzVuAM2zn8FaG8fA4iMS0+I5TJZOjp6eG2227j8OH8bB02xpg///nPax555JEzgcl5Wag3+oDZxphA75ZdKO/ooupuOTJ0d7diTJ92u0Ygk8mQSqX48Y9/nLeiAyAics0111zxqU99Kj19+vQ1eVtw/t0f9KIDhdPiqcY5EXwR0pbPcGUyGbq7u7n99ts5ePCgp+vaunXrpnvvvXdiOp1e5OmKRu4GY8zPbIc4mYIoPADJZPNTwArbOeyIUFY2S8d8htDX10dXVxe33347R44c8Wudqd/85jePPfPMMxcD5b6sdGhHgDnGmMBfqaWQCs/bKKL9egZSWnoK0eh4LT45UqkUbW1t3H333XR1+f+ZO3DgwK6VK1ce6uzsPM/3lZ/oq8aYmyxnGJZCKjwRY
CtFcgjFYHQ/nxOlUimampr4wx/+QCZjdyzs0UcfffTBBx9cbIw5xcLqe4FFxphWC+sesYIpPADJZPMHgdCfmftkIpEKyspmAhRtATLG0NfXx/3338/69ettx3lJV1fX0bvuuuvp1tbWKwDxcdV3G2Pe6eP6xqTQCk8Z0ALMtBzFOpEopaUzivLA0lQqRWdnJ/feey/79wfzzBbNzc1N99xzT1lfX59fe92vMMYEpwKfREEVHoBksvkm4Mu2cwRFNFpJScm0DM7hRrbjeKq/lfPEE0+watWqwF8LK51O9zU0NDy6YcOGFcA4D1e12hhzpYfLz7tCLDwTgd3ABNtZgiCdznQ+++yhY0uWLJlVWVlJNBq1HckThdDKGczhw4f3rly5ct+xY8cu9GgVbzHGjOxgNMsKrvAAJJPNXwNCf12S4di69UDj8eM9NQBTp07ltNNOIxaLEYvFbEfLi1QqRTqd5uGHH2bDhg3WB5DHYt26dY83NDQsMMbMyuNitwHLTIHtZVqohWc28DxQajuLTUePdj+zffvBZeTsgT5jxgxOPfVUIpFIwRag/m7Uo48+enzNmjWVA51HpxD19PR03HPPPetbWlouB/LRPH27Mabg9uwvyMIDkEw23wZ4dvRs0GUyJrVhQ+tuYzhtoMdFhNmzZzN//vyCKkB9fc4loPbv38/u3bvZunXrI3v37i2o8Yvh2L1795a77rrLjPGsh+uBC0wBfogLufCcAWymcI43y6sdOw6tOnKk66rhzDtlyhTmzZtHZWUlIkLQBqEzmQzGGLq7u9mzZw9tbW30vy8zmUxq9erVbcaYuZZj5l0mk8k88MADqx9//PFzGd2Y5WuNMYG8fM3JFGzhAUgmm38CvMN2Dr91dqaaN29um8cIu5plZWXMnj2bGTNmvNQCsjUYnclkXio4hw4dorW1lY6OjgHnff7551fv2rXrCp8j+ubo0aMv3HHHHc8fPnz4khE8bZUx5mrPQnms0AvPXJy9mb3cVBkoxpjMxo37NqfTYztDXEVFBVOnTmX69OmMGzeOTCZDJBLxrDVkjCGdTiMiLx3icOjQIY4fP37S52Yymb7Vq1e3GmMWeBIuIEZ41sNLjDGPex7KIwVdeACSyebPAv9uO4dfdu1qb2xr66jJ5zJjsRiVlZVUVlYyadIkxo8fTzQafWkLkogMu2XU35Lpfx5AZ2cn7e3tHD9+nOPHj9PT0zPijLt37350586dl434iQWmt7e36957731i+/btlwElg8x2nzHmej9z5VsYCk8ZzljPqbazeK27u29vU9MLk/GhhVdSUkJFRQWlpaWUlZVRWlr60u+RSOSlomKMIZPJ0NvbS3d3Nz09PfT09JBKpV76PR+MMZlHHnnkeWNMVV4WGHBDnPUwBVSP5tSmQVLwhQcgmWy+noCfVT8fNm3at663N1OkpwaBvXv3rt2xY8dIxkEK2iBnPfwPY8xnbebKh1AUHoBksvn/8Onyqzbs23fs0dbWY6HvagzFGGNWr169PZPJFNVpcDs6Og7eeeedW9va2uYCy40xSduZxipMhWcR8AwQt50l33p70wc3bdofAabYzmLb/v37n9y2bZtXhx4EWmtr61/98Ic//KPtHPkQrB06xiAer3oeSNjO4YWtWw9sR4sOALNmzbowGo1utp3DgnvDUnQgRIXH9U1gg+0Q+XTwYOdT3d19l9rOESSLFy8u+K7GCLUDH7UdIp9CVXji8ao08AEg2OdLGKZ0OnP8+eePzLGdI2hmzJixIhaLFdPJ/z+RSCResB0in0JVeADi8aoNwDds58iH7dsPbgRm284RREuWLCmoo7HH4GeJRGKl7RD5FrrC4/ocULB7dQK0t3f9paMjFdrDBMZq2rRp55SUlGy0ncNju4B/sB3CC6EsPPF4VQp4GxD4C5sNJJMxPTt2HKrE33P2FpylS5cWxiH3o5MG3pVIJNptB/FCKAsPQDxetRe4gQIc72luPrTWGIJ2objAm
TJlSnVpaelTtnN45EuJRCLIVywdk9AWHoB4vOphnG5XwejoSG1vb+8u6h0FR2L58uXjbWfwwGPAv9oO4aVQFx7XV4Hf2g4xHMaY9LZtB/oY/OBAlWPixIlLy8vLC3o8L8dB4B2JRKLgWuojEfrCE49XGeC9wHO2s5zMrl3tazIZM5Yz0hWl5cuXTwXCsJWrF3hrIpHYZTuI10JfeADi8aqjwFuBwO541t3du/vAgc4LbOcoRJWVladXVFSEodXzT4lE4hHbIfxQFIUHIB6vagI+aDvHYLZsOXCQEB5n5pfly5fPogA3JGT5diKR+JHtEH4pmsIDEI9X/QT4ru0cuVpbj63p68ucZztHIRs/fvyicePGrbWdY5T+BHzCdgg/FVXhcX0CeNh2iH6pVLpt375jYzqNqXIsX758Ps44SSHZDrw97IPJuYqu8MTjVb3AG4HVtrMAbN3a1gxMsp0jDOLx+PzKyspCGutpBa4L606CQym6wgMQj1d1Aq8DrDbN29o6nujpSRfNGfX8sGzZsiogP+db9dYB4NWJROJ520FsKMrCAxCPV3UAfwVY2fO1ry9zdNeu9lBfNcGGioqK2RMnTgx6q+co8NpEIrHFdhBbirbwwEub2V8L+H6w4bZtB/4CzPR7vcVg2bJlS4Eu2zkG0Qn8VSKRCPsBrkMq6sIDEI9XHQFeDTT5tc4jR7o2JZO9l/u1vmJTVlY2ffLkyU/azjGAHuD6RCJRqFvf8qboCw9APF51CHgV4HnTN5PJdDU3H5qMHnnuqaVLl54JDHxpUju6gbckEomHbAcJAi08rni8qg24Bmfzpmd27Dj8hDHo2I7HSktLp06dOnWd7Ryu4zjdqz/YDhIUWniyxONVL+AUn2Yvln/8eM/Wo0e79eRePlmyZMm5OAO5Nh0GXpVIJFZZzhEoWnhyxONVrUANkNdvS2NM3/btBwGGdy1gNWYlJSUTp0+fbnMQdw9wRSKRCOJ4k1VaeAbgFp8rgLvztcyWliNrMhmzJF/LU8OzePHi83FaHX57Frg0kUgU46V4TkoLzyDi8arueLzqncD/Y4ynXOjq6m05eDB5cX6SqZGIxWKVM2fO9G2LpetBnJbOXp/XWzC08JxEPF71NeANjHKswBhjtm490A6U5zOXGr7TTz/9Avw7/3Y9zmEQR4b7BBGZJyJ/FpHNIvKsiHzMw3yBEJpLGHstmWxeAtwHnD6S5+3de3T1/v3HdUDZsueee+6R1tbWKz1cRRfw/kQiMeLuuYjMAmYZYzaISCWwHniTMSa03TRt8QxTPF61FbgQuH+4z0ml+l7Yv//4Wd6lUsNVVVV1EbDfo8XvBi4bTdEBMMbsN8ZscH8+jrM/Wagv5KiFZwTi8ap2oJZhXjBwy5YDu4CJXmZSwxOJRMrmzZu3w4NFrwJW5OsQCBFZCJwLPJGP5QWVFp4Riser0vF4VR3OeZy7B5vvxRc71qZS6Yv8S6ZOZtGiRReLyJ48La4X+CzOPjp5GT8SkfHAL4GPG2OO5WOZQaVjPGOQTDYvBVbidMFe0tubPrJp0/4+4BQbudTgWlpa1rS0tIz1OLmtOBfbW5+PTAAiUgL8HrjfGBOKS3APRVs8YxCPV20BLgVuJuscMNu2HXwWLTqBtGDBgktEZLTnwDHAd4Dz8lx0BPgfYEsxFB3QFk/eJJPNy4GVhw8npbn58Pm286jB7d69+7GdO3deOsKn7Qfel0gkhr1xYbhE5HKcM2I28fI+Y/9ijAntsV1aePIomWyObdq07596ezNfBips51EDM8ZkVq9evTOTyZw2jNkzwA+BzyYSCRt7QIeSFh4PNDY2ngr8N855flQAtba2Pv7cc8+dbG/yp4APJxKJoBzlHhpaeDzU2Nj4NuArwKm2s6gTGWPM6tWrt2UymYGOnzsE/AtwWyKRCMMVSgNHC4/HGhsbS4F/Bj4HTLYcR2XZv3//U9u2bcu+emsGZ5D35kQicchSrKKghccnjY2NU3CKz
z8BpZbjKNfq1aufSafTZ+IcDvPZRCLxjO1MxUALj8/c8Z8vAW9Hd2ewrq2t7Y7Nmzf/QM+D7C8tPJY0NjaeDnwGeA/aArLhz8AtNTU1j9gOUoy08FjW2Ng4B/gk8EFgvOU4YZcGfg18q6am5lHbYYqZFp6AcMeAPgL8A3q9rXw7AvwI+G5NTc1u22GUFp7AaWxsjOGceOwDOBcb1HGg0dsM3Ar8b01NTdJ2GPUyLTwB1tjYOB/4O/c2z3KcQnEI+DnwE+1OBZcWngLQ2NgYAV4DvA14IzDNbqLA6QJ+B9wF/LGmpqbXch51Elp4CkxjY2MUuBJ4C/BmQn6muiEcBf6EcyqJX9XU1By3nEeNgBaeAtbY2CjARThjQlcDK4ASq6G89TTwf+7tsZqamj7LedQoaeEJkcbGxnHAZcBV7u0CIGYx0likgWdwTgG6FnigpqZmn91IKl+08ISYW4guAM4GznLvlxO8S+0YnKtursMpNE8A62pqajqtplKe0cJTZNwxosU4hWgpztay+e79PCDu0aoNzhanZmB71m0b8Jxu7i4uWnjUCRobG6fiFKJZwCScq2RMxNmrugKnMJUBfVm33qyfe3AKzIGc2yEdk1H9tPAopXyne8UqpXynhUcp5TstPEop32nhUUr5TguPUsp3WnjUCUSkXESeFJGnReRZEfmi7UwqfHRzujqBezndccaYDvd63muAjxljHrccTYVIoR7HozxinG+iDvfXEvem304qr7SrpV5BRKIisgloA/5kjHnCciQVMlp41CsYY9LGmHOAucCFInKm5UgqZLTwqEEZY9pxLgNzneUoKmS08KgTiMgpIjLJ/bkCeDWw1WooFTo6uKxyzQLuEJEozhfTz40xv7ecSYWMbk5XSvlOu1pKKd9p4VFK+U4Lj1LKd1p4lFK+08KjlPKdFh6llO+08CilfKeFRynlOy08SinfaeFRSvlOC49SyndaeJRSvtPCo5TynRYepZTvtPAopXynhUcp5TstPEop32nhUUr5TguPUsp3/x/1c62OXy/bvgAAAABJRU5ErkJggg==\n" }, "metadata": {} } ] }, { "cell_type": "code", "source": [ "# you can use various libraries to work with reviews: SentimentIntensityAnalyzer, transformers and textblob" ], "metadata": { "id": "gRp6ILtBFpGJ" }, "execution_count": 17, "outputs": [] }, { "cell_type": "code", "source": [ "pip install -q transformers" ], "metadata": { "id": "PSB7vEagTauK", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "73c1aa64-419a-49b0-9067-f9d55755ad29" }, "execution_count": 18, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m6.3/6.3 MB\u001b[0m \u001b[31m58.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.6/7.6 MB\u001b[0m \u001b[31m28.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K 
\u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m190.3/190.3 KB\u001b[0m \u001b[31m19.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h" ] } ] }, { "cell_type": "code", "source": [ "# Build rt: a one-column data frame holding the review texts, one review per row,\n", "# with the \"reviews.text\" column cast to string type in the same step.\n", "rt = data[[\"reviews.text\"]].astype({\"reviews.text\": str})\n", "rt" ], "metadata": { "id": "IS6EdnaEcchV", "colab": { "base_uri": "https://localhost:8080/", "height": 419 }, "outputId": "447ddf40-c104-4295-dd68-f80be0ea8588" }, "execution_count": 19, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " reviews.text\n", "0 Pleasant 10 min walk along the sea front to th...\n", "1 Really lovely hotel. Stayed on the very top fl...\n", "2 Ett mycket bra hotell. Det som drog ner betyge...\n", "3 We stayed here for four nights in October. The...\n", "4 We stayed here for four nights in October. The...\n", "... ...\n", "35907 Best of the Best!!!! My family and I stayed in...\n", "35908 Amazing Vacation in Beautiful Cabin We stayed ...\n", "35909 My husband and I stayed at Tree Tops which is ...\n", "35910 to share your opinion of this businesswith YP ...\n", "35911 xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx\n", "\n", "[35912 rows x 1 columns]" ], "text/html": [ "\n", "
\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
reviews.text
0Pleasant 10 min walk along the sea front to th...
1Really lovely hotel. Stayed on the very top fl...
2Ett mycket bra hotell. Det som drog ner betyge...
3We stayed here for four nights in October. The...
4We stayed here for four nights in October. The...
......
35907Best of the Best!!!! My family and I stayed in...
35908Amazing Vacation in Beautiful Cabin We stayed ...
35909My husband and I stayed at Tree Tops which is ...
35910to share your opinion of this businesswith YP ...
35911xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx
\n", "

35912 rows × 1 columns

\n", "
\n", " \n", " \n", " \n", "\n", " \n", "
\n", "
\n", " " ] }, "metadata": {}, "execution_count": 19 } ] }, { "cell_type": "code", "source": [ "# The transformers library uses various pretrained models to classify text and compute a score.\n", "# Well-known model names are e.g. XLNet, BERT, XLM, RoBERTa, ...\n", "from transformers import AutoTokenizer, AutoModelForSequenceClassification, pipeline\n", "model_name = \"nlptown/bert-base-multilingual-uncased-sentiment\"\n", "model = AutoModelForSequenceClassification.from_pretrained(model_name)\n", "tokenizer = AutoTokenizer.from_pretrained(model_name)\n", "classifier = pipeline('sentiment-analysis', model=model, tokenizer=tokenizer)\n", "classifier(\"Really lovely hotel. The best one. Tip top.\")" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 195, "referenced_widgets": [ "00e8d3fcbf2d458bafe70cc30d0f4d71", "d7bf9f7e23424722ad51e66bb3d31f44", "c9bd1206b2994609bd8b24dc3c886c3d", "4d820a0721284de4be381f6bbe7c65d1", "0dd480987916438a9035503b9239bf40", "37023318069b4eef84f3d260f1ac50b0", "c1b27f95737543d0986adf61b65727b6", "46f00edbac234bbf8338cf348a1bcfbd", "0d658060ac90494cb1919f07f0e9997a", "4d781dd1856e4ef7bbb61c2499fa877e", "4196b57142dd48a886a9ace940eb0576", "cefb3a3a50df4328a3e1aa60badada6a", "33e5462c902a4b288a2ae70f2969e45c", "d343de84a884458ea45ae9165403ed4f", "44906a4d83194bbb93b9c2baf26488b0", "0833d76a8409412783b717428133224c", "342fb5d6c1cf4e2ba8bfce1399e31220", "2edb942445304bbf9b0459e5fa90e65a", "526ee09f2d484dcb847749a9783c988a", "2654938824504c94b4df4e611c1ef86b", "4abeac3a7e5d4509bfe8f641c1a1282a", "45c0f75862b342929e079aba2c4ac4b0", "3e3c80723f5f4711ac0c227236a1a201", "408426c5dcf04f8082ec780d29029c70", "435c05a24bf54d9cb91a3b4f2e9090d2", "0e7711bc07e64d85b7ac8abc860a58ce", "1e2a62f855e3494bb57a648336928846", "3c8df1db53ff4b43b8ccf14254f85d8f", "7b60fcabf8a043aa8d89acafe180a4b3", "96b7996fb677443ba8c1069462715117", "b567696494c34339ab1ae5aa8c181dcd", "14ed949745fb4da48ff76534a5bc717d", "2b937004c5d84052847af445e97f6bf1", 
"455ed1b6ed1b46de9c0ae7bf7ec96610", "1fe1ce8e634c4126af673f8944c04f0a", "049258c530914ffc94d1e7b094200a82", "7e8e512bba0f420d952111be7118ae32", "e931fbbdaa8043b6b13e2ef99932df1b", "cd9851e4c27c403b97b86627894da956", "3db33dafa4064615ac12ba02bab0912f", "8fcb8f329cac4c688c5cfd2c00bb6cc0", "fddeb9d892fe47b4accd3d0b9ea6c71d", "c68fe70b5a464fb39f42595edd5eccb3", "99715c01e04c4d55b5a3fd37a9f1a09b", "5045cfb8d210405ea681b5a5aedd81c3", "602e280b413a44f6b3fb594441e7c20b", "c99995914494484c877419709f18b27d", "e6ed602ce673438ba07f7c6cafdf38bf", "40c6cca6491f40558168c9e3b1b122e9", "06e4ef984cae41669bb2639ebcd37725", "765d919a626f41679c39eee4c13f6c44", "58979a1334ab4f16b18d6113f403e931", "e9f24b5c29ed416aadaddba33892e140", "e90ae2754c0441aa8a98c76034d4dc00", "6237552000bc4a57a62f677b3027d909" ] }, "id": "hY2iPiO7yM0Z", "outputId": "e5caf34d-0853-413e-9bff-65a65cfd3757" }, "execution_count": 20, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Downloading (…)lve/main/config.json: 0%| | 0.00/953 [00:00\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
reviews.textPositiveNegativeNeutralCompound
0Pleasant 10 min walk along the sea front to th...0.2520.0520.6950.8299
1Really lovely hotel. Stayed on the very top fl...0.4810.0190.5000.9828
2Ett mycket bra hotell. Det som drog ner betyge...0.0000.0001.0000.0000
3We stayed here for four nights in October. The...0.2890.0000.7110.9643
4We stayed here for four nights in October. The...0.2890.0000.7110.9643
\n", "
\n", " \n", " \n", " \n", "\n", " \n", "
\n", " \n", " " ] }, "metadata": {}, "execution_count": 23 } ] }, { "cell_type": "code", "source": [ "# Classify the Compound column into a Sentiment label.\n", "# Rule: score >= 0.05 is Positive, score <= -0.05 is Negative, anything in between is Neutral.\n", "def label_compound(value, threshold=0.05):\n", "    \"\"\"Return 'Positive', 'Negative' or 'Neutral' for a single compound score.\"\"\"\n", "    if value >= threshold:\n", "        return 'Positive'\n", "    if value <= -threshold:\n", "        return 'Negative'\n", "    # also reached for NaN, because both comparisons above are False for NaN\n", "    return 'Neutral'\n", "\n", "score = rt[\"Compound\"].values\n", "sentiment = [label_compound(value) for value in score]\n", "rt[\"Sentiment\"] = sentiment\n", "rt.head()" ], "metadata": { "id": "9BxkcztYxPS8", "colab": { "base_uri": "https://localhost:8080/", "height": 204 }, "outputId": "c0e22331-40da-4210-f23d-6c96d6d8bbe5" }, "execution_count": 24, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " reviews.text Positive Negative \\\n", "0 Pleasant 10 min walk along the sea front to th... 0.252 0.052 \n", "1 Really lovely hotel. Stayed on the very top fl... 0.481 0.019 \n", "2 Ett mycket bra hotell. Det som drog ner betyge... 0.000 0.000 \n", "3 We stayed here for four nights in October. The... 0.289 0.000 \n", "4 We stayed here for four nights in October. The... 0.289 0.000 \n", "\n", " Neutral Compound Sentiment \n", "0 0.695 0.8299 Positive \n", "1 0.500 0.9828 Positive \n", "2 1.000 0.0000 Neutral \n", "3 0.711 0.9643 Positive \n", "4 0.711 0.9643 Positive " ], "text/html": [ "\n", "
\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
reviews.textPositiveNegativeNeutralCompoundSentiment
0Pleasant 10 min walk along the sea front to th...0.2520.0520.6950.8299Positive
1Really lovely hotel. Stayed on the very top fl...0.4810.0190.5000.9828Positive
2Ett mycket bra hotell. Det som drog ner betyge...0.0000.0001.0000.0000Neutral
3We stayed here for four nights in October. The...0.2890.0000.7110.9643Positive
4We stayed here for four nights in October. The...0.2890.0000.7110.9643Positive
\n", "
\n", " \n", " \n", " \n", "\n", " \n", "
\n", "
\n", " " ] }, "metadata": {}, "execution_count": 24 } ] }, { "cell_type": "code", "source": [ "print(rt[\"Sentiment\"].value_counts())" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "axjS8sPOE0kd", "outputId": "616fc816-ef6f-45c6-e4b2-ca7ef995a549" }, "execution_count": 27, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Positive 26819\n", "Negative 6201\n", "Neutral 2892\n", "Name: Sentiment, dtype: int64\n" ] } ] }, { "cell_type": "code", "source": [ "rt" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 419 }, "id": "v14_GEZ2rS67", "outputId": "132eadb5-713a-495c-979d-8cd72a153ed2" }, "execution_count": 28, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " reviews.text Positive Negative \\\n", "0 Pleasant 10 min walk along the sea front to th... 0.252 0.052 \n", "1 Really lovely hotel. Stayed on the very top fl... 0.481 0.019 \n", "2 Ett mycket bra hotell. Det som drog ner betyge... 0.000 0.000 \n", "3 We stayed here for four nights in October. The... 0.289 0.000 \n", "4 We stayed here for four nights in October. The... 0.289 0.000 \n", "... ... ... ... \n", "35907 Best of the Best!!!! My family and I stayed in... 0.293 0.011 \n", "35908 Amazing Vacation in Beautiful Cabin We stayed ... 0.288 0.000 \n", "35909 My husband and I stayed at Tree Tops which is ... 0.217 0.016 \n", "35910 to share your opinion of this businesswith YP ... 0.263 0.000 \n", "35911 xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx 0.000 0.000 \n", "\n", " Neutral Compound Sentiment \n", "0 0.695 0.8299 Positive \n", "1 0.500 0.9828 Positive \n", "2 1.000 0.0000 Neutral \n", "3 0.711 0.9643 Positive \n", "4 0.711 0.9643 Positive \n", "... ... ... ... \n", "35907 0.695 0.9854 Positive \n", "35908 0.712 0.9759 Positive \n", "35909 0.766 0.9965 Positive \n", "35910 0.737 0.6124 Positive \n", "35911 1.000 0.0000 Neutral \n", "\n", "[35912 rows x 6 columns]" ], "text/html": [ "\n", "
\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
reviews.textPositiveNegativeNeutralCompoundSentiment
0Pleasant 10 min walk along the sea front to th...0.2520.0520.6950.8299Positive
1Really lovely hotel. Stayed on the very top fl...0.4810.0190.5000.9828Positive
2Ett mycket bra hotell. Det som drog ner betyge...0.0000.0001.0000.0000Neutral
3We stayed here for four nights in October. The...0.2890.0000.7110.9643Positive
4We stayed here for four nights in October. The...0.2890.0000.7110.9643Positive
.....................
35907Best of the Best!!!! My family and I stayed in...0.2930.0110.6950.9854Positive
35908Amazing Vacation in Beautiful Cabin We stayed ...0.2880.0000.7120.9759Positive
35909My husband and I stayed at Tree Tops which is ...0.2170.0160.7660.9965Positive
35910to share your opinion of this businesswith YP ...0.2630.0000.7370.6124Positive
35911xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx0.0000.0001.0000.0000Neutral
\n", "

35912 rows × 6 columns

\n", "
\n", " \n", " \n", " \n", "\n", " \n", "
\n", "
\n", " " ] }, "metadata": {}, "execution_count": 28 } ] }, { "cell_type": "code", "source": [ "# import the plotting libraries and define the slice colors\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns \n", "cmap = (\"beige\", \"silver\",\"grey\")\n", "# value_counts() orders the classes by frequency, whereas unique() returns them in\n", "# order of first appearance; taking the labels from the counts' own index keeps\n", "# every slice paired with the class it actually measures.\n", "sentiment_counts = rt[\"Sentiment\"].value_counts()\n", "# plot the shares\n", "plt.pie(x=sentiment_counts, labels=sentiment_counts.index, colors=cmap , autopct='%1.0f%%')\n", "plt.show()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 248 }, "id": "LOplb3NvpZBk", "outputId": "fb381756-9cb0-468b-cc99-e68a1fae78fa" }, "execution_count": 49, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "iVBORw0KGgoAAAANSUhEUgAAARIAAADnCAYAAADSH9k9AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/NK7nSAAAACXBIWXMAAAsTAAALEwEAmpwYAAAiDUlEQVR4nO3deXxU5d338c8vJKAHwiYJ+zoEEMqiLAIhHJWCuNSn0lat1aq1dam11u3R+txPY+3dqrXWWuvdhd63UhQqLq0LjyDKptYlIiooxTgQ9l0DyGFL5nr+OCcwYCDLZOY6M/N7v17zSjJz5pzfJJPvXNd1zrmOGGNQSqlE5NguQCmV/jRIlFIJ0yBRSiVMg0QplTANEqVUwjRIlFIJ0yBRSiVMg0QplTANEqVUwjRIlFIJ0yBRSiVMg0QplTANEqVUwjRIlFIJ0yBRSiVMg0QplTANEqVUwjRIlFIJ0yBRSiVMg0QplTANEqVUwjRIlFIJ0yBRSiVMg0QplTANEqVUwjRIlFIJ0yBRSiUs13YBqmE8L9oS6BHcugdfuwFtgZbBzYn7PgfYD+w76rYH2ARsOOq23nEiO1L2glRGEL2IeDh5XrQ5MBQ4Jfg6GBgInJSCzW8HlgEfxt0+cpzI3hRsW6UhDZKQCFoaLjARKMEPjuZWizpSDD9QFgDzgcWOE9lltyQVFhoklnheNAcYgR8cE4ExhCs46lINLMEPlZeA1x0nErNbkrJFgyTFPC96GvBt4EKgs+VymtIm4BngKTRUso4GSQp4XnQQfnhcDEQsl5MKG/FD5XHHibxjuxiVfBokSeJ50TzgW8CNwCjL5di0FPgz8ITjRL6wXYxKDg2SJuZ50QLgGuA6oIvlcsJkJ/A/wMOOE1ltuxjVtDRImojnRfsBd+B3YU6wXE6YxfDHUX7uOJEVtotRTUODJEGeF+0BlAKXA80sl5NOYsBM/EApt12MSowGSSN5XrQQ+D/43ZgWlstJZ9XAdOBu7fKkLw2SBvK86InAT4Gb8Q9BV03jIPAQfgtFB2XTjAZJA3he9GzgEaC37Voy2HrgJseJPG27EFV/KT37V0TuFJG/Hufx74jIy6msqT48L9rZ86KzgP+HhkiydQOe8rzoXM+LFtkuRtVPnS0SEakAOuL3ZffgHw79I2NMQs1PEekFrAbyjDFViawrWYLD2H8I/BJobbmcbLQf/3f/K8eJVNsuRh1bfVskXzPGtAJOxT8/5D+SV1I4eF60CzAPeBgNEVtaAHcDiz0vqi3BEGtQ18YYswG/RfIVETlfRD4SkUoRWSgiJ9csJyK3i8gGEdktIitFZEJw/10i8niw2OLga6WIfCEiY0TkChF5PVj2jyLym/jti8hzInJz8H0XEXlGRLaJyGoR+XHjfgVf5nnR84APgDObap0qIWOB9z0vepntQlTtGhQkItIdOAfYjX8MwE+AAvyxgxdEpLmI9Ad+BIw0xuQDZwEVtaxufPC1rTGmlTHmzaMenwlcJCISbLsdMAn4u4jkAC/g/7N3BSYAPxGRsxryeo7medEWnhf9fbDuDomsSzW51sDfPC86w/OibWwXo45U3yD5p4hUAq8Di4CPgdnGmHnGmIPAb4AT8T85qvGbpANFJM8YU2GMiTaittcAgz83B8A3gTeNMRuBkUCBMeZuY8wBY8wqYCr+SXGN4nnRvsDbwA2NXYdKiW8D73ledKDtQtRh9Q2Srxtj2hpjehpjfoh/DsmamgeNMTFgHdDVGPMpfkvlLmCriPxdRBp8zonxR4H/jv/GAbgEeCL4vifQJehWVQYhdyf+oHCDeV70dPwQGdqY56uU6wO85XnRc20XonyN3f27Ef+fGYCg+9Edf85PjDEzjDHjgmUMcF8t66jPASwzgW+KSE/gNPxT08EPrdVBuNXc8o0x5zT0hXhe9HvAy0D7hj5XWZUPPO950dtsF6IaHySzgHNFZIKI5AG34O+q+5eI9BeRM
0WkBf4kw3vxz6s42rbg/j7H2ogxZin+/KF/BeYaYyqDh94BdgeDuieKSDMR+YqIjKzvC/C8aI7nRX8N/DeQV9/nqVDJAX7tedFpnhfV0xQsalSQGGNWApfi7xrdDnwNfxfxAfzxkXuD+zcDhfiHlB+9Dg//GIE3gu7J6GNsbgbw1eBrzXOrgfOAYfjHotSETb0G4YLD3J8B9NMsM3wXmOt50Va2C8lWWXeIvOdF84EXObzXSGWOt4HJjhOptF1ItsmqIPG8aDtgDtk9Y1mmWwpMcpzIdtuFZJOsCZIgRF7BPzpXZbaPga86TmST7UKyRVYEiYZIVvoUcB0nstF2Idkg44PE86IO/kWdtDuTfZYBJY4T2Wm7kEyX0RcR97xoM+BJNESy1WDgOd01nHwZHST4kxCdZ7sIZZULPBFMCaGSJGN/uZ4X/Sn+fKpKfQP/mCeVJBk5RuJ50UuBvwFiuxYVKrc6TuQB20VkoowLEs+LjgDeIL0uyK1SowqY4DiRxXUuqRoko4LE86Jt8Q9I6mW3EhVim4FT9RiTppVpYyTT0BBRx9cJmOV50VzbhWSSjAkSz4veCpxvuw6VFsYBv7ZdRCbJiK6N50XH4s/cpp8yqiEucJzIP20XkQnSPkiCU8eXEzfRklL1tBX4iuNEttkuJN1lQtfmHjREVOMUAn+yXUQmSOsWiedFi/Eva5EJgajsudhxIk/aLiKdpW2QBOdPvA8MsFyKSn9bgYGOE9lhu5B0lc6f5D9DQ0Q1jULgt7aLSGdp2SLxvOgg/NaI7qVRTcUAox0n8o7tQtJRurZI7kdDRDUtAR60XUS6Srsg8bzomcDZtutQGWms50UvtF1EOkqrIPG8qOC3RlKmsHDIEbf8/H7ccsvPAVizZj0tW/Y94vF77/3Doec++OBUevQYyYgRk1m+fOWh+998cwkXXXRtKl+Gqr97dSKkhku37sF3SPG8q1u3fnjo+y++2EOfPmO44IIjG0QbN75Hbu6Rv8pNm7byt789xfLl85kx4x+Ulv6GZ56ZSlVVFT/96a+YNu2hlNSvGqw3cCN6CH2DpE2LJPiU+E+bNfzzn3MpKDiJ4uK6L+i3fv1GhgwZSOvW+ZxxRjEVFWsB+MMfHuPccyfQs2e3ZJerGu9Oz4u2tl1EOkmbIAG+h+UjWJ944lkuueTr+Jc6PmzAAJeiomKuueZ2tm//DIA+fXry0UcrqazcxYIFb3DyyUWsX7+Rp59+kRtv/L6N8lX9tQGus11EOkmL3b/BfJsrgb62ali7dgODBp3BsmWv0qtXd8Dv6nzyySqGDDmZHTsqufnmUnbv3sPzzz8GwKxZL/C7302lsLADv//9L7j99l9y9dWXsmPH50yd+jht2rTmwQfvomvXzrZeljq2zUBvx4nss11IOkiXIPkm8JTNGu677xHmz3+duXNnHnOZzZu3EYmMYfPm98nPP/IytHPmLGDmzOd48MG7GD36PN599yVmz36VOXMW6HhJeF3nOBE9F6ce0qVrY/1i3zNm/INLLply3GVqujyx2JHhvHfvPkpLH+Dee39KNFpBt26dad06n+HDh7B8+b+TVrNK2G3BJU1UHUIfJJ4XHY/l69K89dZ7bNy4hSlTjtxbU1b2Pp98sopYLMaOHZ9z2213M378abRpk3/Ecvfd9wiXXjqFzp070q1bF8rLV7Nly3YWL36LXr16pPKlqIbpA+hxJfWQDrt/b7VdwBNPPMv550/6Undl9ep13HXXA2zbtoP8/FaceWYxjz76uyOWWbkyyquvvs7ChU8D0LlzITfffA0jR55NQUF7pk37fapehmqcG4Bj92cVEPIxEs+LdgXWkgYtJ5XRTnaciPZBjyPs/6CXEf4aVeb7nu0Cwi7s/6SX2y5AKeAynXX++EIbJJ4XHYXON6LCoRNwju0iwiy0QYK2RlS4XGW7gDAL5WCr50WbA5uA9rZrUSpwAOjgOJHdtgsJo7C2SMajIaLCpTlwlu0iwiqsQ
XKu7QKUqsXXbBcQVmENEh3YUmF0jh4yX7vQBYnnRfsC/WzXoVQtOgBjbBcRRqELErQ1osJNuze10CBRqmEm2C4gjEK1+zc4enAn4NiuRaljqALaOE7Es11ImIStRTIUDREVbrlA3ZP2ZpmwBYkOZKl0oO/To4QtSKxOYKRUPWmQHCVsQTLcdgFK1YMGyVFCM9jqedGWwC7CF25K1aaH40TW2S4iLML0TzuQcNWj1PH0t11AmITpH9faNWuUagQ9+jpOmIIkYrsApRpAgySOBolSjaNBEkeDRKnG0SCJE6Yg6WO7AKUaoJdOKXBYKIIkmFqxi+06lGqAZkA720WERSiCBH9aRbFdhFINdJLtAsIiLEHS1nYBSjWCBklAg0SpxtMgCWiQKNV4GiQBDRKlGk+DJBCWIGljuwClGuFE2wWERViCRC/QrNKRHkcSCEuQVNsuQKlG0CAJhKUloEGSJNHotvmLFpXFduz4bCj6xm9SeXnNDtx553/YLiMUNEgyXk7O4MFDzty1a1f58uXLdx44cGCE7YoyxcGD+ratoV2bDGeMf8Rw69ati8aOHTti4MCBS3JyclbaritDHLRdQFhoiyTDxWJHzqVZWFg4vKCgILZmzZrXKyoqIkBnS6VlAg2SQFhaJPtsF5CpjDFfOodJRHJ69eo1rqSkpE1hYeEi4AsLpWWCA7YLCIuwBMk22wVkquNN7t2sWTNn4MCB7pgxY/bm5+cvRluGDaUfgIGwdG222i4gU8VidZ9V3aJFi4Lhw4cX7N69O7p8+fLP9u/fr1eSq5/1tgsIC22RZLjaujbHkp+fHxkzZszIQYMGLc3Jyfl3MuvKEBW2CwiLsLRIduA3q/U4hyZWs9emIQoKCk7p0KGDWbt27RurV6/uTYomnfr888+ZPXs269evp1mzZgwcOJDJkydz8OBBnnrqKdavX0+/fv244IILyMnxPwOff/55+vbty8CBA1NRYjyDBskhoWiROE7EANtt15GJjDGN+huLiPTs2bO4pKSkfceOHRfhX7wsqWbPnk3Lli255ZZbuPbaa1mzZg1lZWW8++67dOrUidtuu43KykpWrFgBwLp169i9e7eNEAHYUlpaqmMkgVAESWCL7QIyUUO6NrVp1qzZCSeffLI7duzYA61bt14MVDVRaV9SWVnJoEGDyMvLIz8/n759+7Jt2zYqKyvp3bs3ubm59OjRg88//5xYLMacOXM4++yzk1VOXVbb2nAYhSlIPrFdQCYypmn+xs2bN+9w6qmnjh8xYsS6Fi1avNMU6zza6NGjWb58OQcOHGDXrl2Ul5fTt29fCgsLWbVqFQcPHmTt2rUUFhby9ttvU1RURPv27ZNRSn1U2NpwGIVljARAB/eSoLFdm2Np1apV7zFjxvTevn37+ytWrGheXV3dZP2Knj17smTJEu655x6MMQwdOpQBAwZQVVXFSy+9xNSpUykqKqJjx47Mnz+fK664ghdeeIFt27bRs2dPJkyY0FSl1Ie2SOKEKUhW2C4gEzVVi+RoHTp0GDZu3Dizbt26f61evbqHMaZbIuuLxWI8/vjjDB8+nKuuuooDBw7w3HPPMW/ePCZNmsT5559/aNlZs2YxYcIEPvzwQ4wxXHnllUyfPp3y8nKKiooSfm31VJGqDaWDMHVttEWSHEnbEyYi0qNHj7ElJSUFnTp1WgTsbOy69u7dy86dOxk1ahS5ubk4jsOwYcMoLy8/Yrny8nKMMRQVFbF161a6dOmCiNClSxe2bEnpMJu2SOKELUiOfRimahRjTNJ3qefk5LQYMGCAO3bs2Oo2bdosphHnoLRs2ZK2bdtSVlZGdXU1e/fu5YMPPqBjx46Hljl48CCvvPIKkydPBqBt27ZUVFRQVVXF2rVradcupZeZqUjlxsJOjncIdap5XrQC6Gm7jkyyZMmGj2Mxk9L9o3v27KlYtmzZ5n379o1uyPM2bdrEnDlz2LJlCyJC7969Oeecc2jVqhUA8+fPp0WLF
hQXFwOwb98+Zs2axYYNGygqKmLKlCmHji9JsgNAfmlpqZ5rEwhbkDwFfNN2HZlkyZINK2Mx09/Gtj/77LMPP/roo2bV1dWDbGw/id4sLS0da7uIMAlT1wbgddsFZJpUdG2OpX379kNKSkoGRSKRN0Vkna06kiCt3qci8pKIXJ7MbWiQZD7rpx107959TElJScfOnTsvAipt19MEXqtrARGpEJGtItIy7r7vi8jCZBYmIneJyOPx9xljzjbGTEvmdsMWJO+jc2M0tVDs4s/JyWnev39/t7i42LRt23YR6TuXhwHeqOeyzYAbk1hLaIQqSBwnUg28ZbuOTGJMOIKkRl5eXrthw4a5o0aN2nziiSe+abueRvi4tLT0s3ouez9wq4i0PfoBERkgIvNE5DMRWSkiF8Y9dpKIvCAiu0SkTET+U0Rej3v8IRFZFzy+RERKgvsnA3cCF4nIFyLyQXD/wqA11EJEKkXkK3HrKhCRvSJSGPx8noi8Hyz3LxEZUp8XGqogCWj3pmnl2S6gNo7j9DjttNPGDBkyZFlubu4y2/U0wKsNWPZdYCFwa/ydQXdnHjADKAQuBv5LRGr2rj0C7AE6AZcHt3hlwDCgfbCOp0TkBGPMHOBXwJPGmFbGmKHxTzLG7AeeBb4dd/eFwCJjzFYROQX4H+Aa/KsI/hl4XkRa1PVCwxgkL9suIMOEqkVytPbt2w8eN27c4KKiordEZI3teuphTgOX/xlwg4gUxN13HlBhjHnUGFNljFkKPAN8S0SaAd8ASo0xnjHmY+CI8Q1jzOPGmB3Bcx8AWgD13TM3Az+4alwS3AdwNfBnY8zbxpjqYFxlP1DnbvwwBslbwGbbRWSQUAdJja5du44uKSnp0rVr10VAfbsOqbYPv4VRb8aY5cCLwB1xd/cETgu6D5UiUgl8B78FUoD/N4vfy3XEHi8RuVVEVojIzuC5bYAO9SxpAeCIyGki0gu/ZfOPuLpuOaqu7tRjPprQBUkwN8nztuvIIKHs2tQmJycnr6ioyC0uLm7Wrl27RfifhmGyuLS0dG8jnlcK/ADoGvy8Dr870Tbu1soYcx3+bIFVQPy5S91rvgnGQ/43fpeknTGmLf6pCTXTRRz3wDBjTDUwC797823gRWPM7ri6fnlUXY4xZmZdLzB0QRL4p+0CMkjaBEmNvLy8NkOHDnVHjRq1zXGcfxGeUydeasyTjDGfAk8CPw7uehHoJyKXiUhecBspIicH/+jPAneJiCMiA4Dvxq0uHz9otgG5IvIzoHXc41uAXiJyvP/tGcBF+K2gGXH3TwWuDVorIiItReRcEcmv6zWGNUheBXbXuZQ6LmNMjPD+jevkOE63UaNGjR06dOjHubm5H1guJ8bhLkBj3A20BAhaAJPwxyo24nfl78Mf6wD4EX53ZTMwHZjJ4dbZXPxxmk+ANfjdrfiuz1PB1x0i8l5thRhj3sYfzO1CXDgaY97Fbzn9Afgc+BS4oj4vLlSHyMfzvOiT+M031UixmNm/ZMmGOkfc08XGjRvfKS8vLzDG9Law+bmlpaWTLWwXEbkP6GSMSerRqYkI86fV320XkO6MMRl1JbguXbqMKikp6d6tW7fF+BOGp9JfUrWh4BiTIUH3YhRwFYm1hpIuzEHyInqZioTEYpkVJAA5OTm5ffv2HT9u3Li89u3bLyI1F6naTGp3AOTjj5PswR9beQB4LoXbb7DQdm0APC/6W+Am23WkqwMHqrd98MGmgrqXTF979+7dsGzZsgrP88ZCwy+9UU/3lJaW3pmkdWeEMLdIwB9FVo1kjEnajO9hceKJJ3YdNWpU8bBhw/6dl5f3fhI2YdD3YZ1CHSSOE1kBLLJdR7rKhiCp0bZt25OLi4uH9e/fv0xEVjXhql8pLS3VaRXrEOogCfzRdgHpKhZL3jVowqpz584jS0pKenTv3v01mmaMLWWDrOksHYLkWWCt7SLSUXBwU9bJycnJjUQiJePGjTvhpJNOWgg05mhU8A/uC
vUgZ1iEPkgcJ3IQ+LXtOtJRLJY9XZva5Obm5g8ePPj00aNHV7Zs2fIN/IPKGuKx0tLSjNvzlQyhD5LAfwObbBeRbrK1RXK0E044ofPIkSOLTznllPK8vLxaj/asxUHgT8msK5OkRZA4TmQf8BvbdaQbY9AgidOmTZv+xcXFpw4YMODdnJycT+tY/K+lpaUVqagrE6RFkAT+BGy3XUQ6icVMQ5vyWaFTp04jSkpKevfo0eM1YGsti3jAL1JcVlpLmyBxnIgH/NZ2HelEuzbHJiLN+vTpUzJu3DinoKBgEX541Hi4tLRUu9INkDZBEngIWG+7iHSRaIvk2Wef5eqrr2bixIncc889h+6fN28ekydPPnQ766yzOP3001m5ciUAr7zyClOmTOGiiy5i6dKlh563YcMGrr/+eqqrw5Nvubm5rQYNGuSOHj16V6tWrV7Hn1TpPtt1pZu0mD2rhuNEPM+L3gE8XufCilgssfMfOnTowGWXXUZZWRn79x+eY2jixIlMnDjx0M8vvfQS06dPp1+/flRVVfGXv/yFqVOnsnLlSh566CEee+wxAB5++GGuv/56mjWzfoWMLznhhBM6jRgxopPneTedffbZn9uuJ92kW4sEx4k8AfzLdh3pINHB1vHjx1NSUkLr1q2Pu9zcuXOZNGkSIsKuXbvo0KEDJ510EsOHD2fTJr+HsHDhQjp06MDAgSm9emhDrXYcRw+AbIS0C5LAjYRn1qzQSsVg6+bNm/nwww8566yzAP/C3rt27WLr1q0sWbKEXr164Xke06dP5wc/+EGyy0nUba7rhm16x7SQVl2bGo4TedfzotOo5+xN2cqk4NTul19+mcGDB9O5c2cAcnJyuOmmmygtLaV58+bceuutPProo0yZMoVVq1Yxbdo08vLyuO666+jTp0+yy2uI2a7rPmO7iHSVlkESuAM4H//aHqoWiY6R1MfcuXO59NJLj7hv+PDhDB8+HIBPP/2UlStXcu2113LxxRfz8MMPs3XrVu6//37++MfQ9CJ2A9faLiKdpWvXBseJbMGf21IdQ7JbJMuWLWPHjh24rnus7fPQQw9xww03sHPnTmKxGJ06dWLAgAGsWtWUJ+gm7HbXdXVvYALSNkgAHCcyk8OT3aqjxGKJ5UhVVRX79+8nFosRi8XYv38/VVWHT9+ZO3cu48ePx3GcWp8/e/Zs+vXrR1FREa1bt2b//v1UVFSwdOnSQ12hEHgNPRQ+YenctanxQ2A80NF2IWETiyU2ID19+nSmTTt8kbd58+Zx+eWXc+WVV7J//34WLFjA3XffXetzKysrefrpp3nkkUcAyM3N5cYbb+Smm26iefPm3HHHHbU+L8X2Ad93XVcH7hMU6qkW68vzol9DL6r1JatWfbZwxw7vdNt1hNg1ruvqfCNNIK27NjUcJ/IC/sWPVZxM+JBIopkaIk0nI4Ik8CNgaZ1LZZFEx0gyWDlwje0iMknGBInjRPYCU0j99U5CSxsktdoPXOi6rl7JsQllTJAAOE6kAv8yiOE5K8wiY0yyLs+Qzm5wXfd920VkmowKEgDHibwC6DVIgFhMg+Qov3VdVy8tkQQZFyQAjhP5NXrJT+3aHOkfwG22i8hUGRkkgcuBV20XYZN2bQ4pAy51XVdnjEuSjA0Sx4kcAL6O/ybKSsaYjP37NsBa4HzXdb06l1SNltFvNMeJfAGcA/zbdi02GJO0a+Gmi03AV13X3Wy7kEyX0UEC4DiR7cAkYJ3tWlIty1skm4EzXNctt11INsiKN5rjRNYBE4ENtmtJJWOy4+9bi63ABNd1V9ouJFtkzRvNcSIrgXFA1HYtqZKlLZLt+N2Zj20Xkk2y6o0WHLA2DlhuuZSUyMIWyXr87swy24Vkm2x7o+E4kc2AC7xtu5ZkM4bwTdeePMuBMa7rZsWHRNhkXZAAOE7kM+CrwDzbtSRX1nRtFgLjdJYze7LljfYlcbuGH7JdS7JkSYvk78BZruvutF1INsvaIAFwn
EiV40R+gj8bfSZehiCTgyQG/F/gEtd1D9guJttlwlSLCXOcyDTPi67APx+ji+16mooxJlP/vtuBb7uu+4rtQpQvq1sk8Rwn8g4wHHjDdi1NKBOD5G3gVA2RcNEgiRO3R+cuMmBOkwwbIzHAw8B413Wz7ijlsMuIyZ+TwfOiY4DpQMR2LY1VVrZ+M9DJdh1NYA1wleu6WX02d5hpi+QYHCfyJjAUeIT0vc5wJnRt/gIM1hAJN22R1IPnRc/AD5STbdfSEGVl63cCbWzX0Ujr8FshGX6sT2bQFkk9OE5kATAEuBnYZbmchkjHFskB4F5goIZI+tAWSQN5XrQjcB/wXQj3fB9lZesPAnm262iAF4Gb9dT/9KNB0kjBYOxvgLG2azmWsrK0OWL8feAW13Xn2y5ENY52bRrJcSJvOk6kGP+cndds13M0Y0xV3UtZtxT/WkSnpnOIiMhCEfm+7TpsSsc+dKg4TuRV4FXPi54OlAKnWy0oYIw5SHj/vm8Dv3Bdd3Z9FhaRCsABehtj9gT3fR+41BhzeiKFiIgBiowxnyaynmynLZIm4jiRhY4TOQP/gLZnAastgliMgza3XwsDzAUmua47ur4hEqcZcGPTl3V8IhLWMA4VDZIm5jiRxY4T+QbQE7+FYmWgIkRdm234g9MR13UnJ7An5n7gVhFpe/QDIjJAROaJyGcislJELox77Ihuh4hcISKvB98vDu7+QES+EJGLROR0EVkvIreLyGbgURFpJyIvisg2Efk8+L5bI19HRtIgSRLHiWx0nMjdQC/gfwEvkcJWijFWW0TVwHzgEqCb67p3uK67OsF1vos/78it8XeKSEv8eWVmAIX4l2z9LxEZWNcKjTHjg2+HGmNaGWOeDH7uBLTH/zC4Gv//5NHg5x7AXuAPCb6ejKLNtiRznEg18DzwvOdFTwLOB76BPxl182RtNxgjSaVq/H/0p4FnXdfdmoRt/Ax4Q0Ti55A5D6gwxjwa/LxURJ4BvgX8vJHbiQGlxpiaqSX2As/UPCgivwQWNHLdGUmDJIUcJ7ID/5PtUc+LtgbOxQ+VM4F2TbmtWCwlXZtKYDH+8R//cF13ezI3ZoxZLiIvAncAK4K7ewKniUhl3KK5+OdJNdY2Y8y+mh9ExAEeBCZz+O+ULyLNjDFpf3JnU9AgscRxIruAmcBMz4vmAIPxB2pdYDzQIZH1J+kNvgd/V/cC/K7LexYug1kKvAc8EPy8DlhkjJl4jOX34O/xqVGfkxiPPrjqFqA/cJoxZrOIDMPfdR3qAxJTSYMkBBwnEgM+CG6/97yo4J/XMwIYBHwl+NqDer55jUl4GoRtQT3vx339t+u6VgdxjTGfisiTwI+BZfitoXtF5DIOXzh+GPCFMWYFft1TROSv+JNWXQVsiVvlFqAPcLzdv/n43ZtKEWmPH2YqjgZJCDlOxAAfB7dDPC/aChgIFAGd8T9d428dgZbACcfo2hwEvoi77QI24n+qrw1u64CKkF/m8m7gMgBjzG4RmQT8Nrjl4AffzcGyDwIj8QPjQ+AJ/IMIa9wFTBORE/EHVmsb2/kd/mDudvzf1wP415VWAT1EPkNt3Li8eXn5jjz8fywB9uncpipZNEiUUgnT40iUUgnTIFFKJUyDRCmVMA0SpVTCNEiUUgnTIFFKJUyDRCmVMA0SpVTCNEiUUgnTIFFKJUyDRCmVMA0SpVTCNEiUUgnTIFFKJUyDRCmVMA0SpVTCNEiUUgnTIFFKJUyDRCmVMA0SpVTCNEiUUgnTIFFKJUyDRCmVMA0SpVTCNEiUUgnTIFFKJUyDRCmVsP8PRL9kiyM9rb8AAAAASUVORK5CYII=\n" }, "metadata": {} } ] }, { "cell_type": "code", "source": [ "# save data frame to csv\n", "rt.to_csv(\"sentiment.csv\")" ], "metadata": { "id": 
"Ws3dPGaEE1RB" }, "execution_count": 26, "outputs": [] } ] }